{"current_steps": 1, "total_steps": 9627, "loss": 2.4557, "learning_rate": 9.9999997337695e-05, "epoch": 0.00010387451958034694, "percentage": 0.01, "elapsed_time": "0:00:22", "remaining_time": "2 days, 13:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 9627, "loss": 2.1366, "learning_rate": 9.999998935078033e-05, "epoch": 0.00020774903916069389, "percentage": 0.02, "elapsed_time": "0:00:44", "remaining_time": "2 days, 11:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 9627, "loss": 1.9955, "learning_rate": 9.999997603925677e-05, "epoch": 0.0003116235587410408, "percentage": 0.03, "elapsed_time": "0:01:07", "remaining_time": "2 days, 11:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 9627, "loss": 2.1548, "learning_rate": 9.99999574031258e-05, "epoch": 0.00041549807832138777, "percentage": 0.04, "elapsed_time": "0:01:34", "remaining_time": "2 days, 15:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 9627, "loss": 2.0443, "learning_rate": 9.999993344238936e-05, "epoch": 0.0005193725979017347, "percentage": 0.05, "elapsed_time": "0:01:59", "remaining_time": "2 days, 15:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 9627, "loss": 2.0479, "learning_rate": 9.999990415705005e-05, "epoch": 0.0006232471174820816, "percentage": 0.06, "elapsed_time": "0:02:24", "remaining_time": "2 days, 16:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 9627, "loss": 2.0064, "learning_rate": 9.999986954711094e-05, "epoch": 0.0007271216370624286, "percentage": 0.07, "elapsed_time": "0:02:49", "remaining_time": "2 days, 16:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 9627, "loss": 1.8892, "learning_rate": 9.999982961257574e-05, "epoch": 0.0008309961566427755, "percentage": 0.08, "elapsed_time": "0:03:15", "remaining_time": "2 days, 17:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 9627, "loss": 1.9309, "learning_rate": 9.999978435344872e-05, "epoch": 0.0009348706762231225, "percentage": 0.09, "elapsed_time": "0:03:41", "remaining_time": "2 days, 17:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 9627, "loss": 1.6737, "learning_rate": 9.999973376973466e-05, "epoch": 0.0010387451958034693, "percentage": 0.1, "elapsed_time": "0:04:06", "remaining_time": "2 days, 17:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 9627, "loss": 1.8743, "learning_rate": 9.999967786143895e-05, "epoch": 0.0011426197153838163, "percentage": 0.11, "elapsed_time": "0:04:32", "remaining_time": "2 days, 18:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 9627, "loss": 1.8595, "learning_rate": 9.99996166285676e-05, "epoch": 0.0012464942349641633, "percentage": 0.12, "elapsed_time": "0:04:58", "remaining_time": "2 days, 18:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 9627, "loss": 1.8856, "learning_rate": 9.999955007112706e-05, "epoch": 0.0013503687545445102, "percentage": 0.14, "elapsed_time": "0:05:24", "remaining_time": "2 days, 18:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 9627, "loss": 2.0519, "learning_rate": 9.999947818912448e-05, "epoch": 0.0014542432741248572, "percentage": 0.15, "elapsed_time": "0:05:50", "remaining_time": "2 days, 18:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 9627, "loss": 1.8855, "learning_rate": 9.999940098256747e-05, "epoch": 0.0015581177937052041, "percentage": 0.16, "elapsed_time": "0:06:15", "remaining_time": "2 days, 18:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 9627, "loss": 2.0608, "learning_rate": 9.999931845146424e-05, "epoch": 0.001661992313285551, "percentage": 0.17, "elapsed_time": "0:06:41", "remaining_time": "2 days, 19:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 9627, "loss": 2.2282, "learning_rate": 9.999923059582363e-05, "epoch": 0.001765866832865898, "percentage": 0.18, "elapsed_time": "0:07:07", "remaining_time": "2 days, 19:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 9627, "loss": 2.0698, "learning_rate": 9.999913741565496e-05, "epoch": 0.001869741352446245, "percentage": 0.19, "elapsed_time": "0:07:33", "remaining_time": "2 days, 19:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 9627, "loss": 2.0232, "learning_rate": 9.999903891096817e-05, "epoch": 0.0019736158720265917, "percentage": 0.2, "elapsed_time": "0:07:58", "remaining_time": "2 days, 19:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 9627, "loss": 1.8005, "learning_rate": 9.999893508177373e-05, "epoch": 0.0020774903916069387, "percentage": 0.21, "elapsed_time": "0:08:24", "remaining_time": "2 days, 19:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 9627, "loss": 1.8358, "learning_rate": 9.999882592808274e-05, "epoch": 0.0021813649111872857, "percentage": 0.22, "elapsed_time": "0:08:50", "remaining_time": "2 days, 19:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 9627, "loss": 1.8202, "learning_rate": 9.999871144990677e-05, "epoch": 0.0022852394307676326, "percentage": 0.23, "elapsed_time": "0:09:16", "remaining_time": "2 days, 19:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 9627, "loss": 1.9011, "learning_rate": 9.999859164725804e-05, "epoch": 0.0023891139503479796, "percentage": 0.24, "elapsed_time": "0:09:41", "remaining_time": "2 days, 19:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 9627, "loss": 1.8046, "learning_rate": 9.999846652014931e-05, "epoch": 0.0024929884699283265, "percentage": 0.25, "elapsed_time": "0:10:08", "remaining_time": "2 days, 19:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 9627, "loss": 1.7041, "learning_rate": 9.99983360685939e-05, "epoch": 0.0025968629895086735, "percentage": 0.26, "elapsed_time": "0:10:33", "remaining_time": "2 days, 19:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 9627, "loss": 1.8635, "learning_rate": 9.999820029260569e-05, "epoch": 0.0027007375090890204, "percentage": 0.27, "elapsed_time": "0:10:59", "remaining_time": "2 days, 19:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 9627, "loss": 2.025, "learning_rate": 9.999805919219916e-05, "epoch": 0.0028046120286693674, "percentage": 0.28, "elapsed_time": "0:11:25", "remaining_time": "2 days, 19:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 9627, "loss": 1.9266, "learning_rate": 9.999791276738933e-05, "epoch": 0.0029084865482497143, "percentage": 0.29, "elapsed_time": "0:11:51", "remaining_time": "2 days, 19:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 9627, "loss": 1.923, "learning_rate": 9.999776101819177e-05, "epoch": 0.0030123610678300613, "percentage": 0.3, "elapsed_time": "0:12:17", "remaining_time": "2 days, 19:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 9627, "loss": 1.876, "learning_rate": 9.999760394462268e-05, "epoch": 0.0031162355874104083, "percentage": 0.31, "elapsed_time": "0:12:43", "remaining_time": "2 days, 19:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 9627, "loss": 2.0935, "learning_rate": 9.999744154669874e-05, "epoch": 0.0032201101069907552, "percentage": 0.32, "elapsed_time": "0:13:08", "remaining_time": "2 days, 19:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 9627, "loss": 1.7944, "learning_rate": 9.999727382443728e-05, "epoch": 0.003323984626571102, "percentage": 0.33, "elapsed_time": "0:13:35", "remaining_time": "2 days, 19:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 9627, "loss": 2.0774, "learning_rate": 9.999710077785616e-05, "epoch": 0.003427859146151449, "percentage": 0.34, "elapsed_time": "0:14:00", "remaining_time": "2 days, 19:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 9627, "loss": 1.7769, "learning_rate": 9.99969224069738e-05, "epoch": 0.003531733665731796, "percentage": 0.35, "elapsed_time": "0:14:27", "remaining_time": "2 days, 19:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 9627, "loss": 1.9222, "learning_rate": 9.99967387118092e-05, "epoch": 0.003635608185312143, "percentage": 0.36, "elapsed_time": "0:14:52", "remaining_time": "2 days, 19:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 9627, "loss": 2.0162, "learning_rate": 9.99965496923819e-05, "epoch": 0.00373948270489249, "percentage": 0.37, "elapsed_time": "0:15:17", "remaining_time": "2 days, 19:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 9627, "loss": 2.0374, "learning_rate": 9.999635534871205e-05, "epoch": 0.003843357224472837, "percentage": 0.38, "elapsed_time": "0:15:44", "remaining_time": "2 days, 19:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 9627, "loss": 1.7788, "learning_rate": 9.999615568082036e-05, "epoch": 0.0039472317440531835, "percentage": 0.39, "elapsed_time": "0:16:10", "remaining_time": "2 days, 20:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 9627, "loss": 1.6986, "learning_rate": 9.999595068872805e-05, "epoch": 0.0040511062636335304, "percentage": 0.41, "elapsed_time": "0:16:35", "remaining_time": "2 days, 19:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 9627, "loss": 1.9754, "learning_rate": 9.9995740372457e-05, "epoch": 0.004154980783213877, "percentage": 0.42, "elapsed_time": "0:17:01", "remaining_time": "2 days, 20:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 9627, "loss": 1.699, "learning_rate": 9.999552473202955e-05, "epoch": 0.004258855302794224, "percentage": 0.43, "elapsed_time": "0:17:27", "remaining_time": "2 days, 20:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 9627, "loss": 2.1077, "learning_rate": 9.999530376746873e-05, "epoch": 0.004362729822374571, "percentage": 0.44, "elapsed_time": "0:17:52", "remaining_time": "2 days, 20:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 9627, "loss": 1.9693, "learning_rate": 9.999507747879802e-05, "epoch": 0.004466604341954918, "percentage": 0.45, "elapsed_time": "0:18:20", "remaining_time": "2 days, 20:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 9627, "loss": 1.9005, "learning_rate": 9.999484586604154e-05, "epoch": 0.004570478861535265, "percentage": 0.46, "elapsed_time": "0:18:44", "remaining_time": "2 days, 20:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 9627, "loss": 1.8829, "learning_rate": 9.999460892922394e-05, "epoch": 0.004674353381115612, "percentage": 0.47, "elapsed_time": "0:19:11", "remaining_time": "2 days, 20:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 9627, "loss": 1.9172, "learning_rate": 9.999436666837048e-05, "epoch": 0.004778227900695959, "percentage": 0.48, "elapsed_time": "0:19:36", "remaining_time": "2 days, 20:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 9627, "loss": 1.8282, "learning_rate": 9.999411908350692e-05, "epoch": 0.004882102420276306, "percentage": 0.49, "elapsed_time": "0:20:03", "remaining_time": "2 days, 20:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 9627, "loss": 1.8652, "learning_rate": 9.999386617465966e-05, "epoch": 0.004985976939856653, "percentage": 0.5, "elapsed_time": "0:20:28", "remaining_time": "2 days, 20:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 9627, "loss": 1.9479, "learning_rate": 9.999360794185562e-05, "epoch": 0.005089851459437, "percentage": 0.51, "elapsed_time": "0:20:55", "remaining_time": "2 days, 20:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 9627, "loss": 1.8856, "learning_rate": 9.999334438512228e-05, "epoch": 0.005193725979017347, "percentage": 0.52, "elapsed_time": "0:21:20", "remaining_time": "2 days, 20:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 9627, "loss": 2.26, "learning_rate": 9.999307550448776e-05, "epoch": 0.005297600498597694, "percentage": 0.53, "elapsed_time": "0:21:46", "remaining_time": "2 days, 20:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 9627, "loss": 1.9131, "learning_rate": 9.999280129998063e-05, "epoch": 0.005401475018178041, "percentage": 0.54, "elapsed_time": "0:22:12", "remaining_time": "2 days, 20:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 9627, "loss": 1.7429, "learning_rate": 9.999252177163013e-05, "epoch": 0.005505349537758388, "percentage": 0.55, "elapsed_time": "0:22:38", "remaining_time": "2 days, 20:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 9627, "loss": 1.8882, "learning_rate": 9.999223691946602e-05, "epoch": 0.005609224057338735, "percentage": 0.56, "elapsed_time": "0:23:04", "remaining_time": "2 days, 20:11:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 9627, "loss": 2.2768, "learning_rate": 9.999194674351864e-05, "epoch": 0.005713098576919082, "percentage": 0.57, "elapsed_time": "0:23:30", "remaining_time": "2 days, 20:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 9627, "loss": 1.7684, "learning_rate": 9.999165124381887e-05, "epoch": 0.005816973096499429, "percentage": 0.58, "elapsed_time": "0:23:56", "remaining_time": "2 days, 20:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 9627, "loss": 1.8547, "learning_rate": 9.99913504203982e-05, "epoch": 0.005920847616079776, "percentage": 0.59, "elapsed_time": "0:24:22", "remaining_time": "2 days, 20:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 9627, "loss": 1.9773, "learning_rate": 9.999104427328865e-05, "epoch": 0.006024722135660123, "percentage": 0.6, "elapsed_time": "0:24:48", "remaining_time": "2 days, 20:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 9627, "loss": 1.9732, "learning_rate": 9.999073280252283e-05, "epoch": 0.0061285966552404696, "percentage": 0.61, "elapsed_time": "0:25:15", "remaining_time": "2 days, 20:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 9627, "loss": 1.9285, "learning_rate": 9.999041600813393e-05, "epoch": 0.0062324711748208165, "percentage": 0.62, "elapsed_time": "0:25:40", "remaining_time": "2 days, 20:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 9627, "loss": 1.9619, "learning_rate": 9.999009389015564e-05, "epoch": 0.0063363456944011635, "percentage": 0.63, "elapsed_time": "0:26:05", "remaining_time": "2 days, 20:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 9627, "loss": 2.0373, "learning_rate": 9.99897664486223e-05, "epoch": 0.0064402202139815104, "percentage": 0.64, "elapsed_time": "0:26:31", "remaining_time": "2 days, 20:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 9627, "loss": 1.8389, "learning_rate": 9.998943368356877e-05, "epoch": 0.006544094733561857, "percentage": 0.65, "elapsed_time": "0:26:58", "remaining_time": "2 days, 20:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 9627, "loss": 2.0334, "learning_rate": 9.998909559503048e-05, "epoch": 0.006647969253142204, "percentage": 0.66, "elapsed_time": "0:27:24", "remaining_time": "2 days, 20:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 9627, "loss": 2.0735, "learning_rate": 9.998875218304345e-05, "epoch": 0.006751843772722551, "percentage": 0.68, "elapsed_time": "0:27:50", "remaining_time": "2 days, 20:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 9627, "loss": 1.7135, "learning_rate": 9.998840344764422e-05, "epoch": 0.006855718292302898, "percentage": 0.69, "elapsed_time": "0:28:15", "remaining_time": "2 days, 20:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 9627, "loss": 1.9234, "learning_rate": 9.998804938886997e-05, "epoch": 0.006959592811883245, "percentage": 0.7, "elapsed_time": "0:28:43", "remaining_time": "2 days, 20:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 9627, "loss": 1.6909, "learning_rate": 9.998769000675836e-05, "epoch": 0.007063467331463592, "percentage": 0.71, "elapsed_time": "0:29:09", "remaining_time": "2 days, 20:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 9627, "loss": 1.7841, "learning_rate": 9.99873253013477e-05, "epoch": 0.007167341851043939, "percentage": 0.72, "elapsed_time": "0:29:35", "remaining_time": "2 days, 20:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 9627, "loss": 1.8755, "learning_rate": 9.998695527267681e-05, "epoch": 0.007271216370624286, "percentage": 0.73, "elapsed_time": "0:30:00", "remaining_time": "2 days, 20:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 9627, "loss": 1.8373, "learning_rate": 9.998657992078509e-05, "epoch": 0.007375090890204633, "percentage": 0.74, "elapsed_time": "0:30:27", "remaining_time": "2 days, 20:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 9627, "loss": 2.0858, "learning_rate": 9.998619924571251e-05, "epoch": 0.00747896540978498, "percentage": 0.75, "elapsed_time": "0:30:53", "remaining_time": "2 days, 20:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 9627, "loss": 1.7906, "learning_rate": 9.998581324749964e-05, "epoch": 0.007582839929365327, "percentage": 0.76, "elapsed_time": "0:31:19", "remaining_time": "2 days, 20:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 9627, "loss": 1.8037, "learning_rate": 9.998542192618755e-05, "epoch": 0.007686714448945674, "percentage": 0.77, "elapsed_time": "0:31:45", "remaining_time": "2 days, 20:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 9627, "loss": 1.6548, "learning_rate": 9.998502528181793e-05, "epoch": 0.007790588968526021, "percentage": 0.78, "elapsed_time": "0:32:11", "remaining_time": "2 days, 20:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 9627, "loss": 2.0898, "learning_rate": 9.998462331443301e-05, "epoch": 0.007894463488106367, "percentage": 0.79, "elapsed_time": "0:32:38", "remaining_time": "2 days, 20:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 9627, "loss": 1.9709, "learning_rate": 9.99842160240756e-05, "epoch": 0.007998338007686715, "percentage": 0.8, "elapsed_time": "0:33:03", "remaining_time": "2 days, 20:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 9627, "loss": 1.6921, "learning_rate": 9.998380341078909e-05, "epoch": 0.008102212527267061, "percentage": 0.81, "elapsed_time": "0:33:30", "remaining_time": "2 days, 20:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 9627, "loss": 1.8009, "learning_rate": 9.99833854746174e-05, "epoch": 0.008206087046847409, "percentage": 0.82, "elapsed_time": "0:33:56", "remaining_time": "2 days, 20:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 9627, "loss": 1.9141, "learning_rate": 9.998296221560504e-05, "epoch": 0.008309961566427755, "percentage": 0.83, "elapsed_time": "0:34:22", "remaining_time": "2 days, 20:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 9627, "loss": 1.8365, "learning_rate": 9.998253363379708e-05, "epoch": 0.008413836086008103, "percentage": 0.84, "elapsed_time": "0:34:49", "remaining_time": "2 days, 20:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 9627, "loss": 2.0948, "learning_rate": 9.998209972923918e-05, "epoch": 0.008517710605588449, "percentage": 0.85, "elapsed_time": "0:35:14", "remaining_time": "2 days, 20:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 9627, "loss": 1.8404, "learning_rate": 9.998166050197751e-05, "epoch": 0.008621585125168797, "percentage": 0.86, "elapsed_time": "0:35:41", "remaining_time": "2 days, 20:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 9627, "loss": 1.8201, "learning_rate": 9.998121595205889e-05, "epoch": 0.008725459644749143, "percentage": 0.87, "elapsed_time": "0:36:07", "remaining_time": "2 days, 20:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 9627, "loss": 1.9134, "learning_rate": 9.998076607953064e-05, "epoch": 0.00882933416432949, "percentage": 0.88, "elapsed_time": "0:36:34", "remaining_time": "2 days, 20:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 9627, "loss": 1.9558, "learning_rate": 9.998031088444067e-05, "epoch": 0.008933208683909837, "percentage": 0.89, "elapsed_time": "0:36:59", "remaining_time": "2 days, 20:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 9627, "loss": 2.045, "learning_rate": 9.997985036683744e-05, "epoch": 0.009037083203490184, "percentage": 0.9, "elapsed_time": "0:37:25", "remaining_time": "2 days, 20:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 9627, "loss": 1.7929, "learning_rate": 9.997938452677e-05, "epoch": 0.00914095772307053, "percentage": 0.91, "elapsed_time": "0:37:51", "remaining_time": "2 days, 20:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 9627, "loss": 1.8742, "learning_rate": 9.997891336428797e-05, "epoch": 0.009244832242650878, "percentage": 0.92, "elapsed_time": "0:38:17", "remaining_time": "2 days, 20:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 9627, "loss": 1.9634, "learning_rate": 9.997843687944152e-05, "epoch": 0.009348706762231224, "percentage": 0.93, "elapsed_time": "0:38:44", "remaining_time": "2 days, 20:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 9627, "loss": 1.8137, "learning_rate": 9.997795507228139e-05, "epoch": 0.009452581281811572, "percentage": 0.95, "elapsed_time": "0:39:10", "remaining_time": "2 days, 20:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 9627, "loss": 1.9342, "learning_rate": 9.997746794285887e-05, "epoch": 0.009556455801391918, "percentage": 0.96, "elapsed_time": "0:39:37", "remaining_time": "2 days, 20:26:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 9627, "loss": 1.8772, "learning_rate": 9.997697549122586e-05, "epoch": 0.009660330320972266, "percentage": 0.97, "elapsed_time": "0:40:02", "remaining_time": "2 days, 20:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 9627, "loss": 1.8048, "learning_rate": 9.997647771743482e-05, "epoch": 0.009764204840552612, "percentage": 0.98, "elapsed_time": "0:40:29", "remaining_time": "2 days, 20:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 9627, "loss": 1.8228, "learning_rate": 9.997597462153871e-05, "epoch": 0.00986807936013296, "percentage": 0.99, "elapsed_time": "0:40:55", "remaining_time": "2 days, 20:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 9627, "loss": 1.8203, "learning_rate": 9.997546620359114e-05, "epoch": 0.009971953879713306, "percentage": 1.0, "elapsed_time": "0:41:22", "remaining_time": "2 days, 20:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 9627, "loss": 1.7667, "learning_rate": 9.997495246364624e-05, "epoch": 0.010075828399293654, "percentage": 1.01, "elapsed_time": "0:41:47", "remaining_time": "2 days, 20:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 9627, "loss": 1.7176, "learning_rate": 9.997443340175872e-05, "epoch": 0.010179702918874, "percentage": 1.02, "elapsed_time": "0:42:14", "remaining_time": "2 days, 20:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 9627, "loss": 1.7196, "learning_rate": 9.997390901798386e-05, "epoch": 0.010283577438454348, "percentage": 1.03, "elapsed_time": "0:42:39", "remaining_time": "2 days, 20:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 9627, "loss": 1.6993, "learning_rate": 9.997337931237751e-05, "epoch": 0.010387451958034694, "percentage": 1.04, "elapsed_time": "0:43:06", "remaining_time": "2 days, 20:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 9627, "loss": 1.9082, "learning_rate": 9.997284428499605e-05, "epoch": 0.010491326477615042, "percentage": 1.05, "elapsed_time": "0:43:32", "remaining_time": "2 days, 20:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 9627, "loss": 1.8484, "learning_rate": 9.99723039358965e-05, "epoch": 0.010595200997195388, "percentage": 1.06, "elapsed_time": "0:43:58", "remaining_time": "2 days, 20:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 9627, "loss": 2.0352, "learning_rate": 9.997175826513637e-05, "epoch": 0.010699075516775736, "percentage": 1.07, "elapsed_time": "0:44:24", "remaining_time": "2 days, 20:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 9627, "loss": 2.1032, "learning_rate": 9.997120727277378e-05, "epoch": 0.010802950036356082, "percentage": 1.08, "elapsed_time": "0:44:50", "remaining_time": "2 days, 20:26:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 9627, "loss": 1.7161, "learning_rate": 9.997065095886741e-05, "epoch": 0.01090682455593643, "percentage": 1.09, "elapsed_time": "0:45:17", "remaining_time": "2 days, 20:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 9627, "loss": 1.8586, "learning_rate": 9.997008932347649e-05, "epoch": 0.011010699075516776, "percentage": 1.1, "elapsed_time": "0:45:43", "remaining_time": "2 days, 20:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 9627, "loss": 1.8134, "learning_rate": 9.996952236666084e-05, "epoch": 0.011114573595097123, "percentage": 1.11, "elapsed_time": "0:46:08", "remaining_time": "2 days, 20:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 9627, "loss": 1.9237, "learning_rate": 9.996895008848085e-05, "epoch": 0.01121844811467747, "percentage": 1.12, "elapsed_time": "0:46:35", "remaining_time": "2 days, 20:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 9627, "loss": 1.8897, "learning_rate": 9.996837248899741e-05, "epoch": 0.011322322634257817, "percentage": 1.13, "elapsed_time": "0:47:01", "remaining_time": "2 days, 20:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 9627, "loss": 1.9856, "learning_rate": 9.99677895682721e-05, "epoch": 0.011426197153838163, "percentage": 1.14, "elapsed_time": "0:47:28", "remaining_time": "2 days, 20:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 9627, "loss": 1.6574, "learning_rate": 9.996720132636697e-05, "epoch": 0.011530071673418511, "percentage": 1.15, "elapsed_time": "0:47:54", "remaining_time": "2 days, 20:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 9627, "loss": 1.7604, "learning_rate": 9.996660776334464e-05, "epoch": 0.011633946192998857, "percentage": 1.16, "elapsed_time": "0:48:20", "remaining_time": "2 days, 20:27:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 9627, "loss": 1.766, "learning_rate": 9.996600887926834e-05, "epoch": 0.011737820712579203, "percentage": 1.17, "elapsed_time": "0:48:46", "remaining_time": "2 days, 20:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 9627, "loss": 1.7565, "learning_rate": 9.996540467420186e-05, "epoch": 0.011841695232159551, "percentage": 1.18, "elapsed_time": "0:49:13", "remaining_time": "2 days, 20:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 9627, "loss": 1.8874, "learning_rate": 9.996479514820952e-05, "epoch": 0.011945569751739897, "percentage": 1.19, "elapsed_time": "0:49:40", "remaining_time": "2 days, 20:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 9627, "loss": 2.0761, "learning_rate": 9.996418030135622e-05, "epoch": 0.012049444271320245, "percentage": 1.2, "elapsed_time": "0:50:05", "remaining_time": "2 days, 20:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 9627, "loss": 2.0269, "learning_rate": 9.996356013370747e-05, "epoch": 0.012153318790900591, "percentage": 1.22, "elapsed_time": "0:50:32", "remaining_time": "2 days, 20:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 9627, "loss": 1.7982, "learning_rate": 9.99629346453293e-05, "epoch": 0.012257193310480939, "percentage": 1.23, "elapsed_time": "0:50:57", "remaining_time": "2 days, 20:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 9627, "loss": 1.9449, "learning_rate": 9.996230383628831e-05, "epoch": 0.012361067830061285, "percentage": 1.24, "elapsed_time": "0:51:25", "remaining_time": "2 days, 20:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 9627, "loss": 1.9453, "learning_rate": 9.996166770665167e-05, "epoch": 0.012464942349641633, "percentage": 1.25, "elapsed_time": "0:51:51", "remaining_time": "2 days, 20:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 9627, "loss": 1.7562, "learning_rate": 9.996102625648715e-05, "epoch": 0.012568816869221979, "percentage": 1.26, "elapsed_time": "0:52:17", "remaining_time": "2 days, 20:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 9627, "loss": 1.9439, "learning_rate": 9.996037948586305e-05, "epoch": 0.012672691388802327, "percentage": 1.27, "elapsed_time": "0:52:43", "remaining_time": "2 days, 20:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 9627, "loss": 1.7729, "learning_rate": 9.995972739484822e-05, "epoch": 0.012776565908382673, "percentage": 1.28, "elapsed_time": "0:53:09", "remaining_time": "2 days, 20:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 9627, "loss": 2.246, "learning_rate": 9.995906998351215e-05, "epoch": 0.012880440427963021, "percentage": 1.29, "elapsed_time": "0:53:36", "remaining_time": "2 days, 20:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 9627, "loss": 1.9098, "learning_rate": 9.99584072519248e-05, "epoch": 0.012984314947543367, "percentage": 1.3, "elapsed_time": "0:54:02", "remaining_time": "2 days, 20:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 9627, "loss": 1.7569, "learning_rate": 9.995773920015679e-05, "epoch": 0.013088189467123715, "percentage": 1.31, "elapsed_time": "0:54:28", "remaining_time": "2 days, 20:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 9627, "loss": 2.0098, "learning_rate": 9.995706582827922e-05, "epoch": 0.013192063986704061, "percentage": 1.32, "elapsed_time": "0:54:54", "remaining_time": "2 days, 20:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 9627, "loss": 1.9661, "learning_rate": 9.995638713636382e-05, "epoch": 0.013295938506284409, "percentage": 1.33, "elapsed_time": "0:55:21", "remaining_time": "2 days, 20:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 9627, "loss": 1.768, "learning_rate": 9.995570312448289e-05, "epoch": 0.013399813025864755, "percentage": 1.34, "elapsed_time": "0:55:46", "remaining_time": "2 days, 20:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 9627, "loss": 1.649, "learning_rate": 9.995501379270922e-05, "epoch": 0.013503687545445103, "percentage": 1.35, "elapsed_time": "0:56:13", "remaining_time": "2 days, 20:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 9627, "loss": 1.904, "learning_rate": 9.995431914111624e-05, "epoch": 0.013607562065025449, "percentage": 1.36, "elapsed_time": "0:56:38", "remaining_time": "2 days, 20:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 9627, "loss": 1.9214, "learning_rate": 9.995361916977795e-05, "epoch": 0.013711436584605797, "percentage": 1.37, "elapsed_time": "0:57:06", "remaining_time": "2 days, 20:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 9627, "loss": 1.9647, "learning_rate": 9.995291387876886e-05, "epoch": 0.013815311104186143, "percentage": 1.38, "elapsed_time": "0:57:32", "remaining_time": "2 days, 20:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 9627, "loss": 1.8797, "learning_rate": 9.99522032681641e-05, "epoch": 0.01391918562376649, "percentage": 1.39, "elapsed_time": "0:57:57", "remaining_time": "2 days, 20:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 9627, "loss": 1.9065, "learning_rate": 9.995148733803933e-05, "epoch": 0.014023060143346837, "percentage": 1.4, "elapsed_time": "0:58:25", "remaining_time": "2 days, 20:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 9627, "loss": 1.7649, "learning_rate": 9.995076608847078e-05, "epoch": 0.014126934662927184, "percentage": 1.41, "elapsed_time": "0:58:51", "remaining_time": "2 days, 20:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 9627, "loss": 1.7482, "learning_rate": 9.99500395195353e-05, "epoch": 0.01423080918250753, "percentage": 1.42, "elapsed_time": "0:59:17", "remaining_time": "2 days, 20:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 9627, "loss": 2.0021, "learning_rate": 9.994930763131022e-05, "epoch": 0.014334683702087878, "percentage": 1.43, "elapsed_time": "0:59:44", "remaining_time": "2 days, 20:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 9627, "loss": 1.9293, "learning_rate": 9.99485704238735e-05, "epoch": 0.014438558221668224, "percentage": 1.44, "elapsed_time": "1:00:09", "remaining_time": "2 days, 20:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 9627, "loss": 1.789, "learning_rate": 9.994782789730363e-05, "epoch": 0.014542432741248572, "percentage": 1.45, "elapsed_time": "1:00:35", "remaining_time": "2 days, 20:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 9627, "loss": 2.0092, "learning_rate": 9.994708005167972e-05, "epoch": 0.014646307260828918, "percentage": 1.46, "elapsed_time": "1:01:02", "remaining_time": "2 days, 20:27:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 9627, "loss": 1.9393, "learning_rate": 9.994632688708138e-05, "epoch": 0.014750181780409266, "percentage": 1.48, "elapsed_time": "1:01:28", "remaining_time": "2 days, 20:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 9627, "loss": 1.7967, "learning_rate": 9.994556840358882e-05, "epoch": 0.014854056299989612, "percentage": 1.49, "elapsed_time": "1:01:55", "remaining_time": "2 days, 20:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 9627, "loss": 1.8901, "learning_rate": 9.994480460128282e-05, "epoch": 0.01495793081956996, "percentage": 1.5, "elapsed_time": "1:02:20", "remaining_time": "2 days, 20:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 9627, "loss": 1.8006, "learning_rate": 9.99440354802447e-05, "epoch": 0.015061805339150306, "percentage": 1.51, "elapsed_time": "1:02:47", "remaining_time": "2 days, 20:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 9627, "loss": 1.9967, "learning_rate": 9.994326104055639e-05, "epoch": 0.015165679858730654, "percentage": 1.52, "elapsed_time": "1:03:13", "remaining_time": "2 days, 20:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 9627, "loss": 1.9811, "learning_rate": 9.994248128230035e-05, "epoch": 0.015269554378311, "percentage": 1.53, "elapsed_time": "1:03:40", "remaining_time": "2 days, 20:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 9627, "loss": 1.7302, "learning_rate": 9.994169620555962e-05, "epoch": 0.015373428897891348, "percentage": 1.54, "elapsed_time": "1:04:06", "remaining_time": "2 days, 20:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 9627, "loss": 1.8822, "learning_rate": 9.994090581041781e-05, "epoch": 0.015477303417471694, "percentage": 1.55, "elapsed_time": "1:04:33", "remaining_time": "2 days, 20:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 9627, "loss": 2.0916, "learning_rate": 9.994011009695908e-05, "epoch": 0.015581177937052042, "percentage": 1.56, "elapsed_time": "1:04:59", "remaining_time": "2 days, 20:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 9627, "loss": 1.6987, "learning_rate": 9.993930906526818e-05, "epoch": 0.01568505245663239, "percentage": 1.57, "elapsed_time": "1:05:25", "remaining_time": "2 days, 20:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 9627, "loss": 1.6714, "learning_rate": 9.993850271543039e-05, "epoch": 0.015788926976212734, "percentage": 1.58, "elapsed_time": "1:05:50", "remaining_time": "2 days, 20:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 9627, "loss": 2.0209, "learning_rate": 9.99376910475316e-05, "epoch": 0.015892801495793082, "percentage": 1.59, "elapsed_time": "1:06:17", "remaining_time": "2 days, 20:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 9627, "loss": 1.6677, "learning_rate": 9.993687406165826e-05, "epoch": 0.01599667601537343, "percentage": 1.6, "elapsed_time": "1:06:44", "remaining_time": "2 days, 20:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 9627, "loss": 1.863, "learning_rate": 9.993605175789733e-05, "epoch": 0.016100550534953777, "percentage": 1.61, "elapsed_time": "1:07:10", "remaining_time": "2 days, 20:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 9627, "loss": 1.9312, "learning_rate": 9.993522413633643e-05, "epoch": 0.016204425054534122, "percentage": 1.62, "elapsed_time": "1:07:37", "remaining_time": "2 days, 20:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 9627, "loss": 2.0446, "learning_rate": 9.993439119706364e-05, "epoch": 0.01630829957411447, "percentage": 1.63, "elapsed_time": "1:08:02", "remaining_time": "2 days, 20:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 9627, "loss": 1.7413, "learning_rate": 9.993355294016771e-05, "epoch": 0.016412174093694817, "percentage": 1.64, "elapsed_time": "1:08:29", "remaining_time": "2 days, 20:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 9627, "loss": 1.8413, "learning_rate": 9.993270936573788e-05, "epoch": 0.016516048613275165, "percentage": 1.65, "elapsed_time": "1:08:56", "remaining_time": "2 days, 20:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 9627, "loss": 1.9083, "learning_rate": 9.9931860473864e-05, "epoch": 0.01661992313285551, "percentage": 1.66, "elapsed_time": "1:09:22", "remaining_time": "2 days, 20:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 9627, "loss": 1.8213, "learning_rate": 9.993100626463646e-05, "epoch": 0.016723797652435857, "percentage": 1.67, "elapsed_time": "1:09:48", "remaining_time": "2 days, 20:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 9627, "loss": 2.1405, "learning_rate": 9.993014673814624e-05, "epoch": 0.016827672172016205, "percentage": 1.68, "elapsed_time": "1:10:14", "remaining_time": "2 days, 20:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 9627, "loss": 1.8398, "learning_rate": 9.992928189448484e-05, "epoch": 0.016931546691596553, "percentage": 1.69, "elapsed_time": "1:10:41", "remaining_time": "2 days, 20:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 9627, "loss": 1.8151, "learning_rate": 9.992841173374441e-05, "epoch": 0.017035421211176897, "percentage": 1.7, "elapsed_time": "1:11:07", "remaining_time": "2 days, 20:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 9627, "loss": 1.7062, "learning_rate": 9.992753625601756e-05, "epoch": 0.017139295730757245, "percentage": 1.71, "elapsed_time": "1:11:32", "remaining_time": "2 days, 20:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 9627, "loss": 1.6682, "learning_rate": 9.992665546139757e-05, "epoch": 0.017243170250337593, "percentage": 1.72, "elapsed_time": "1:12:00", "remaining_time": "2 days, 20:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 9627, "loss": 1.9738, "learning_rate": 9.992576934997819e-05, "epoch": 0.017347044769917937, "percentage": 1.73, "elapsed_time": "1:12:26", "remaining_time": "2 days, 20:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 9627, "loss": 1.9593, "learning_rate": 9.992487792185383e-05, "epoch": 0.017450919289498285, "percentage": 1.75, "elapsed_time": "1:12:53", "remaining_time": "2 days, 20:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 9627, "loss": 1.8838, "learning_rate": 9.992398117711941e-05, "epoch": 0.017554793809078633, "percentage": 1.76, "elapsed_time": "1:13:18", "remaining_time": "2 days, 20:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 9627, "loss": 1.7701, "learning_rate": 9.99230791158704e-05, "epoch": 0.01765866832865898, "percentage": 1.77, "elapsed_time": "1:13:44", "remaining_time": "2 days, 20:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 9627, "loss": 1.8656, "learning_rate": 9.992217173820288e-05, "epoch": 0.017762542848239325, "percentage": 1.78, "elapsed_time": "1:14:11", "remaining_time": "2 days, 20:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 9627, "loss": 1.7344, "learning_rate": 9.992125904421348e-05, "epoch": 0.017866417367819673, "percentage": 1.79, "elapsed_time": "1:14:37", "remaining_time": "2 days, 20:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 9627, "loss": 1.6855, "learning_rate": 9.992034103399939e-05, "epoch": 0.01797029188740002, "percentage": 1.8, "elapsed_time": "1:15:02", "remaining_time": "2 days, 20:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 9627, "loss": 1.8554, "learning_rate": 9.991941770765838e-05, "epoch": 0.01807416640698037, "percentage": 1.81, "elapsed_time": "1:15:30", "remaining_time": "2 days, 20:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 9627, "loss": 1.9407, "learning_rate": 9.991848906528876e-05, "epoch": 0.018178040926560713, "percentage": 1.82, "elapsed_time": "1:15:55", "remaining_time": "2 days, 20:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 9627, "loss": 1.8553, "learning_rate": 9.991755510698944e-05, "epoch": 0.01828191544614106, "percentage": 1.83, "elapsed_time": "1:16:21", "remaining_time": "2 days, 20:20:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 9627, "loss": 1.77, "learning_rate": 9.991661583285987e-05, "epoch": 0.01838578996572141, "percentage": 1.84, "elapsed_time": "1:16:48", "remaining_time": "2 days, 20:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 9627, "loss": 1.8825, "learning_rate": 9.991567124300009e-05, "epoch": 0.018489664485301757, "percentage": 1.85, "elapsed_time": "1:17:14", "remaining_time": "2 days, 20:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 9627, "loss": 1.9889, "learning_rate": 9.991472133751067e-05, "epoch": 0.0185935390048821, "percentage": 1.86, "elapsed_time": "1:17:41", "remaining_time": "2 days, 20:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 9627, "loss": 1.683, "learning_rate": 9.991376611649279e-05, "epoch": 0.01869741352446245, "percentage": 1.87, "elapsed_time": "1:18:08", "remaining_time": "2 days, 20:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 9627, "loss": 1.9933, "learning_rate": 9.991280558004815e-05, "epoch": 0.018801288044042797, "percentage": 1.88, "elapsed_time": "1:18:32", "remaining_time": "2 days, 20:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 9627, "loss": 1.8897, "learning_rate": 9.991183972827904e-05, "epoch": 0.018905162563623144, "percentage": 1.89, "elapsed_time": "1:19:00", "remaining_time": "2 days, 20:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 9627, "loss": 1.6934, "learning_rate": 9.991086856128833e-05, "epoch": 0.01900903708320349, "percentage": 1.9, "elapsed_time": "1:19:26", "remaining_time": "2 days, 20:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 9627, "loss": 1.9867, "learning_rate": 9.990989207917944e-05, "epoch": 0.019112911602783837, "percentage": 1.91, "elapsed_time": "1:19:53", "remaining_time": "2 days, 20:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 9627, "loss": 2.0397, "learning_rate": 9.990891028205636e-05, "epoch": 0.019216786122364184, "percentage": 1.92, "elapsed_time": "1:20:19", "remaining_time": "2 days, 20:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 9627, "loss": 1.6816, "learning_rate": 9.990792317002364e-05, "epoch": 0.019320660641944532, "percentage": 1.93, "elapsed_time": "1:20:45", "remaining_time": "2 days, 20:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 9627, "loss": 1.8124, "learning_rate": 9.99069307431864e-05, "epoch": 0.019424535161524877, "percentage": 1.94, "elapsed_time": "1:21:12", "remaining_time": "2 days, 20:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 9627, "loss": 1.6452, "learning_rate": 9.990593300165033e-05, "epoch": 0.019528409681105224, "percentage": 1.95, "elapsed_time": "1:21:38", "remaining_time": "2 days, 20:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 9627, "loss": 2.088, "learning_rate": 9.990492994552167e-05, "epoch": 0.019632284200685572, "percentage": 1.96, "elapsed_time": "1:22:04", "remaining_time": "2 days, 20:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 9627, "loss": 1.9396, "learning_rate": 9.990392157490724e-05, "epoch": 0.01973615872026592, "percentage": 1.97, "elapsed_time": "1:22:31", "remaining_time": "2 days, 20:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 9627, "loss": 1.9863, "learning_rate": 9.990290788991443e-05, "epoch": 0.019840033239846264, "percentage": 1.98, "elapsed_time": "1:22:57", "remaining_time": "2 days, 20:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 9627, "loss": 1.902, "learning_rate": 9.99018888906512e-05, "epoch": 0.019943907759426612, "percentage": 1.99, "elapsed_time": "1:23:24", "remaining_time": "2 days, 20:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 9627, "loss": 1.8484, "learning_rate": 9.990086457722604e-05, "epoch": 0.02004778227900696, "percentage": 2.0, "elapsed_time": "1:23:50", "remaining_time": "2 days, 20:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 9627, "loss": 1.9543, "learning_rate": 9.989983494974805e-05, "epoch": 0.020151656798587308, "percentage": 2.02, "elapsed_time": "1:24:16", "remaining_time": "2 days, 20:17:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 9627, "loss": 1.8695, "learning_rate": 9.989880000832686e-05, "epoch": 0.020255531318167652, "percentage": 2.03, "elapsed_time": "1:24:42", "remaining_time": "2 days, 20:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 9627, "loss": 1.7589, "learning_rate": 9.989775975307272e-05, "epoch": 0.020359405837748, "percentage": 2.04, "elapsed_time": "1:25:09", "remaining_time": "2 days, 20:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 9627, "loss": 2.1527, "learning_rate": 9.989671418409636e-05, "epoch": 0.020463280357328348, "percentage": 2.05, "elapsed_time": "1:25:35", "remaining_time": "2 days, 20:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 9627, "loss": 1.7132, "learning_rate": 9.989566330150914e-05, "epoch": 0.020567154876908696, "percentage": 2.06, "elapsed_time": "1:26:02", "remaining_time": "2 days, 20:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 9627, "loss": 1.8913, "learning_rate": 9.989460710542301e-05, "epoch": 0.02067102939648904, "percentage": 2.07, "elapsed_time": "1:26:28", "remaining_time": "2 days, 20:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 9627, "loss": 2.191, "learning_rate": 9.98935455959504e-05, "epoch": 0.020774903916069388, "percentage": 2.08, "elapsed_time": "1:26:54", "remaining_time": "2 days, 20:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 9627, "loss": 1.9199, "learning_rate": 9.989247877320436e-05, "epoch": 0.020878778435649736, "percentage": 2.09, "elapsed_time": "1:27:20", "remaining_time": "2 days, 20:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 9627, "loss": 1.831, "learning_rate": 9.989140663729852e-05, "epoch": 0.020982652955230083, "percentage": 2.1, "elapsed_time": "1:27:47", "remaining_time": "2 days, 20:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 9627, "loss": 1.8922, "learning_rate": 9.989032918834704e-05, "epoch": 0.021086527474810428, "percentage": 2.11, "elapsed_time": "1:28:13", "remaining_time": "2 days, 20:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 9627, "loss": 1.8271, "learning_rate": 9.988924642646466e-05, "epoch": 0.021190401994390776, "percentage": 2.12, "elapsed_time": "1:28:39", "remaining_time": "2 days, 20:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 9627, "loss": 1.9391, "learning_rate": 9.988815835176668e-05, "epoch": 0.021294276513971123, "percentage": 2.13, "elapsed_time": "1:29:05", "remaining_time": "2 days, 20:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 9627, "loss": 1.6495, "learning_rate": 9.9887064964369e-05, "epoch": 0.02139815103355147, "percentage": 2.14, "elapsed_time": "1:29:32", "remaining_time": "2 days, 20:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 9627, "loss": 1.8272, "learning_rate": 9.988596626438801e-05, "epoch": 0.021502025553131816, "percentage": 2.15, "elapsed_time": "1:29:58", "remaining_time": "2 days, 20:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 9627, "loss": 1.8506, "learning_rate": 9.988486225194075e-05, "epoch": 0.021605900072712163, "percentage": 2.16, "elapsed_time": "1:30:24", "remaining_time": "2 days, 20:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 9627, "loss": 1.8219, "learning_rate": 9.988375292714478e-05, "epoch": 0.02170977459229251, "percentage": 2.17, "elapsed_time": "1:30:50", "remaining_time": "2 days, 20:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 9627, "loss": 1.8984, "learning_rate": 9.988263829011822e-05, "epoch": 0.02181364911187286, "percentage": 2.18, "elapsed_time": "1:31:17", "remaining_time": "2 days, 20:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 9627, "loss": 1.8276, "learning_rate": 9.988151834097979e-05, "epoch": 0.021917523631453203, "percentage": 2.19, "elapsed_time": "1:31:43", "remaining_time": "2 days, 20:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 9627, "loss": 1.8979, "learning_rate": 9.988039307984874e-05, "epoch": 0.02202139815103355, "percentage": 2.2, "elapsed_time": "1:32:09", "remaining_time": "2 days, 20:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 9627, "loss": 1.8392, "learning_rate": 9.987926250684491e-05, "epoch": 0.0221252726706139, "percentage": 2.21, "elapsed_time": "1:32:37", "remaining_time": "2 days, 20:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 9627, "loss": 1.8287, "learning_rate": 9.98781266220887e-05, "epoch": 0.022229147190194247, "percentage": 2.22, "elapsed_time": "1:33:02", "remaining_time": "2 days, 20:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 9627, "loss": 1.8612, "learning_rate": 9.987698542570107e-05, "epoch": 0.02233302170977459, "percentage": 2.23, "elapsed_time": "1:33:30", "remaining_time": "2 days, 20:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 9627, "loss": 1.9711, "learning_rate": 9.987583891780355e-05, "epoch": 0.02243689622935494, "percentage": 2.24, "elapsed_time": "1:33:56", "remaining_time": "2 days, 20:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 9627, "loss": 1.7615, "learning_rate": 9.987468709851823e-05, "epoch": 0.022540770748935287, "percentage": 2.25, "elapsed_time": "1:34:21", "remaining_time": "2 days, 20:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 9627, "loss": 1.694, "learning_rate": 9.987352996796777e-05, "epoch": 0.022644645268515635, "percentage": 2.26, "elapsed_time": "1:34:49", "remaining_time": "2 days, 20:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 9627, "loss": 1.7834, "learning_rate": 9.98723675262754e-05, "epoch": 0.02274851978809598, "percentage": 2.27, "elapsed_time": "1:35:14", "remaining_time": "2 days, 20:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 9627, "loss": 1.8788, "learning_rate": 9.987119977356491e-05, "epoch": 0.022852394307676327, "percentage": 2.29, "elapsed_time": "1:35:42", "remaining_time": "2 days, 20:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 9627, "loss": 1.9663, "learning_rate": 9.987002670996064e-05, "epoch": 0.022956268827256675, "percentage": 2.3, "elapsed_time": "1:36:07", "remaining_time": "2 days, 20:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 9627, "loss": 1.822, "learning_rate": 9.986884833558754e-05, "epoch": 0.023060143346837023, "percentage": 2.31, "elapsed_time": "1:36:35", "remaining_time": "2 days, 20:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 9627, "loss": 1.8147, "learning_rate": 9.986766465057108e-05, "epoch": 0.023164017866417367, "percentage": 2.32, "elapsed_time": "1:37:01", "remaining_time": "2 days, 20:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 9627, "loss": 1.7854, "learning_rate": 9.986647565503731e-05, "epoch": 0.023267892385997715, "percentage": 2.33, "elapsed_time": "1:37:27", "remaining_time": "2 days, 20:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 9627, "loss": 1.6783, "learning_rate": 9.986528134911288e-05, "epoch": 0.023371766905578063, "percentage": 2.34, "elapsed_time": "1:37:54", "remaining_time": "2 days, 20:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 9627, "loss": 1.9996, "learning_rate": 9.986408173292492e-05, "epoch": 0.023475641425158407, "percentage": 2.35, "elapsed_time": "1:38:21", "remaining_time": "2 days, 20:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 9627, "loss": 1.8241, "learning_rate": 9.986287680660123e-05, "epoch": 0.023579515944738755, "percentage": 2.36, "elapsed_time": "1:38:47", "remaining_time": "2 days, 20:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 9627, "loss": 1.9336, "learning_rate": 9.98616665702701e-05, "epoch": 0.023683390464319103, "percentage": 2.37, "elapsed_time": "1:39:13", "remaining_time": "2 days, 20:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 9627, "loss": 1.7719, "learning_rate": 9.986045102406042e-05, "epoch": 0.02378726498389945, "percentage": 2.38, "elapsed_time": "1:39:40", "remaining_time": "2 days, 20:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 9627, "loss": 1.8026, "learning_rate": 9.985923016810163e-05, "epoch": 0.023891139503479795, "percentage": 2.39, "elapsed_time": "1:40:06", "remaining_time": "2 days, 20:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 9627, "loss": 1.9196, "learning_rate": 9.985800400252374e-05, "epoch": 0.023995014023060143, "percentage": 2.4, "elapsed_time": "1:40:33", "remaining_time": "2 days, 20:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 9627, "loss": 1.8512, "learning_rate": 9.985677252745733e-05, "epoch": 0.02409888854264049, "percentage": 2.41, "elapsed_time": "1:40:59", "remaining_time": "2 days, 20:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 9627, "loss": 1.8336, "learning_rate": 9.985553574303354e-05, "epoch": 0.024202763062220838, "percentage": 2.42, "elapsed_time": "1:41:25", "remaining_time": "2 days, 20:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 9627, "loss": 1.6927, "learning_rate": 9.98542936493841e-05, "epoch": 0.024306637581801183, "percentage": 2.43, "elapsed_time": "1:41:51", "remaining_time": "2 days, 20:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 9627, "loss": 1.8582, "learning_rate": 9.985304624664125e-05, "epoch": 0.02441051210138153, "percentage": 2.44, "elapsed_time": "1:42:18", "remaining_time": "2 days, 20:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 9627, "loss": 1.9107, "learning_rate": 9.985179353493785e-05, "epoch": 0.024514386620961878, "percentage": 2.45, "elapsed_time": "1:42:44", "remaining_time": "2 days, 20:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 9627, "loss": 1.6351, "learning_rate": 9.98505355144073e-05, "epoch": 0.024618261140542226, "percentage": 2.46, "elapsed_time": "1:43:11", "remaining_time": "2 days, 20:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 9627, "loss": 1.7564, "learning_rate": 9.984927218518356e-05, "epoch": 0.02472213566012257, "percentage": 2.47, "elapsed_time": "1:43:38", "remaining_time": "2 days, 20:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 9627, "loss": 1.7372, "learning_rate": 9.984800354740117e-05, "epoch": 0.024826010179702918, "percentage": 2.48, "elapsed_time": "1:44:04", "remaining_time": "2 days, 20:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 9627, "loss": 1.7131, "learning_rate": 9.984672960119523e-05, "epoch": 0.024929884699283266, "percentage": 2.49, "elapsed_time": "1:44:30", "remaining_time": "2 days, 20:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 9627, "loss": 1.7636, "learning_rate": 9.984545034670142e-05, "epoch": 0.025033759218863614, "percentage": 2.5, "elapsed_time": "1:44:57", "remaining_time": "2 days, 20:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 9627, "loss": 1.9847, "learning_rate": 9.984416578405596e-05, "epoch": 0.025137633738443958, "percentage": 2.51, "elapsed_time": "1:45:23", "remaining_time": "2 days, 20:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 9627, "loss": 2.0124, "learning_rate": 9.984287591339562e-05, "epoch": 0.025241508258024306, "percentage": 2.52, "elapsed_time": "1:45:49", "remaining_time": "2 days, 20:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 9627, "loss": 1.8527, "learning_rate": 9.98415807348578e-05, "epoch": 0.025345382777604654, "percentage": 2.53, "elapsed_time": "1:46:15", "remaining_time": "2 days, 20:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 9627, "loss": 1.8608, "learning_rate": 9.984028024858041e-05, "epoch": 0.025449257297185002, "percentage": 2.54, "elapsed_time": "1:46:42", "remaining_time": "2 days, 20:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 9627, "loss": 2.029, "learning_rate": 9.983897445470194e-05, "epoch": 0.025553131816765346, "percentage": 2.56, "elapsed_time": "1:47:08", "remaining_time": "2 days, 20:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 9627, "loss": 1.9682, "learning_rate": 9.983766335336144e-05, "epoch": 0.025657006336345694, "percentage": 2.57, "elapsed_time": "1:47:34", "remaining_time": "2 days, 20:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 9627, "loss": 1.6414, "learning_rate": 9.983634694469855e-05, "epoch": 0.025760880855926042, "percentage": 2.58, "elapsed_time": "1:48:01", "remaining_time": "2 days, 20:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 9627, "loss": 1.7982, "learning_rate": 9.983502522885347e-05, "epoch": 0.02586475537550639, "percentage": 2.59, "elapsed_time": "1:48:27", "remaining_time": "2 days, 20:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 9627, "loss": 1.8246, "learning_rate": 9.983369820596691e-05, "epoch": 0.025968629895086734, "percentage": 2.6, "elapsed_time": "1:48:53", "remaining_time": "2 days, 20:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 9627, "loss": 1.733, "learning_rate": 9.98323658761802e-05, "epoch": 0.026072504414667082, "percentage": 2.61, "elapsed_time": "1:49:20", "remaining_time": "2 days, 20:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 9627, "loss": 1.6995, "learning_rate": 9.983102823963524e-05, "epoch": 0.02617637893424743, "percentage": 2.62, "elapsed_time": "1:49:47", "remaining_time": "2 days, 20:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 9627, "loss": 1.5215, "learning_rate": 9.982968529647447e-05, "epoch": 0.026280253453827777, "percentage": 2.63, "elapsed_time": "1:50:13", "remaining_time": "2 days, 20:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 9627, "loss": 1.8707, "learning_rate": 9.982833704684091e-05, "epoch": 0.026384127973408122, "percentage": 2.64, "elapsed_time": "1:50:39", "remaining_time": "2 days, 20:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 9627, "loss": 1.7123, "learning_rate": 9.982698349087812e-05, "epoch": 0.02648800249298847, "percentage": 2.65, "elapsed_time": "1:51:06", "remaining_time": "2 days, 20:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 9627, "loss": 1.7335, "learning_rate": 9.982562462873026e-05, "epoch": 0.026591877012568817, "percentage": 2.66, "elapsed_time": "1:51:32", "remaining_time": "2 days, 20:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 9627, "loss": 1.9431, "learning_rate": 9.982426046054204e-05, "epoch": 0.026695751532149165, "percentage": 2.67, "elapsed_time": "1:51:59", "remaining_time": "2 days, 20:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 9627, "loss": 1.8024, "learning_rate": 9.982289098645872e-05, "epoch": 0.02679962605172951, "percentage": 2.68, "elapsed_time": "1:52:25", "remaining_time": "2 days, 20:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 9627, "loss": 1.8129, "learning_rate": 9.982151620662612e-05, "epoch": 0.026903500571309857, "percentage": 2.69, "elapsed_time": "1:52:52", "remaining_time": "2 days, 20:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 9627, "loss": 1.8653, "learning_rate": 9.98201361211907e-05, "epoch": 0.027007375090890205, "percentage": 2.7, "elapsed_time": "1:53:18", "remaining_time": "2 days, 20:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 9627, "loss": 1.7716, "learning_rate": 9.981875073029938e-05, "epoch": 0.027111249610470553, "percentage": 2.71, "elapsed_time": "1:53:44", "remaining_time": "2 days, 20:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 9627, "loss": 1.8481, "learning_rate": 9.981736003409971e-05, "epoch": 0.027215124130050897, "percentage": 2.72, "elapsed_time": "1:54:13", "remaining_time": "2 days, 20:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 9627, "loss": 2.0175, "learning_rate": 9.981596403273978e-05, "epoch": 0.027318998649631245, "percentage": 2.73, "elapsed_time": "1:54:38", "remaining_time": "2 days, 20:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 9627, "loss": 1.6928, "learning_rate": 9.981456272636826e-05, "epoch": 0.027422873169211593, "percentage": 2.74, "elapsed_time": "1:55:05", "remaining_time": "2 days, 20:02:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 9627, "loss": 1.9024, "learning_rate": 9.981315611513438e-05, "epoch": 0.02752674768879194, "percentage": 2.75, "elapsed_time": "1:55:32", "remaining_time": "2 days, 20:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 9627, "loss": 1.8439, "learning_rate": 9.981174419918795e-05, "epoch": 0.027630622208372285, "percentage": 2.76, "elapsed_time": "1:55:59", "remaining_time": "2 days, 20:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 9627, "loss": 2.0282, "learning_rate": 9.981032697867929e-05, "epoch": 0.027734496727952633, "percentage": 2.77, "elapsed_time": "1:56:26", "remaining_time": "2 days, 20:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 9627, "loss": 1.7793, "learning_rate": 9.980890445375934e-05, "epoch": 0.02783837124753298, "percentage": 2.78, "elapsed_time": "1:56:51", "remaining_time": "2 days, 20:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 9627, "loss": 1.8332, "learning_rate": 9.980747662457961e-05, "epoch": 0.02794224576711333, "percentage": 2.79, "elapsed_time": "1:57:19", "remaining_time": "2 days, 20:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 9627, "loss": 1.6546, "learning_rate": 9.980604349129211e-05, "epoch": 0.028046120286693673, "percentage": 2.8, "elapsed_time": "1:57:44", "remaining_time": "2 days, 20:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 9627, "loss": 1.9148, "learning_rate": 9.980460505404949e-05, "epoch": 0.02814999480627402, "percentage": 2.81, "elapsed_time": "1:58:12", "remaining_time": "2 days, 20:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 9627, "loss": 1.8963, "learning_rate": 9.980316131300493e-05, "epoch": 0.02825386932585437, "percentage": 2.83, "elapsed_time": "1:58:38", "remaining_time": "2 days, 20:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 9627, "loss": 1.7182, "learning_rate": 9.980171226831216e-05, "epoch": 0.028357743845434717, "percentage": 2.84, "elapsed_time": "1:59:05", "remaining_time": "2 days, 20:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 9627, "loss": 1.7612, "learning_rate": 9.980025792012551e-05, "epoch": 0.02846161836501506, "percentage": 2.85, "elapsed_time": "1:59:32", "remaining_time": "2 days, 20:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 9627, "loss": 1.8107, "learning_rate": 9.979879826859983e-05, "epoch": 0.02856549288459541, "percentage": 2.86, "elapsed_time": "1:59:59", "remaining_time": "2 days, 20:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 9627, "loss": 1.8116, "learning_rate": 9.97973333138906e-05, "epoch": 0.028669367404175757, "percentage": 2.87, "elapsed_time": "2:00:25", "remaining_time": "2 days, 20:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 9627, "loss": 1.968, "learning_rate": 9.97958630561538e-05, "epoch": 0.028773241923756104, "percentage": 2.88, "elapsed_time": "2:00:52", "remaining_time": "2 days, 19:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 9627, "loss": 1.7281, "learning_rate": 9.9794387495546e-05, "epoch": 0.02887711644333645, "percentage": 2.89, "elapsed_time": "2:01:19", "remaining_time": "2 days, 19:59:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 9627, "loss": 1.8249, "learning_rate": 9.979290663222434e-05, "epoch": 0.028980990962916797, "percentage": 2.9, "elapsed_time": "2:01:45", "remaining_time": "2 days, 19:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 9627, "loss": 1.8084, "learning_rate": 9.979142046634653e-05, "epoch": 0.029084865482497144, "percentage": 2.91, "elapsed_time": "2:02:12", "remaining_time": "2 days, 19:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 9627, "loss": 1.9606, "learning_rate": 9.978992899807084e-05, "epoch": 0.02918874000207749, "percentage": 2.92, "elapsed_time": "2:02:38", "remaining_time": "2 days, 19:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 9627, "loss": 1.8753, "learning_rate": 9.978843222755607e-05, "epoch": 0.029292614521657837, "percentage": 2.93, "elapsed_time": "2:03:05", "remaining_time": "2 days, 19:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 9627, "loss": 1.948, "learning_rate": 9.978693015496165e-05, "epoch": 0.029396489041238184, "percentage": 2.94, "elapsed_time": "2:03:31", "remaining_time": "2 days, 19:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 9627, "loss": 1.8796, "learning_rate": 9.978542278044751e-05, "epoch": 0.029500363560818532, "percentage": 2.95, "elapsed_time": "2:03:57", "remaining_time": "2 days, 19:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 9627, "loss": 1.8221, "learning_rate": 9.978391010417418e-05, "epoch": 0.029604238080398877, "percentage": 2.96, "elapsed_time": "2:04:25", "remaining_time": "2 days, 19:58:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 9627, "loss": 1.7903, "learning_rate": 9.978239212630277e-05, "epoch": 0.029708112599979224, "percentage": 2.97, "elapsed_time": "2:04:52", "remaining_time": "2 days, 19:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 9627, "loss": 1.9183, "learning_rate": 9.978086884699492e-05, "epoch": 0.029811987119559572, "percentage": 2.98, "elapsed_time": "2:05:18", "remaining_time": "2 days, 19:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 9627, "loss": 1.8877, "learning_rate": 9.977934026641282e-05, "epoch": 0.02991586163913992, "percentage": 2.99, "elapsed_time": "2:05:46", "remaining_time": "2 days, 19:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 9627, "loss": 1.7437, "learning_rate": 9.977780638471928e-05, "epoch": 0.030019736158720264, "percentage": 3.0, "elapsed_time": "2:06:12", "remaining_time": "2 days, 19:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 9627, "loss": 1.794, "learning_rate": 9.977626720207764e-05, "epoch": 0.030123610678300612, "percentage": 3.01, "elapsed_time": "2:06:38", "remaining_time": "2 days, 19:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 9627, "loss": 1.8116, "learning_rate": 9.977472271865182e-05, "epoch": 0.03022748519788096, "percentage": 3.02, "elapsed_time": "2:07:04", "remaining_time": "2 days, 19:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 9627, "loss": 1.7871, "learning_rate": 9.977317293460631e-05, "epoch": 0.030331359717461308, "percentage": 3.03, "elapsed_time": "2:07:32", "remaining_time": "2 days, 19:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 9627, "loss": 1.8669, "learning_rate": 9.97716178501061e-05, "epoch": 0.030435234237041652, "percentage": 3.04, "elapsed_time": "2:07:58", "remaining_time": "2 days, 19:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 9627, "loss": 1.8061, "learning_rate": 9.977005746531682e-05, "epoch": 0.030539108756622, "percentage": 3.05, "elapsed_time": "2:08:24", "remaining_time": "2 days, 19:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 9627, "loss": 1.8189, "learning_rate": 9.976849178040466e-05, "epoch": 0.030642983276202348, "percentage": 3.06, "elapsed_time": "2:08:52", "remaining_time": "2 days, 19:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 9627, "loss": 1.7308, "learning_rate": 9.976692079553633e-05, "epoch": 0.030746857795782696, "percentage": 3.07, "elapsed_time": "2:09:18", "remaining_time": "2 days, 19:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 9627, "loss": 1.881, "learning_rate": 9.976534451087913e-05, "epoch": 0.03085073231536304, "percentage": 3.09, "elapsed_time": "2:09:45", "remaining_time": "2 days, 19:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 9627, "loss": 2.0111, "learning_rate": 9.976376292660091e-05, "epoch": 0.030954606834943388, "percentage": 3.1, "elapsed_time": "2:10:11", "remaining_time": "2 days, 19:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 9627, "loss": 2.1103, "learning_rate": 9.976217604287013e-05, "epoch": 0.031058481354523736, "percentage": 3.11, "elapsed_time": "2:10:38", "remaining_time": "2 days, 19:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 9627, "loss": 1.8858, "learning_rate": 9.976058385985575e-05, "epoch": 0.031162355874104083, "percentage": 3.12, "elapsed_time": "2:11:05", "remaining_time": "2 days, 19:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 9627, "loss": 1.7076, "learning_rate": 9.975898637772734e-05, "epoch": 0.03126623039368443, "percentage": 3.13, "elapsed_time": "2:11:31", "remaining_time": "2 days, 19:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 9627, "loss": 1.8058, "learning_rate": 9.975738359665501e-05, "epoch": 0.03137010491326478, "percentage": 3.14, "elapsed_time": "2:11:58", "remaining_time": "2 days, 19:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 9627, "loss": 1.8827, "learning_rate": 9.975577551680946e-05, "epoch": 0.03147397943284512, "percentage": 3.15, "elapsed_time": "2:12:24", "remaining_time": "2 days, 19:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 9627, "loss": 1.801, "learning_rate": 9.975416213836193e-05, "epoch": 0.03157785395242547, "percentage": 3.16, "elapsed_time": "2:12:51", "remaining_time": "2 days, 19:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 9627, "loss": 1.7826, "learning_rate": 9.975254346148422e-05, "epoch": 0.031681728472005816, "percentage": 3.17, "elapsed_time": "2:13:17", "remaining_time": "2 days, 19:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 9627, "loss": 1.7969, "learning_rate": 9.975091948634871e-05, "epoch": 0.031785602991586163, "percentage": 3.18, "elapsed_time": "2:13:45", "remaining_time": "2 days, 19:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 9627, "loss": 1.9499, "learning_rate": 9.974929021312836e-05, "epoch": 0.03188947751116651, "percentage": 3.19, "elapsed_time": "2:14:11", "remaining_time": "2 days, 19:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 9627, "loss": 1.9003, "learning_rate": 9.974765564199665e-05, "epoch": 0.03199335203074686, "percentage": 3.2, "elapsed_time": "2:14:37", "remaining_time": "2 days, 19:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 9627, "loss": 1.8738, "learning_rate": 9.974601577312768e-05, "epoch": 0.03209722655032721, "percentage": 3.21, "elapsed_time": "2:15:05", "remaining_time": "2 days, 19:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 9627, "loss": 1.8817, "learning_rate": 9.974437060669603e-05, "epoch": 0.032201101069907555, "percentage": 3.22, "elapsed_time": "2:15:31", "remaining_time": "2 days, 19:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 9627, "loss": 1.8391, "learning_rate": 9.974272014287697e-05, "epoch": 0.032304975589487896, "percentage": 3.23, "elapsed_time": "2:15:57", "remaining_time": "2 days, 19:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 9627, "loss": 1.8881, "learning_rate": 9.97410643818462e-05, "epoch": 0.032408850109068243, "percentage": 3.24, "elapsed_time": "2:16:25", "remaining_time": "2 days, 19:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 9627, "loss": 1.8975, "learning_rate": 9.973940332378007e-05, "epoch": 0.03251272462864859, "percentage": 3.25, "elapsed_time": "2:16:51", "remaining_time": "2 days, 19:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 9627, "loss": 1.7162, "learning_rate": 9.973773696885547e-05, "epoch": 0.03261659914822894, "percentage": 3.26, "elapsed_time": "2:17:18", "remaining_time": "2 days, 19:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 9627, "loss": 1.9902, "learning_rate": 9.973606531724985e-05, "epoch": 0.03272047366780929, "percentage": 3.27, "elapsed_time": "2:17:45", "remaining_time": "2 days, 19:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 9627, "loss": 1.9183, "learning_rate": 9.973438836914124e-05, "epoch": 0.032824348187389635, "percentage": 3.28, "elapsed_time": "2:18:11", "remaining_time": "2 days, 19:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 9627, "loss": 1.8884, "learning_rate": 9.973270612470822e-05, "epoch": 0.03292822270696998, "percentage": 3.29, "elapsed_time": "2:18:39", "remaining_time": "2 days, 19:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 9627, "loss": 1.9219, "learning_rate": 9.97310185841299e-05, "epoch": 0.03303209722655033, "percentage": 3.3, "elapsed_time": "2:19:06", "remaining_time": "2 days, 19:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 9627, "loss": 1.9071, "learning_rate": 9.972932574758604e-05, "epoch": 0.03313597174613067, "percentage": 3.31, "elapsed_time": "2:19:32", "remaining_time": "2 days, 19:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 9627, "loss": 1.7418, "learning_rate": 9.972762761525689e-05, "epoch": 0.03323984626571102, "percentage": 3.32, "elapsed_time": "2:19:59", "remaining_time": "2 days, 19:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 9627, "loss": 1.7941, "learning_rate": 9.972592418732327e-05, "epoch": 0.03334372078529137, "percentage": 3.33, "elapsed_time": "2:20:26", "remaining_time": "2 days, 19:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 9627, "loss": 1.8983, "learning_rate": 9.972421546396662e-05, "epoch": 0.033447595304871715, "percentage": 3.34, "elapsed_time": "2:20:52", "remaining_time": "2 days, 19:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 9627, "loss": 1.947, "learning_rate": 9.972250144536888e-05, "epoch": 0.03355146982445206, "percentage": 3.36, "elapsed_time": "2:21:19", "remaining_time": "2 days, 19:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 9627, "loss": 1.7318, "learning_rate": 9.972078213171259e-05, "epoch": 0.03365534434403241, "percentage": 3.37, "elapsed_time": "2:21:46", "remaining_time": "2 days, 19:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 9627, "loss": 1.6396, "learning_rate": 9.971905752318084e-05, "epoch": 0.03375921886361276, "percentage": 3.38, "elapsed_time": "2:22:14", "remaining_time": "2 days, 19:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 9627, "loss": 1.8063, "learning_rate": 9.971732761995728e-05, "epoch": 0.033863093383193106, "percentage": 3.39, "elapsed_time": "2:22:39", "remaining_time": "2 days, 19:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 9627, "loss": 1.7624, "learning_rate": 9.971559242222615e-05, "epoch": 0.03396696790277345, "percentage": 3.4, "elapsed_time": "2:23:08", "remaining_time": "2 days, 19:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 9627, "loss": 1.7963, "learning_rate": 9.971385193017221e-05, "epoch": 0.034070842422353795, "percentage": 3.41, "elapsed_time": "2:23:33", "remaining_time": "2 days, 19:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 9627, "loss": 1.7648, "learning_rate": 9.971210614398084e-05, "epoch": 0.03417471694193414, "percentage": 3.42, "elapsed_time": "2:24:01", "remaining_time": "2 days, 19:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 9627, "loss": 1.8365, "learning_rate": 9.971035506383792e-05, "epoch": 0.03427859146151449, "percentage": 3.43, "elapsed_time": "2:24:27", "remaining_time": "2 days, 19:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 9627, "loss": 1.9249, "learning_rate": 9.970859868992995e-05, "epoch": 0.03438246598109484, "percentage": 3.44, "elapsed_time": "2:24:55", "remaining_time": "2 days, 19:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 9627, "loss": 1.881, "learning_rate": 9.970683702244395e-05, "epoch": 0.034486340500675186, "percentage": 3.45, "elapsed_time": "2:25:21", "remaining_time": "2 days, 19:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 9627, "loss": 1.8085, "learning_rate": 9.970507006156755e-05, "epoch": 0.034590215020255534, "percentage": 3.46, "elapsed_time": "2:25:49", "remaining_time": "2 days, 19:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 9627, "loss": 1.8762, "learning_rate": 9.970329780748888e-05, "epoch": 0.034694089539835875, "percentage": 3.47, "elapsed_time": "2:26:15", "remaining_time": "2 days, 19:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 9627, "loss": 1.7262, "learning_rate": 9.970152026039672e-05, "epoch": 0.03479796405941622, "percentage": 3.48, "elapsed_time": "2:26:43", "remaining_time": "2 days, 19:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 9627, "loss": 1.7248, "learning_rate": 9.969973742048032e-05, "epoch": 0.03490183857899657, "percentage": 3.49, "elapsed_time": "2:27:09", "remaining_time": "2 days, 19:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 9627, "loss": 1.7031, "learning_rate": 9.969794928792957e-05, "epoch": 0.03500571309857692, "percentage": 3.5, "elapsed_time": "2:27:36", "remaining_time": "2 days, 19:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 9627, "loss": 2.0297, "learning_rate": 9.969615586293488e-05, "epoch": 0.035109587618157266, "percentage": 3.51, "elapsed_time": "2:28:02", "remaining_time": "2 days, 19:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 9627, "loss": 1.9272, "learning_rate": 9.969435714568722e-05, "epoch": 0.035213462137737614, "percentage": 3.52, "elapsed_time": "2:28:30", "remaining_time": "2 days, 19:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 9627, "loss": 1.8647, "learning_rate": 9.969255313637818e-05, "epoch": 0.03531733665731796, "percentage": 3.53, "elapsed_time": "2:28:57", "remaining_time": "2 days, 19:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 9627, "loss": 1.8622, "learning_rate": 9.969074383519983e-05, "epoch": 0.03542121117689831, "percentage": 3.54, "elapsed_time": "2:29:23", "remaining_time": "2 days, 19:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 9627, "loss": 1.7988, "learning_rate": 9.968892924234487e-05, "epoch": 0.03552508569647865, "percentage": 3.55, "elapsed_time": "2:29:50", "remaining_time": "2 days, 19:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 9627, "loss": 1.8039, "learning_rate": 9.968710935800652e-05, "epoch": 0.035628960216059, "percentage": 3.56, "elapsed_time": "2:30:18", "remaining_time": "2 days, 19:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 9627, "loss": 2.0847, "learning_rate": 9.968528418237862e-05, "epoch": 0.035732834735639346, "percentage": 3.57, "elapsed_time": "2:30:44", "remaining_time": "2 days, 19:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 9627, "loss": 2.0207, "learning_rate": 9.96834537156555e-05, "epoch": 0.035836709255219694, "percentage": 3.58, "elapsed_time": "2:31:12", "remaining_time": "2 days, 19:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 9627, "loss": 1.9464, "learning_rate": 9.96816179580321e-05, "epoch": 0.03594058377480004, "percentage": 3.59, "elapsed_time": "2:31:38", "remaining_time": "2 days, 19:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 9627, "loss": 1.9318, "learning_rate": 9.967977690970393e-05, "epoch": 0.03604445829438039, "percentage": 3.6, "elapsed_time": "2:32:05", "remaining_time": "2 days, 19:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 9627, "loss": 1.8081, "learning_rate": 9.967793057086706e-05, "epoch": 0.03614833281396074, "percentage": 3.61, "elapsed_time": "2:32:32", "remaining_time": "2 days, 19:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 9627, "loss": 1.7424, "learning_rate": 9.967607894171804e-05, "epoch": 0.036252207333541085, "percentage": 3.63, "elapsed_time": "2:32:59", "remaining_time": "2 days, 19:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 9627, "loss": 1.9266, "learning_rate": 9.967422202245413e-05, "epoch": 0.036356081853121426, "percentage": 3.64, "elapsed_time": "2:33:26", "remaining_time": "2 days, 19:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 9627, "loss": 1.8344, "learning_rate": 9.967235981327304e-05, "epoch": 0.036459956372701774, "percentage": 3.65, "elapsed_time": "2:33:53", "remaining_time": "2 days, 19:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 9627, "loss": 1.7158, "learning_rate": 9.967049231437309e-05, "epoch": 0.03656383089228212, "percentage": 3.66, "elapsed_time": "2:34:19", "remaining_time": "2 days, 19:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 9627, "loss": 1.9844, "learning_rate": 9.966861952595316e-05, "epoch": 0.03666770541186247, "percentage": 3.67, "elapsed_time": "2:34:47", "remaining_time": "2 days, 19:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 9627, "loss": 2.0037, "learning_rate": 9.966674144821266e-05, "epoch": 0.03677157993144282, "percentage": 3.68, "elapsed_time": "2:35:14", "remaining_time": "2 days, 19:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 9627, "loss": 1.7922, "learning_rate": 9.966485808135165e-05, "epoch": 0.036875454451023165, "percentage": 3.69, "elapsed_time": "2:35:41", "remaining_time": "2 days, 19:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 9627, "loss": 1.8094, "learning_rate": 9.966296942557062e-05, "epoch": 0.03697932897060351, "percentage": 3.7, "elapsed_time": "2:36:08", "remaining_time": "2 days, 19:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 9627, "loss": 1.803, "learning_rate": 9.966107548107074e-05, "epoch": 0.03708320349018386, "percentage": 3.71, "elapsed_time": "2:36:35", "remaining_time": "2 days, 19:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 9627, "loss": 1.9305, "learning_rate": 9.96591762480537e-05, "epoch": 0.0371870780097642, "percentage": 3.72, "elapsed_time": "2:37:01", "remaining_time": "2 days, 19:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 9627, "loss": 1.781, "learning_rate": 9.965727172672174e-05, "epoch": 0.03729095252934455, "percentage": 3.73, "elapsed_time": "2:37:29", "remaining_time": "2 days, 19:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 9627, "loss": 1.886, "learning_rate": 9.965536191727769e-05, "epoch": 0.0373948270489249, "percentage": 3.74, "elapsed_time": "2:37:56", "remaining_time": "2 days, 19:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 9627, "loss": 1.8182, "learning_rate": 9.965344681992491e-05, "epoch": 0.037498701568505245, "percentage": 3.75, "elapsed_time": "2:38:23", "remaining_time": "2 days, 19:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 9627, "loss": 1.8175, "learning_rate": 9.965152643486738e-05, "epoch": 0.03760257608808559, "percentage": 3.76, "elapsed_time": "2:38:49", "remaining_time": "2 days, 19:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 9627, "loss": 1.7128, "learning_rate": 9.964960076230955e-05, "epoch": 0.03770645060766594, "percentage": 3.77, "elapsed_time": "2:39:17", "remaining_time": "2 days, 19:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 9627, "loss": 1.8029, "learning_rate": 9.964766980245653e-05, "epoch": 0.03781032512724629, "percentage": 3.78, "elapsed_time": "2:39:44", "remaining_time": "2 days, 19:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 9627, "loss": 1.6429, "learning_rate": 9.964573355551394e-05, "epoch": 0.037914199646826637, "percentage": 3.79, "elapsed_time": "2:40:11", "remaining_time": "2 days, 19:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 9627, "loss": 1.9152, "learning_rate": 9.964379202168799e-05, "epoch": 0.03801807416640698, "percentage": 3.8, "elapsed_time": "2:40:38", "remaining_time": "2 days, 19:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 9627, "loss": 1.7536, "learning_rate": 9.964184520118542e-05, "epoch": 0.038121948685987325, "percentage": 3.81, "elapsed_time": "2:41:06", "remaining_time": "2 days, 19:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 9627, "loss": 1.7626, "learning_rate": 9.963989309421356e-05, "epoch": 0.03822582320556767, "percentage": 3.82, "elapsed_time": "2:41:32", "remaining_time": "2 days, 19:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 9627, "loss": 1.822, "learning_rate": 9.96379357009803e-05, "epoch": 0.03832969772514802, "percentage": 3.83, "elapsed_time": "2:42:00", "remaining_time": "2 days, 19:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 9627, "loss": 1.7122, "learning_rate": 9.963597302169406e-05, "epoch": 0.03843357224472837, "percentage": 3.84, "elapsed_time": "2:42:26", "remaining_time": "2 days, 19:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 9627, "loss": 1.8249, "learning_rate": 9.963400505656388e-05, "epoch": 0.038537446764308717, "percentage": 3.85, "elapsed_time": "2:42:54", "remaining_time": "2 days, 19:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 9627, "loss": 2.1094, "learning_rate": 9.963203180579932e-05, "epoch": 0.038641321283889064, "percentage": 3.86, "elapsed_time": "2:43:20", "remaining_time": "2 days, 19:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 9627, "loss": 1.8247, "learning_rate": 9.963005326961052e-05, "epoch": 0.03874519580346941, "percentage": 3.87, "elapsed_time": "2:43:47", "remaining_time": "2 days, 19:43:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 9627, "loss": 2.1071, "learning_rate": 9.962806944820817e-05, "epoch": 0.03884907032304975, "percentage": 3.88, "elapsed_time": "2:44:15", "remaining_time": "2 days, 19:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 9627, "loss": 1.8242, "learning_rate": 9.962608034180353e-05, "epoch": 0.0389529448426301, "percentage": 3.9, "elapsed_time": "2:44:41", "remaining_time": "2 days, 19:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 9627, "loss": 2.0001, "learning_rate": 9.962408595060845e-05, "epoch": 0.03905681936221045, "percentage": 3.91, "elapsed_time": "2:45:09", "remaining_time": "2 days, 19:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 9627, "loss": 1.8534, "learning_rate": 9.962208627483529e-05, "epoch": 0.039160693881790797, "percentage": 3.92, "elapsed_time": "2:45:36", "remaining_time": "2 days, 19:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 9627, "loss": 1.6624, "learning_rate": 9.962008131469703e-05, "epoch": 0.039264568401371144, "percentage": 3.93, "elapsed_time": "2:46:02", "remaining_time": "2 days, 19:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 9627, "loss": 1.7612, "learning_rate": 9.961807107040712e-05, "epoch": 0.03936844292095149, "percentage": 3.94, "elapsed_time": "2:46:30", "remaining_time": "2 days, 19:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 9627, "loss": 1.8432, "learning_rate": 9.96160555421797e-05, "epoch": 0.03947231744053184, "percentage": 3.95, "elapsed_time": "2:46:56", "remaining_time": "2 days, 19:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 9627, "loss": 1.8842, "learning_rate": 9.961403473022939e-05, "epoch": 0.03957619196011219, "percentage": 3.96, "elapsed_time": "2:47:24", "remaining_time": "2 days, 19:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 9627, "loss": 2.0091, "learning_rate": 9.961200863477139e-05, "epoch": 0.03968006647969253, "percentage": 3.97, "elapsed_time": "2:47:51", "remaining_time": "2 days, 19:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 9627, "loss": 1.8124, "learning_rate": 9.960997725602144e-05, "epoch": 0.039783940999272877, "percentage": 3.98, "elapsed_time": "2:48:18", "remaining_time": "2 days, 19:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 9627, "loss": 1.9146, "learning_rate": 9.96079405941959e-05, "epoch": 0.039887815518853224, "percentage": 3.99, "elapsed_time": "2:48:45", "remaining_time": "2 days, 19:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 9627, "loss": 1.8714, "learning_rate": 9.960589864951162e-05, "epoch": 0.03999169003843357, "percentage": 4.0, "elapsed_time": "2:49:12", "remaining_time": "2 days, 19:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 9627, "loss": 1.8268, "learning_rate": 9.960385142218609e-05, "epoch": 0.04009556455801392, "percentage": 4.01, "elapsed_time": "2:49:40", "remaining_time": "2 days, 19:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 9627, "loss": 1.6027, "learning_rate": 9.960179891243731e-05, "epoch": 0.04019943907759427, "percentage": 4.02, "elapsed_time": "2:50:07", "remaining_time": "2 days, 19:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 9627, "loss": 1.9221, "learning_rate": 9.959974112048386e-05, "epoch": 0.040303313597174616, "percentage": 4.03, "elapsed_time": "2:50:33", "remaining_time": "2 days, 19:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 9627, "loss": 1.8234, "learning_rate": 9.959767804654487e-05, "epoch": 0.040407188116754963, "percentage": 4.04, "elapsed_time": "2:51:01", "remaining_time": "2 days, 19:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 9627, "loss": 1.9483, "learning_rate": 9.959560969084003e-05, "epoch": 0.040511062636335304, "percentage": 4.05, "elapsed_time": "2:51:29", "remaining_time": "2 days, 19:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 9627, "loss": 1.7024, "learning_rate": 9.959353605358964e-05, "epoch": 0.04061493715591565, "percentage": 4.06, "elapsed_time": "2:51:55", "remaining_time": "2 days, 19:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 9627, "loss": 1.884, "learning_rate": 9.95914571350145e-05, "epoch": 0.040718811675496, "percentage": 4.07, "elapsed_time": "2:52:23", "remaining_time": "2 days, 19:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 9627, "loss": 1.8548, "learning_rate": 9.958937293533599e-05, "epoch": 0.04082268619507635, "percentage": 4.08, "elapsed_time": "2:52:50", "remaining_time": "2 days, 19:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 9627, "loss": 2.0568, "learning_rate": 9.958728345477608e-05, "epoch": 0.040926560714656696, "percentage": 4.09, "elapsed_time": "2:53:17", "remaining_time": "2 days, 19:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 9627, "loss": 1.7908, "learning_rate": 9.958518869355728e-05, "epoch": 0.041030435234237043, "percentage": 4.1, "elapsed_time": "2:53:43", "remaining_time": "2 days, 19:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 9627, "loss": 1.8225, "learning_rate": 9.958308865190267e-05, "epoch": 0.04113430975381739, "percentage": 4.11, "elapsed_time": "2:54:10", "remaining_time": "2 days, 19:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 9627, "loss": 1.7719, "learning_rate": 9.958098333003588e-05, "epoch": 0.04123818427339773, "percentage": 4.12, "elapsed_time": "2:54:37", "remaining_time": "2 days, 19:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 9627, "loss": 1.9513, "learning_rate": 9.957887272818112e-05, "epoch": 0.04134205879297808, "percentage": 4.13, "elapsed_time": "2:55:05", "remaining_time": "2 days, 19:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 9627, "loss": 1.8509, "learning_rate": 9.957675684656312e-05, "epoch": 0.04144593331255843, "percentage": 4.14, "elapsed_time": "2:55:31", "remaining_time": "2 days, 19:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 9627, "loss": 1.8173, "learning_rate": 9.957463568540725e-05, "epoch": 0.041549807832138776, "percentage": 4.15, "elapsed_time": "2:56:00", "remaining_time": "2 days, 19:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 9627, "loss": 1.8059, "learning_rate": 9.957250924493938e-05, "epoch": 0.041653682351719123, "percentage": 4.17, "elapsed_time": "2:56:26", "remaining_time": "2 days, 19:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 9627, "loss": 1.9456, "learning_rate": 9.957037752538592e-05, "epoch": 0.04175755687129947, "percentage": 4.18, "elapsed_time": "2:56:53", "remaining_time": "2 days, 19:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 9627, "loss": 1.7831, "learning_rate": 9.956824052697395e-05, "epoch": 0.04186143139087982, "percentage": 4.19, "elapsed_time": "2:57:20", "remaining_time": "2 days, 19:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 9627, "loss": 1.791, "learning_rate": 9.956609824993099e-05, "epoch": 0.04196530591046017, "percentage": 4.2, "elapsed_time": "2:57:48", "remaining_time": "2 days, 19:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 9627, "loss": 1.8728, "learning_rate": 9.956395069448523e-05, "epoch": 0.04206918043004051, "percentage": 4.21, "elapsed_time": "2:58:15", "remaining_time": "2 days, 19:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 9627, "loss": 1.8004, "learning_rate": 9.95617978608653e-05, "epoch": 0.042173054949620856, "percentage": 4.22, "elapsed_time": "2:58:42", "remaining_time": "2 days, 19:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 9627, "loss": 1.7891, "learning_rate": 9.955963974930052e-05, "epoch": 0.042276929469201203, "percentage": 4.23, "elapsed_time": "2:59:08", "remaining_time": "2 days, 19:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 9627, "loss": 1.9755, "learning_rate": 9.955747636002068e-05, "epoch": 0.04238080398878155, "percentage": 4.24, "elapsed_time": "2:59:36", "remaining_time": "2 days, 19:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 9627, "loss": 1.6478, "learning_rate": 9.955530769325616e-05, "epoch": 0.0424846785083619, "percentage": 4.25, "elapsed_time": "3:00:03", "remaining_time": "2 days, 19:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 9627, "loss": 1.9403, "learning_rate": 9.955313374923791e-05, "epoch": 0.04258855302794225, "percentage": 4.26, "elapsed_time": "3:00:29", "remaining_time": "2 days, 19:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 9627, "loss": 2.0413, "learning_rate": 9.955095452819747e-05, "epoch": 0.042692427547522595, "percentage": 4.27, "elapsed_time": "3:00:56", "remaining_time": "2 days, 19:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 9627, "loss": 1.6253, "learning_rate": 9.954877003036687e-05, "epoch": 0.04279630206710294, "percentage": 4.28, "elapsed_time": "3:01:24", "remaining_time": "2 days, 19:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 9627, "loss": 2.1789, "learning_rate": 9.954658025597876e-05, "epoch": 0.042900176586683283, "percentage": 4.29, "elapsed_time": "3:01:50", "remaining_time": "2 days, 19:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 9627, "loss": 1.4562, "learning_rate": 9.954438520526635e-05, "epoch": 0.04300405110626363, "percentage": 4.3, "elapsed_time": "3:02:17", "remaining_time": "2 days, 19:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 9627, "loss": 1.7904, "learning_rate": 9.954218487846334e-05, "epoch": 0.04310792562584398, "percentage": 4.31, "elapsed_time": "3:02:44", "remaining_time": "2 days, 19:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 9627, "loss": 1.8548, "learning_rate": 9.953997927580411e-05, "epoch": 0.04321180014542433, "percentage": 4.32, "elapsed_time": "3:03:12", "remaining_time": "2 days, 19:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 9627, "loss": 1.7331, "learning_rate": 9.953776839752351e-05, "epoch": 0.043315674665004675, "percentage": 4.33, "elapsed_time": "3:03:39", "remaining_time": "2 days, 19:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 9627, "loss": 1.883, "learning_rate": 9.953555224385698e-05, "epoch": 0.04341954918458502, "percentage": 4.34, "elapsed_time": "3:04:06", "remaining_time": "2 days, 19:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 9627, "loss": 1.6892, "learning_rate": 9.953333081504052e-05, "epoch": 0.04352342370416537, "percentage": 4.35, "elapsed_time": "3:04:33", "remaining_time": "2 days, 19:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 9627, "loss": 1.734, "learning_rate": 9.953110411131072e-05, "epoch": 0.04362729822374572, "percentage": 4.36, "elapsed_time": "3:05:00", "remaining_time": "2 days, 19:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 9627, "loss": 1.8173, "learning_rate": 9.952887213290469e-05, "epoch": 0.04373117274332606, "percentage": 4.37, "elapsed_time": "3:05:28", "remaining_time": "2 days, 19:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 9627, "loss": 1.9877, "learning_rate": 9.952663488006011e-05, "epoch": 0.04383504726290641, "percentage": 4.38, "elapsed_time": "3:05:55", "remaining_time": "2 days, 19:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 9627, "loss": 1.8042, "learning_rate": 9.952439235301522e-05, "epoch": 0.043938921782486755, "percentage": 4.39, "elapsed_time": "3:06:22", "remaining_time": "2 days, 19:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 9627, "loss": 1.7833, "learning_rate": 9.952214455200887e-05, "epoch": 0.0440427963020671, "percentage": 4.4, "elapsed_time": "3:06:50", "remaining_time": "2 days, 19:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 9627, "loss": 1.9778, "learning_rate": 9.951989147728043e-05, "epoch": 0.04414667082164745, "percentage": 4.41, "elapsed_time": "3:07:17", "remaining_time": "2 days, 19:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 9627, "loss": 1.8447, "learning_rate": 9.951763312906979e-05, "epoch": 0.0442505453412278, "percentage": 4.43, "elapsed_time": "3:07:44", "remaining_time": "2 days, 19:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 9627, "loss": 1.6772, "learning_rate": 9.951536950761748e-05, "epoch": 0.044354419860808146, "percentage": 4.44, "elapsed_time": "3:08:11", "remaining_time": "2 days, 19:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 9627, "loss": 1.8328, "learning_rate": 9.951310061316455e-05, "epoch": 0.044458294380388494, "percentage": 4.45, "elapsed_time": "3:08:38", "remaining_time": "2 days, 19:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 9627, "loss": 1.8814, "learning_rate": 9.951082644595264e-05, "epoch": 0.044562168899968835, "percentage": 4.46, "elapsed_time": "3:09:05", "remaining_time": "2 days, 19:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 9627, "loss": 1.8108, "learning_rate": 9.95085470062239e-05, "epoch": 0.04466604341954918, "percentage": 4.47, "elapsed_time": "3:09:32", "remaining_time": "2 days, 19:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 9627, "loss": 1.7423, "learning_rate": 9.950626229422107e-05, "epoch": 0.04476991793912953, "percentage": 4.48, "elapsed_time": "3:10:00", "remaining_time": "2 days, 19:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 9627, "loss": 1.7873, "learning_rate": 9.950397231018748e-05, "epoch": 0.04487379245870988, "percentage": 4.49, "elapsed_time": "3:10:26", "remaining_time": "2 days, 19:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 9627, "loss": 1.9949, "learning_rate": 9.950167705436699e-05, "epoch": 0.044977666978290226, "percentage": 4.5, "elapsed_time": "3:10:54", "remaining_time": "2 days, 19:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 9627, "loss": 1.5736, "learning_rate": 9.949937652700402e-05, "epoch": 0.045081541497870574, "percentage": 4.51, "elapsed_time": "3:11:21", "remaining_time": "2 days, 19:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 9627, "loss": 1.7662, "learning_rate": 9.949707072834356e-05, "epoch": 0.04518541601745092, "percentage": 4.52, "elapsed_time": "3:11:48", "remaining_time": "2 days, 19:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 9627, "loss": 1.8209, "learning_rate": 9.949475965863116e-05, "epoch": 0.04528929053703127, "percentage": 4.53, "elapsed_time": "3:12:15", "remaining_time": "2 days, 19:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 9627, "loss": 2.1643, "learning_rate": 9.949244331811293e-05, "epoch": 0.04539316505661161, "percentage": 4.54, "elapsed_time": "3:12:43", "remaining_time": "2 days, 19:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 9627, "loss": 1.8557, "learning_rate": 9.949012170703556e-05, "epoch": 0.04549703957619196, "percentage": 4.55, "elapsed_time": "3:13:10", "remaining_time": "2 days, 19:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 9627, "loss": 1.7119, "learning_rate": 9.948779482564624e-05, "epoch": 0.045600914095772306, "percentage": 4.56, "elapsed_time": "3:13:37", "remaining_time": "2 days, 19:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 9627, "loss": 1.8411, "learning_rate": 9.948546267419278e-05, "epoch": 0.045704788615352654, "percentage": 4.57, "elapsed_time": "3:14:05", "remaining_time": "2 days, 19:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 9627, "loss": 1.7674, "learning_rate": 9.948312525292358e-05, "epoch": 0.045808663134933, "percentage": 4.58, "elapsed_time": "3:14:31", "remaining_time": "2 days, 19:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 9627, "loss": 1.9521, "learning_rate": 9.948078256208751e-05, "epoch": 0.04591253765451335, "percentage": 4.59, "elapsed_time": "3:14:59", "remaining_time": "2 days, 19:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 9627, "loss": 1.9358, "learning_rate": 9.947843460193407e-05, "epoch": 0.0460164121740937, "percentage": 4.6, "elapsed_time": "3:15:27", "remaining_time": "2 days, 19:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 9627, "loss": 1.8426, "learning_rate": 9.947608137271328e-05, "epoch": 0.046120286693674045, "percentage": 4.61, "elapsed_time": "3:15:54", "remaining_time": "2 days, 19:31:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 9627, "loss": 1.7263, "learning_rate": 9.947372287467576e-05, "epoch": 0.046224161213254386, "percentage": 4.62, "elapsed_time": "3:16:20", "remaining_time": "2 days, 19:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 9627, "loss": 1.9716, "learning_rate": 9.947135910807265e-05, "epoch": 0.046328035732834734, "percentage": 4.63, "elapsed_time": "3:16:49", "remaining_time": "2 days, 19:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 9627, "loss": 1.7952, "learning_rate": 9.946899007315569e-05, "epoch": 0.04643191025241508, "percentage": 4.64, "elapsed_time": "3:17:16", "remaining_time": "2 days, 19:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 9627, "loss": 1.8804, "learning_rate": 9.946661577017717e-05, "epoch": 0.04653578477199543, "percentage": 4.65, "elapsed_time": "3:17:43", "remaining_time": "2 days, 19:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 9627, "loss": 2.0071, "learning_rate": 9.946423619938992e-05, "epoch": 0.04663965929157578, "percentage": 4.66, "elapsed_time": "3:18:11", "remaining_time": "2 days, 19:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 9627, "loss": 1.6811, "learning_rate": 9.946185136104735e-05, "epoch": 0.046743533811156125, "percentage": 4.67, "elapsed_time": "3:18:37", "remaining_time": "2 days, 19:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 9627, "loss": 1.7127, "learning_rate": 9.945946125540343e-05, "epoch": 0.04684740833073647, "percentage": 4.68, "elapsed_time": "3:19:05", "remaining_time": "2 days, 19:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 9627, "loss": 1.7116, "learning_rate": 9.945706588271269e-05, "epoch": 0.046951282850316814, "percentage": 4.7, "elapsed_time": "3:19:32", "remaining_time": "2 days, 19:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 9627, "loss": 1.7475, "learning_rate": 9.94546652432302e-05, "epoch": 0.04705515736989716, "percentage": 4.71, "elapsed_time": "3:19:59", "remaining_time": "2 days, 19:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 9627, "loss": 1.7588, "learning_rate": 9.945225933721163e-05, "epoch": 0.04715903188947751, "percentage": 4.72, "elapsed_time": "3:20:27", "remaining_time": "2 days, 19:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 9627, "loss": 1.6391, "learning_rate": 9.944984816491318e-05, "epoch": 0.04726290640905786, "percentage": 4.73, "elapsed_time": "3:20:54", "remaining_time": "2 days, 19:29:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 9627, "loss": 1.7689, "learning_rate": 9.944743172659164e-05, "epoch": 0.047366780928638205, "percentage": 4.74, "elapsed_time": "3:21:21", "remaining_time": "2 days, 19:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 9627, "loss": 1.6911, "learning_rate": 9.94450100225043e-05, "epoch": 0.04747065544821855, "percentage": 4.75, "elapsed_time": "3:21:49", "remaining_time": "2 days, 19:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 9627, "loss": 1.949, "learning_rate": 9.944258305290908e-05, "epoch": 0.0475745299677989, "percentage": 4.76, "elapsed_time": "3:22:16", "remaining_time": "2 days, 19:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 9627, "loss": 1.9012, "learning_rate": 9.944015081806445e-05, "epoch": 0.04767840448737925, "percentage": 4.77, "elapsed_time": "3:22:44", "remaining_time": "2 days, 19:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 9627, "loss": 2.0238, "learning_rate": 9.94377133182294e-05, "epoch": 0.04778227900695959, "percentage": 4.78, "elapsed_time": "3:23:11", "remaining_time": "2 days, 19:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 9627, "loss": 1.7753, "learning_rate": 9.943527055366351e-05, "epoch": 0.04788615352653994, "percentage": 4.79, "elapsed_time": "3:23:38", "remaining_time": "2 days, 19:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 9627, "loss": 1.7137, "learning_rate": 9.94328225246269e-05, "epoch": 0.047990028046120285, "percentage": 4.8, "elapsed_time": "3:24:05", "remaining_time": "2 days, 19:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 9627, "loss": 1.7599, "learning_rate": 9.943036923138032e-05, "epoch": 0.04809390256570063, "percentage": 4.81, "elapsed_time": "3:24:33", "remaining_time": "2 days, 19:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 9627, "loss": 1.7868, "learning_rate": 9.942791067418496e-05, "epoch": 0.04819777708528098, "percentage": 4.82, "elapsed_time": "3:25:00", "remaining_time": "2 days, 19:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 9627, "loss": 1.93, "learning_rate": 9.942544685330267e-05, "epoch": 0.04830165160486133, "percentage": 4.83, "elapsed_time": "3:25:27", "remaining_time": "2 days, 19:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 9627, "loss": 1.9025, "learning_rate": 9.942297776899583e-05, "epoch": 0.048405526124441677, "percentage": 4.84, "elapsed_time": "3:25:56", "remaining_time": "2 days, 19:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 9627, "loss": 1.7295, "learning_rate": 9.942050342152736e-05, "epoch": 0.048509400644022024, "percentage": 4.85, "elapsed_time": "3:26:22", "remaining_time": "2 days, 19:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 9627, "loss": 1.5522, "learning_rate": 9.941802381116078e-05, "epoch": 0.048613275163602365, "percentage": 4.86, "elapsed_time": "3:26:50", "remaining_time": "2 days, 19:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 9627, "loss": 1.7374, "learning_rate": 9.941553893816014e-05, "epoch": 0.04871714968318271, "percentage": 4.87, "elapsed_time": "3:27:18", "remaining_time": "2 days, 19:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 9627, "loss": 1.7781, "learning_rate": 9.941304880279005e-05, "epoch": 0.04882102420276306, "percentage": 4.88, "elapsed_time": "3:27:45", "remaining_time": "2 days, 19:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 9627, "loss": 1.9754, "learning_rate": 9.941055340531571e-05, "epoch": 0.04892489872234341, "percentage": 4.89, "elapsed_time": "3:28:13", "remaining_time": "2 days, 19:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 9627, "loss": 1.8484, "learning_rate": 9.940805274600285e-05, "epoch": 0.049028773241923757, "percentage": 4.9, "elapsed_time": "3:28:40", "remaining_time": "2 days, 19:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 9627, "loss": 1.9061, "learning_rate": 9.940554682511775e-05, "epoch": 0.049132647761504104, "percentage": 4.91, "elapsed_time": "3:29:08", "remaining_time": "2 days, 19:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 9627, "loss": 1.759, "learning_rate": 9.940303564292731e-05, "epoch": 0.04923652228108445, "percentage": 4.92, "elapsed_time": "3:29:35", "remaining_time": "2 days, 19:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 9627, "loss": 1.8638, "learning_rate": 9.940051919969893e-05, "epoch": 0.0493403968006648, "percentage": 4.93, "elapsed_time": "3:30:02", "remaining_time": "2 days, 19:26:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 9627, "loss": 1.9465, "learning_rate": 9.939799749570059e-05, "epoch": 0.04944427132024514, "percentage": 4.94, "elapsed_time": "3:30:30", "remaining_time": "2 days, 19:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 9627, "loss": 1.8029, "learning_rate": 9.939547053120084e-05, "epoch": 0.04954814583982549, "percentage": 4.95, "elapsed_time": "3:30:57", "remaining_time": "2 days, 19:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 9627, "loss": 1.6021, "learning_rate": 9.939293830646878e-05, "epoch": 0.049652020359405837, "percentage": 4.97, "elapsed_time": "3:31:25", "remaining_time": "2 days, 19:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 9627, "loss": 1.9107, "learning_rate": 9.939040082177407e-05, "epoch": 0.049755894878986184, "percentage": 4.98, "elapsed_time": "3:31:52", "remaining_time": "2 days, 19:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 9627, "loss": 2.0531, "learning_rate": 9.938785807738693e-05, "epoch": 0.04985976939856653, "percentage": 4.99, "elapsed_time": "3:32:20", "remaining_time": "2 days, 19:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 9627, "loss": 1.9953, "learning_rate": 9.938531007357813e-05, "epoch": 0.04996364391814688, "percentage": 5.0, "elapsed_time": "3:32:47", "remaining_time": "2 days, 19:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 9627, "loss": 1.75, "learning_rate": 9.938275681061903e-05, "epoch": 0.05006751843772723, "percentage": 5.01, "elapsed_time": "3:33:15", "remaining_time": "2 days, 19:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 9627, "loss": 1.9639, "learning_rate": 9.938019828878155e-05, "epoch": 0.050171392957307576, "percentage": 5.02, "elapsed_time": "3:33:42", "remaining_time": "2 days, 19:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 9627, "loss": 1.8305, "learning_rate": 9.937763450833813e-05, "epoch": 0.050275267476887917, "percentage": 5.03, "elapsed_time": "3:34:10", "remaining_time": "2 days, 19:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 9627, "loss": 1.8667, "learning_rate": 9.93750654695618e-05, "epoch": 0.050379141996468264, "percentage": 5.04, "elapsed_time": "3:34:36", "remaining_time": "2 days, 19:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 9627, "loss": 1.8097, "learning_rate": 9.937249117272612e-05, "epoch": 0.05048301651604861, "percentage": 5.05, "elapsed_time": "3:35:05", "remaining_time": "2 days, 19:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 9627, "loss": 1.872, "learning_rate": 9.936991161810525e-05, "epoch": 0.05058689103562896, "percentage": 5.06, "elapsed_time": "3:35:32", "remaining_time": "2 days, 19:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 9627, "loss": 1.777, "learning_rate": 9.93673268059739e-05, "epoch": 0.05069076555520931, "percentage": 5.07, "elapsed_time": "3:35:59", "remaining_time": "2 days, 19:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 9627, "loss": 1.8364, "learning_rate": 9.936473673660733e-05, "epoch": 0.050794640074789656, "percentage": 5.08, "elapsed_time": "3:36:26", "remaining_time": "2 days, 19:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 9627, "loss": 1.7858, "learning_rate": 9.936214141028135e-05, "epoch": 0.050898514594370003, "percentage": 5.09, "elapsed_time": "3:36:55", "remaining_time": "2 days, 19:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 9627, "loss": 2.1136, "learning_rate": 9.935954082727235e-05, "epoch": 0.05100238911395035, "percentage": 5.1, "elapsed_time": "3:37:22", "remaining_time": "2 days, 19:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 9627, "loss": 1.8873, "learning_rate": 9.935693498785728e-05, "epoch": 0.05110626363353069, "percentage": 5.11, "elapsed_time": "3:37:48", "remaining_time": "2 days, 19:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 9627, "loss": 1.6858, "learning_rate": 9.93543238923136e-05, "epoch": 0.05121013815311104, "percentage": 5.12, "elapsed_time": "3:38:16", "remaining_time": "2 days, 19:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 9627, "loss": 1.8528, "learning_rate": 9.935170754091945e-05, "epoch": 0.05131401267269139, "percentage": 5.13, "elapsed_time": "3:38:44", "remaining_time": "2 days, 19:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 9627, "loss": 1.7657, "learning_rate": 9.934908593395338e-05, "epoch": 0.051417887192271736, "percentage": 5.14, "elapsed_time": "3:39:11", "remaining_time": "2 days, 19:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 9627, "loss": 1.7152, "learning_rate": 9.934645907169459e-05, "epoch": 0.051521761711852083, "percentage": 5.15, "elapsed_time": "3:39:40", "remaining_time": "2 days, 19:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 9627, "loss": 1.6483, "learning_rate": 9.934382695442284e-05, "epoch": 0.05162563623143243, "percentage": 5.16, "elapsed_time": "3:40:06", "remaining_time": "2 days, 19:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 9627, "loss": 1.8188, "learning_rate": 9.934118958241842e-05, "epoch": 0.05172951075101278, "percentage": 5.17, "elapsed_time": "3:40:35", "remaining_time": "2 days, 19:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 9627, "loss": 1.6657, "learning_rate": 9.933854695596216e-05, "epoch": 0.05183338527059313, "percentage": 5.18, "elapsed_time": "3:41:02", "remaining_time": "2 days, 19:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 9627, "loss": 1.7714, "learning_rate": 9.933589907533554e-05, "epoch": 0.05193725979017347, "percentage": 5.19, "elapsed_time": "3:41:30", "remaining_time": "2 days, 19:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 9627, "loss": 1.9087, "learning_rate": 9.933324594082048e-05, "epoch": 0.052041134309753816, "percentage": 5.2, "elapsed_time": "3:41:57", "remaining_time": "2 days, 19:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 9627, "loss": 1.8386, "learning_rate": 9.933058755269955e-05, "epoch": 0.052145008829334163, "percentage": 5.21, "elapsed_time": "3:42:24", "remaining_time": "2 days, 19:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 9627, "loss": 1.7782, "learning_rate": 9.932792391125583e-05, "epoch": 0.05224888334891451, "percentage": 5.22, "elapsed_time": "3:42:53", "remaining_time": "2 days, 19:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 9627, "loss": 1.8822, "learning_rate": 9.932525501677299e-05, "epoch": 0.05235275786849486, "percentage": 5.24, "elapsed_time": "3:43:20", "remaining_time": "2 days, 19:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 9627, "loss": 1.8777, "learning_rate": 9.932258086953525e-05, "epoch": 0.05245663238807521, "percentage": 5.25, "elapsed_time": "3:43:48", "remaining_time": "2 days, 19:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 9627, "loss": 1.6693, "learning_rate": 9.931990146982736e-05, "epoch": 0.052560506907655555, "percentage": 5.26, "elapsed_time": "3:44:15", "remaining_time": "2 days, 19:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 9627, "loss": 1.6766, "learning_rate": 9.931721681793468e-05, "epoch": 0.052664381427235896, "percentage": 5.27, "elapsed_time": "3:44:42", "remaining_time": "2 days, 19:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 9627, "loss": 1.9316, "learning_rate": 9.931452691414311e-05, "epoch": 0.052768255946816243, "percentage": 5.28, "elapsed_time": "3:45:11", "remaining_time": "2 days, 19:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 9627, "loss": 1.9157, "learning_rate": 9.93118317587391e-05, "epoch": 0.05287213046639659, "percentage": 5.29, "elapsed_time": "3:45:38", "remaining_time": "2 days, 19:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 9627, "loss": 1.718, "learning_rate": 9.930913135200963e-05, "epoch": 0.05297600498597694, "percentage": 5.3, "elapsed_time": "3:46:05", "remaining_time": "2 days, 19:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 9627, "loss": 1.7702, "learning_rate": 9.930642569424231e-05, "epoch": 0.05307987950555729, "percentage": 5.31, "elapsed_time": "3:46:34", "remaining_time": "2 days, 19:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 9627, "loss": 1.6665, "learning_rate": 9.930371478572526e-05, "epoch": 0.053183754025137635, "percentage": 5.32, "elapsed_time": "3:47:01", "remaining_time": "2 days, 19:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 9627, "loss": 1.7484, "learning_rate": 9.930099862674716e-05, "epoch": 0.05328762854471798, "percentage": 5.33, "elapsed_time": "3:47:28", "remaining_time": "2 days, 19:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 9627, "loss": 1.9197, "learning_rate": 9.929827721759728e-05, "epoch": 0.05339150306429833, "percentage": 5.34, "elapsed_time": "3:47:57", "remaining_time": "2 days, 19:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 9627, "loss": 1.8467, "learning_rate": 9.92955505585654e-05, "epoch": 0.05349537758387867, "percentage": 5.35, "elapsed_time": "3:48:24", "remaining_time": "2 days, 19:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 9627, "loss": 1.8709, "learning_rate": 9.929281864994193e-05, "epoch": 0.05359925210345902, "percentage": 5.36, "elapsed_time": "3:48:53", "remaining_time": "2 days, 19:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 9627, "loss": 1.9486, "learning_rate": 9.929008149201774e-05, "epoch": 0.05370312662303937, "percentage": 5.37, "elapsed_time": "3:49:20", "remaining_time": "2 days, 19:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 9627, "loss": 1.7749, "learning_rate": 9.928733908508438e-05, "epoch": 0.053807001142619715, "percentage": 5.38, "elapsed_time": "3:49:48", "remaining_time": "2 days, 19:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 9627, "loss": 1.8424, "learning_rate": 9.928459142943385e-05, "epoch": 0.05391087566220006, "percentage": 5.39, "elapsed_time": "3:50:16", "remaining_time": "2 days, 19:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 9627, "loss": 1.8719, "learning_rate": 9.928183852535877e-05, "epoch": 0.05401475018178041, "percentage": 5.4, "elapsed_time": "3:50:44", "remaining_time": "2 days, 19:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 9627, "loss": 1.8434, "learning_rate": 9.92790803731523e-05, "epoch": 0.05411862470136076, "percentage": 5.41, "elapsed_time": "3:51:12", "remaining_time": "2 days, 19:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 9627, "loss": 1.9473, "learning_rate": 9.927631697310816e-05, "epoch": 0.054222499220941106, "percentage": 5.42, "elapsed_time": "3:51:39", "remaining_time": "2 days, 19:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 9627, "loss": 1.9063, "learning_rate": 9.927354832552063e-05, "epoch": 0.05432637374052145, "percentage": 5.43, "elapsed_time": "3:52:07", "remaining_time": "2 days, 19:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 9627, "loss": 1.7318, "learning_rate": 9.927077443068455e-05, "epoch": 0.054430248260101795, "percentage": 5.44, "elapsed_time": "3:52:35", "remaining_time": "2 days, 19:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 9627, "loss": 1.8991, "learning_rate": 9.926799528889534e-05, "epoch": 0.05453412277968214, "percentage": 5.45, "elapsed_time": "3:53:02", "remaining_time": "2 days, 19:20:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 9627, "loss": 2.1391, "learning_rate": 9.926521090044891e-05, "epoch": 0.05463799729926249, "percentage": 5.46, "elapsed_time": "3:53:30", "remaining_time": "2 days, 19:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 9627, "loss": 1.8072, "learning_rate": 9.926242126564182e-05, "epoch": 0.05474187181884284, "percentage": 5.47, "elapsed_time": "3:53:58", "remaining_time": "2 days, 19:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 9627, "loss": 1.7599, "learning_rate": 9.925962638477113e-05, "epoch": 0.054845746338423186, "percentage": 5.48, "elapsed_time": "3:54:26", "remaining_time": "2 days, 19:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 9627, "loss": 1.7878, "learning_rate": 9.925682625813446e-05, "epoch": 0.054949620858003534, "percentage": 5.49, "elapsed_time": "3:54:54", "remaining_time": "2 days, 19:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 9627, "loss": 1.7764, "learning_rate": 9.925402088603e-05, "epoch": 0.05505349537758388, "percentage": 5.51, "elapsed_time": "3:55:21", "remaining_time": "2 days, 19:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 9627, "loss": 1.7976, "learning_rate": 9.925121026875654e-05, "epoch": 0.05515736989716422, "percentage": 5.52, "elapsed_time": "3:55:49", "remaining_time": "2 days, 19:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 9627, "loss": 1.8439, "learning_rate": 9.924839440661334e-05, "epoch": 0.05526124441674457, "percentage": 5.53, "elapsed_time": "3:56:17", "remaining_time": "2 days, 19:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 9627, "loss": 1.9871, "learning_rate": 9.92455732999003e-05, "epoch": 0.05536511893632492, "percentage": 5.54, "elapsed_time": "3:56:43", "remaining_time": "2 days, 19:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 9627, "loss": 1.7941, "learning_rate": 9.924274694891782e-05, "epoch": 0.055468993455905266, "percentage": 5.55, "elapsed_time": "3:57:12", "remaining_time": "2 days, 19:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 9627, "loss": 1.7015, "learning_rate": 9.92399153539669e-05, "epoch": 0.055572867975485614, "percentage": 5.56, "elapsed_time": "3:57:39", "remaining_time": "2 days, 19:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 9627, "loss": 1.791, "learning_rate": 9.923707851534909e-05, "epoch": 0.05567674249506596, "percentage": 5.57, "elapsed_time": "3:58:08", "remaining_time": "2 days, 19:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 9627, "loss": 1.7576, "learning_rate": 9.923423643336648e-05, "epoch": 0.05578061701464631, "percentage": 5.58, "elapsed_time": "3:58:34", "remaining_time": "2 days, 19:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 9627, "loss": 1.963, "learning_rate": 9.923138910832172e-05, "epoch": 0.05588449153422666, "percentage": 5.59, "elapsed_time": "3:59:03", "remaining_time": "2 days, 19:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 9627, "loss": 1.6796, "learning_rate": 9.922853654051806e-05, "epoch": 0.055988366053807, "percentage": 5.6, "elapsed_time": "3:59:29", "remaining_time": "2 days, 19:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 9627, "loss": 1.7261, "learning_rate": 9.922567873025924e-05, "epoch": 0.056092240573387346, "percentage": 5.61, "elapsed_time": "3:59:58", "remaining_time": "2 days, 19:18:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 9627, "loss": 1.825, "learning_rate": 9.922281567784961e-05, "epoch": 0.056196115092967694, "percentage": 5.62, "elapsed_time": "4:00:25", "remaining_time": "2 days, 19:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 9627, "loss": 1.791, "learning_rate": 9.921994738359409e-05, "epoch": 0.05629998961254804, "percentage": 5.63, "elapsed_time": "4:00:53", "remaining_time": "2 days, 19:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 9627, "loss": 1.8141, "learning_rate": 9.921707384779807e-05, "epoch": 0.05640386413212839, "percentage": 5.64, "elapsed_time": "4:01:20", "remaining_time": "2 days, 19:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 9627, "loss": 1.7599, "learning_rate": 9.92141950707676e-05, "epoch": 0.05650773865170874, "percentage": 5.65, "elapsed_time": "4:01:49", "remaining_time": "2 days, 19:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 9627, "loss": 1.5647, "learning_rate": 9.921131105280925e-05, "epoch": 0.056611613171289085, "percentage": 5.66, "elapsed_time": "4:02:18", "remaining_time": "2 days, 19:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 9627, "loss": 1.9926, "learning_rate": 9.920842179423013e-05, "epoch": 0.05671548769086943, "percentage": 5.67, "elapsed_time": "4:02:45", "remaining_time": "2 days, 19:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 9627, "loss": 1.6564, "learning_rate": 9.920552729533792e-05, "epoch": 0.056819362210449774, "percentage": 5.68, "elapsed_time": "4:03:13", "remaining_time": "2 days, 19:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 9627, "loss": 1.8871, "learning_rate": 9.92026275564409e-05, "epoch": 0.05692323673003012, "percentage": 5.69, "elapsed_time": "4:03:41", "remaining_time": "2 days, 19:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 9627, "loss": 2.0246, "learning_rate": 9.919972257784783e-05, "epoch": 0.05702711124961047, "percentage": 5.7, "elapsed_time": "4:04:08", "remaining_time": "2 days, 19:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 9627, "loss": 1.8523, "learning_rate": 9.919681235986806e-05, "epoch": 0.05713098576919082, "percentage": 5.71, "elapsed_time": "4:04:37", "remaining_time": "2 days, 19:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 9627, "loss": 1.7427, "learning_rate": 9.919389690281154e-05, "epoch": 0.057234860288771165, "percentage": 5.72, "elapsed_time": "4:05:03", "remaining_time": "2 days, 19:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 9627, "loss": 1.8491, "learning_rate": 9.919097620698872e-05, "epoch": 0.05733873480835151, "percentage": 5.73, "elapsed_time": "4:05:32", "remaining_time": "2 days, 19:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 9627, "loss": 1.7309, "learning_rate": 9.918805027271064e-05, "epoch": 0.05744260932793186, "percentage": 5.74, "elapsed_time": "4:05:59", "remaining_time": "2 days, 19:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 9627, "loss": 1.8213, "learning_rate": 9.918511910028888e-05, "epoch": 0.05754648384751221, "percentage": 5.75, "elapsed_time": "4:06:27", "remaining_time": "2 days, 19:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 9627, "loss": 1.6017, "learning_rate": 9.918218269003561e-05, "epoch": 0.05765035836709255, "percentage": 5.77, "elapsed_time": "4:06:54", "remaining_time": "2 days, 19:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 9627, "loss": 1.7434, "learning_rate": 9.917924104226351e-05, "epoch": 0.0577542328866729, "percentage": 5.78, "elapsed_time": "4:07:23", "remaining_time": "2 days, 19:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 9627, "loss": 1.8997, "learning_rate": 9.917629415728584e-05, "epoch": 0.057858107406253245, "percentage": 5.79, "elapsed_time": "4:07:49", "remaining_time": "2 days, 19:15:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 9627, "loss": 1.8736, "learning_rate": 9.917334203541645e-05, "epoch": 0.05796198192583359, "percentage": 5.8, "elapsed_time": "4:08:18", "remaining_time": "2 days, 19:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 9627, "loss": 1.8951, "learning_rate": 9.917038467696968e-05, "epoch": 0.05806585644541394, "percentage": 5.81, "elapsed_time": "4:08:45", "remaining_time": "2 days, 19:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 9627, "loss": 1.9565, "learning_rate": 9.916742208226051e-05, "epoch": 0.05816973096499429, "percentage": 5.82, "elapsed_time": "4:09:14", "remaining_time": "2 days, 19:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 561, "total_steps": 9627, "loss": 1.9673, "learning_rate": 9.91644542516044e-05, "epoch": 0.058273605484574637, "percentage": 5.83, "elapsed_time": "4:09:42", "remaining_time": "2 days, 19:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 9627, "loss": 2.0416, "learning_rate": 9.91614811853174e-05, "epoch": 0.05837748000415498, "percentage": 5.84, "elapsed_time": "4:10:09", "remaining_time": "2 days, 19:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 563, "total_steps": 9627, "loss": 1.8444, "learning_rate": 9.915850288371616e-05, "epoch": 0.058481354523735325, "percentage": 5.85, "elapsed_time": "4:10:37", "remaining_time": "2 days, 19:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 9627, "loss": 1.7398, "learning_rate": 9.915551934711777e-05, "epoch": 0.05858522904331567, "percentage": 5.86, "elapsed_time": "4:11:05", "remaining_time": "2 days, 19:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 9627, "loss": 1.5016, "learning_rate": 9.915253057584003e-05, "epoch": 0.05868910356289602, "percentage": 5.87, "elapsed_time": "4:11:33", "remaining_time": "2 days, 19:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 9627, "loss": 1.7225, "learning_rate": 9.914953657020118e-05, "epoch": 0.05879297808247637, "percentage": 5.88, "elapsed_time": "4:12:00", "remaining_time": "2 days, 19:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 567, "total_steps": 9627, "loss": 1.7444, "learning_rate": 9.914653733052006e-05, "epoch": 0.058896852602056717, "percentage": 5.89, "elapsed_time": "4:12:29", "remaining_time": "2 days, 19:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 9627, "loss": 1.8678, "learning_rate": 9.914353285711607e-05, "epoch": 0.059000727121637064, "percentage": 5.9, "elapsed_time": "4:12:57", "remaining_time": "2 days, 19:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 569, "total_steps": 9627, "loss": 1.9416, "learning_rate": 9.914052315030917e-05, "epoch": 0.05910460164121741, "percentage": 5.91, "elapsed_time": "4:13:25", "remaining_time": "2 days, 19:14:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 9627, "loss": 1.8087, "learning_rate": 9.913750821041987e-05, "epoch": 0.05920847616079775, "percentage": 5.92, "elapsed_time": "4:13:53", "remaining_time": "2 days, 19:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 571, "total_steps": 9627, "loss": 1.9329, "learning_rate": 9.913448803776922e-05, "epoch": 0.0593123506803781, "percentage": 5.93, "elapsed_time": "4:14:21", "remaining_time": "2 days, 19:14:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 9627, "loss": 1.882, "learning_rate": 9.913146263267887e-05, "epoch": 0.05941622519995845, "percentage": 5.94, "elapsed_time": "4:14:48", "remaining_time": "2 days, 19:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 573, "total_steps": 9627, "loss": 1.6253, "learning_rate": 9.912843199547099e-05, "epoch": 0.059520099719538797, "percentage": 5.95, "elapsed_time": "4:15:17", "remaining_time": "2 days, 19:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 9627, "loss": 1.7809, "learning_rate": 9.912539612646832e-05, "epoch": 0.059623974239119144, "percentage": 5.96, "elapsed_time": "4:15:44", "remaining_time": "2 days, 19:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 9627, "loss": 2.0883, "learning_rate": 9.912235502599414e-05, "epoch": 0.05972784875869949, "percentage": 5.97, "elapsed_time": "4:16:12", "remaining_time": "2 days, 19:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 9627, "loss": 1.7313, "learning_rate": 9.911930869437233e-05, "epoch": 0.05983172327827984, "percentage": 5.98, "elapsed_time": "4:16:41", "remaining_time": "2 days, 19:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 577, "total_steps": 9627, "loss": 1.906, "learning_rate": 9.911625713192729e-05, "epoch": 0.05993559779786019, "percentage": 5.99, "elapsed_time": "4:17:08", "remaining_time": "2 days, 19:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 9627, "loss": 1.8296, "learning_rate": 9.911320033898398e-05, "epoch": 0.06003947231744053, "percentage": 6.0, "elapsed_time": "4:17:37", "remaining_time": "2 days, 19:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 579, "total_steps": 9627, "loss": 1.8199, "learning_rate": 9.911013831586795e-05, "epoch": 0.060143346837020877, "percentage": 6.01, "elapsed_time": "4:18:05", "remaining_time": "2 days, 19:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 9627, "loss": 1.6965, "learning_rate": 9.910707106290525e-05, "epoch": 0.060247221356601224, "percentage": 6.02, "elapsed_time": "4:18:32", "remaining_time": "2 days, 19:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 581, "total_steps": 9627, "loss": 1.7974, "learning_rate": 9.910399858042252e-05, "epoch": 0.06035109587618157, "percentage": 6.04, "elapsed_time": "4:19:02", "remaining_time": "2 days, 19:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 9627, "loss": 1.7587, "learning_rate": 9.910092086874699e-05, "epoch": 0.06045497039576192, "percentage": 6.05, "elapsed_time": "4:19:28", "remaining_time": "2 days, 19:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 583, "total_steps": 9627, "loss": 1.7185, "learning_rate": 9.909783792820637e-05, "epoch": 0.06055884491534227, "percentage": 6.06, "elapsed_time": "4:19:57", "remaining_time": "2 days, 19:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 9627, "loss": 1.9277, "learning_rate": 9.909474975912899e-05, "epoch": 0.060662719434922616, "percentage": 6.07, "elapsed_time": "4:20:25", "remaining_time": "2 days, 19:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 9627, "loss": 1.8624, "learning_rate": 9.909165636184372e-05, "epoch": 0.060766593954502963, "percentage": 6.08, "elapsed_time": "4:20:53", "remaining_time": "2 days, 19:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 9627, "loss": 1.8565, "learning_rate": 9.908855773667997e-05, "epoch": 0.060870468474083304, "percentage": 6.09, "elapsed_time": "4:21:22", "remaining_time": "2 days, 19:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 587, "total_steps": 9627, "loss": 1.8135, "learning_rate": 9.908545388396775e-05, "epoch": 0.06097434299366365, "percentage": 6.1, "elapsed_time": "4:21:49", "remaining_time": "2 days, 19:12:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 9627, "loss": 1.7439, "learning_rate": 9.908234480403755e-05, "epoch": 0.061078217513244, "percentage": 6.11, "elapsed_time": "4:22:18", "remaining_time": "2 days, 19:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 589, "total_steps": 9627, "loss": 1.8637, "learning_rate": 9.90792304972205e-05, "epoch": 0.06118209203282435, "percentage": 6.12, "elapsed_time": "4:22:46", "remaining_time": "2 days, 19:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 9627, "loss": 1.6959, "learning_rate": 9.907611096384823e-05, "epoch": 0.061285966552404696, "percentage": 6.13, "elapsed_time": "4:23:14", "remaining_time": "2 days, 19:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 591, "total_steps": 9627, "loss": 1.7969, "learning_rate": 9.907298620425294e-05, "epoch": 0.061389841071985043, "percentage": 6.14, "elapsed_time": "4:23:42", "remaining_time": "2 days, 19:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 9627, "loss": 1.8457, "learning_rate": 9.90698562187674e-05, "epoch": 0.06149371559156539, "percentage": 6.15, "elapsed_time": "4:24:10", "remaining_time": "2 days, 19:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 593, "total_steps": 9627, "loss": 1.6876, "learning_rate": 9.906672100772496e-05, "epoch": 0.06159759011114574, "percentage": 6.16, "elapsed_time": "4:24:38", "remaining_time": "2 days, 19:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 9627, "loss": 1.7644, "learning_rate": 9.906358057145945e-05, "epoch": 0.06170146463072608, "percentage": 6.17, "elapsed_time": "4:25:06", "remaining_time": "2 days, 19:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 9627, "loss": 1.9074, "learning_rate": 9.906043491030532e-05, "epoch": 0.06180533915030643, "percentage": 6.18, "elapsed_time": "4:25:34", "remaining_time": "2 days, 19:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 9627, "loss": 1.834, "learning_rate": 9.905728402459755e-05, "epoch": 0.061909213669886776, "percentage": 6.19, "elapsed_time": "4:26:02", "remaining_time": "2 days, 19:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 597, "total_steps": 9627, "loss": 1.7292, "learning_rate": 9.905412791467171e-05, "epoch": 0.062013088189467123, "percentage": 6.2, "elapsed_time": "4:26:30", "remaining_time": "2 days, 19:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 9627, "loss": 2.0142, "learning_rate": 9.905096658086387e-05, "epoch": 0.06211696270904747, "percentage": 6.21, "elapsed_time": "4:26:58", "remaining_time": "2 days, 19:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 599, "total_steps": 9627, "loss": 1.852, "learning_rate": 9.904780002351071e-05, "epoch": 0.06222083722862782, "percentage": 6.22, "elapsed_time": "4:27:25", "remaining_time": "2 days, 19:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 9627, "loss": 1.7035, "learning_rate": 9.904462824294944e-05, "epoch": 0.06232471174820817, "percentage": 6.23, "elapsed_time": "4:27:54", "remaining_time": "2 days, 19:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 601, "total_steps": 9627, "loss": 1.7046, "learning_rate": 9.904145123951781e-05, "epoch": 0.062428586267788515, "percentage": 6.24, "elapsed_time": "4:28:23", "remaining_time": "2 days, 19:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 9627, "loss": 1.8107, "learning_rate": 9.903826901355417e-05, "epoch": 0.06253246078736886, "percentage": 6.25, "elapsed_time": "4:28:51", "remaining_time": "2 days, 19:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 603, "total_steps": 9627, "loss": 1.8613, "learning_rate": 9.90350815653974e-05, "epoch": 0.0626363353069492, "percentage": 6.26, "elapsed_time": "4:29:18", "remaining_time": "2 days, 19:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 9627, "loss": 1.6605, "learning_rate": 9.903188889538692e-05, "epoch": 0.06274020982652956, "percentage": 6.27, "elapsed_time": "4:29:47", "remaining_time": "2 days, 19:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 9627, "loss": 1.8248, "learning_rate": 9.902869100386273e-05, "epoch": 0.0628440843461099, "percentage": 6.28, "elapsed_time": "4:30:15", "remaining_time": "2 days, 19:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 9627, "loss": 1.8456, "learning_rate": 9.90254878911654e-05, "epoch": 0.06294795886569024, "percentage": 6.29, "elapsed_time": "4:30:42", "remaining_time": "2 days, 19:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 607, "total_steps": 9627, "loss": 1.6454, "learning_rate": 9.902227955763602e-05, "epoch": 0.0630518333852706, "percentage": 6.31, "elapsed_time": "4:31:11", "remaining_time": "2 days, 19:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 9627, "loss": 1.8036, "learning_rate": 9.901906600361625e-05, "epoch": 0.06315570790485094, "percentage": 6.32, "elapsed_time": "4:31:39", "remaining_time": "2 days, 19:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 609, "total_steps": 9627, "loss": 1.8153, "learning_rate": 9.901584722944833e-05, "epoch": 0.06325958242443129, "percentage": 6.33, "elapsed_time": "4:32:07", "remaining_time": "2 days, 19:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 9627, "loss": 1.7256, "learning_rate": 9.9012623235475e-05, "epoch": 0.06336345694401163, "percentage": 6.34, "elapsed_time": "4:32:36", "remaining_time": "2 days, 19:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 611, "total_steps": 9627, "loss": 2.0305, "learning_rate": 9.900939402203962e-05, "epoch": 0.06346733146359199, "percentage": 6.35, "elapsed_time": "4:33:03", "remaining_time": "2 days, 19:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 9627, "loss": 1.7801, "learning_rate": 9.900615958948606e-05, "epoch": 0.06357120598317233, "percentage": 6.36, "elapsed_time": "4:33:32", "remaining_time": "2 days, 19:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 613, "total_steps": 9627, "loss": 1.6963, "learning_rate": 9.900291993815877e-05, "epoch": 0.06367508050275267, "percentage": 6.37, "elapsed_time": "4:34:00", "remaining_time": "2 days, 19:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 9627, "loss": 1.8211, "learning_rate": 9.899967506840273e-05, "epoch": 0.06377895502233302, "percentage": 6.38, "elapsed_time": "4:34:29", "remaining_time": "2 days, 19:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 9627, "loss": 1.8328, "learning_rate": 9.899642498056353e-05, "epoch": 0.06388282954191336, "percentage": 6.39, "elapsed_time": "4:34:57", "remaining_time": "2 days, 19:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 9627, "loss": 1.9433, "learning_rate": 9.899316967498724e-05, "epoch": 0.06398670406149372, "percentage": 6.4, "elapsed_time": "4:35:25", "remaining_time": "2 days, 19:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 617, "total_steps": 9627, "loss": 1.8383, "learning_rate": 9.898990915202055e-05, "epoch": 0.06409057858107406, "percentage": 6.41, "elapsed_time": "4:35:53", "remaining_time": "2 days, 19:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 9627, "loss": 1.8279, "learning_rate": 9.898664341201067e-05, "epoch": 0.06419445310065441, "percentage": 6.42, "elapsed_time": "4:36:22", "remaining_time": "2 days, 19:08:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 619, "total_steps": 9627, "loss": 1.6484, "learning_rate": 9.898337245530536e-05, "epoch": 0.06429832762023475, "percentage": 6.43, "elapsed_time": "4:36:50", "remaining_time": "2 days, 19:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 9627, "loss": 1.9679, "learning_rate": 9.8980096282253e-05, "epoch": 0.06440220213981511, "percentage": 6.44, "elapsed_time": "4:37:18", "remaining_time": "2 days, 19:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 621, "total_steps": 9627, "loss": 1.8297, "learning_rate": 9.897681489320242e-05, "epoch": 0.06450607665939545, "percentage": 6.45, "elapsed_time": "4:37:46", "remaining_time": "2 days, 19:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 9627, "loss": 1.9845, "learning_rate": 9.897352828850309e-05, "epoch": 0.06460995117897579, "percentage": 6.46, "elapsed_time": "4:38:15", "remaining_time": "2 days, 19:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 623, "total_steps": 9627, "loss": 1.7576, "learning_rate": 9.897023646850502e-05, "epoch": 0.06471382569855615, "percentage": 6.47, "elapsed_time": "4:38:42", "remaining_time": "2 days, 19:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 9627, "loss": 1.7502, "learning_rate": 9.896693943355874e-05, "epoch": 0.06481770021813649, "percentage": 6.48, "elapsed_time": "4:39:10", "remaining_time": "2 days, 19:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 9627, "loss": 1.5323, "learning_rate": 9.896363718401536e-05, "epoch": 0.06492157473771684, "percentage": 6.49, "elapsed_time": "4:39:38", "remaining_time": "2 days, 19:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 9627, "loss": 1.5328, "learning_rate": 9.896032972022656e-05, "epoch": 0.06502544925729718, "percentage": 6.5, "elapsed_time": "4:40:07", "remaining_time": "2 days, 19:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 627, "total_steps": 9627, "loss": 1.7393, "learning_rate": 9.895701704254455e-05, "epoch": 0.06512932377687754, "percentage": 6.51, "elapsed_time": "4:40:36", "remaining_time": "2 days, 19:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 9627, "loss": 1.6363, "learning_rate": 9.89536991513221e-05, "epoch": 0.06523319829645788, "percentage": 6.52, "elapsed_time": "4:41:04", "remaining_time": "2 days, 19:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 629, "total_steps": 9627, "loss": 1.6374, "learning_rate": 9.895037604691256e-05, "epoch": 0.06533707281603822, "percentage": 6.53, "elapsed_time": "4:41:33", "remaining_time": "2 days, 19:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 9627, "loss": 1.773, "learning_rate": 9.894704772966977e-05, "epoch": 0.06544094733561857, "percentage": 6.54, "elapsed_time": "4:42:00", "remaining_time": "2 days, 19:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 631, "total_steps": 9627, "loss": 1.7417, "learning_rate": 9.894371419994821e-05, "epoch": 0.06554482185519891, "percentage": 6.55, "elapsed_time": "4:42:28", "remaining_time": "2 days, 19:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 9627, "loss": 1.8542, "learning_rate": 9.894037545810288e-05, "epoch": 0.06564869637477927, "percentage": 6.56, "elapsed_time": "4:42:58", "remaining_time": "2 days, 19:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 633, "total_steps": 9627, "loss": 1.917, "learning_rate": 9.89370315044893e-05, "epoch": 0.06575257089435961, "percentage": 6.58, "elapsed_time": "4:43:25", "remaining_time": "2 days, 19:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 9627, "loss": 1.9253, "learning_rate": 9.893368233946359e-05, "epoch": 0.06585644541393997, "percentage": 6.59, "elapsed_time": "4:43:53", "remaining_time": "2 days, 19:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 9627, "loss": 1.6948, "learning_rate": 9.89303279633824e-05, "epoch": 0.0659603199335203, "percentage": 6.6, "elapsed_time": "4:44:22", "remaining_time": "2 days, 19:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 9627, "loss": 1.8504, "learning_rate": 9.892696837660295e-05, "epoch": 0.06606419445310066, "percentage": 6.61, "elapsed_time": "4:44:50", "remaining_time": "2 days, 19:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 637, "total_steps": 9627, "loss": 1.7728, "learning_rate": 9.892360357948303e-05, "epoch": 0.066168068972681, "percentage": 6.62, "elapsed_time": "4:45:18", "remaining_time": "2 days, 19:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 9627, "loss": 1.8216, "learning_rate": 9.892023357238094e-05, "epoch": 0.06627194349226134, "percentage": 6.63, "elapsed_time": "4:45:47", "remaining_time": "2 days, 19:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 639, "total_steps": 9627, "loss": 1.725, "learning_rate": 9.891685835565557e-05, "epoch": 0.0663758180118417, "percentage": 6.64, "elapsed_time": "4:46:15", "remaining_time": "2 days, 19:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 9627, "loss": 1.7718, "learning_rate": 9.891347792966635e-05, "epoch": 0.06647969253142204, "percentage": 6.65, "elapsed_time": "4:46:43", "remaining_time": "2 days, 19:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 641, "total_steps": 9627, "loss": 1.9705, "learning_rate": 9.891009229477326e-05, "epoch": 0.06658356705100239, "percentage": 6.66, "elapsed_time": "4:47:11", "remaining_time": "2 days, 19:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 9627, "loss": 2.0534, "learning_rate": 9.890670145133687e-05, "epoch": 0.06668744157058273, "percentage": 6.67, "elapsed_time": "4:47:40", "remaining_time": "2 days, 19:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 643, "total_steps": 9627, "loss": 1.9179, "learning_rate": 9.890330539971825e-05, "epoch": 0.06679131609016309, "percentage": 6.68, "elapsed_time": "4:48:08", "remaining_time": "2 days, 19:05:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 9627, "loss": 1.8077, "learning_rate": 9.889990414027907e-05, "epoch": 0.06689519060974343, "percentage": 6.69, "elapsed_time": "4:48:37", "remaining_time": "2 days, 19:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 9627, "loss": 1.6712, "learning_rate": 9.889649767338153e-05, "epoch": 0.06699906512932377, "percentage": 6.7, "elapsed_time": "4:49:05", "remaining_time": "2 days, 19:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 9627, "loss": 1.629, "learning_rate": 9.88930859993884e-05, "epoch": 0.06710293964890413, "percentage": 6.71, "elapsed_time": "4:49:34", "remaining_time": "2 days, 19:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 647, "total_steps": 9627, "loss": 2.02, "learning_rate": 9.888966911866299e-05, "epoch": 0.06720681416848447, "percentage": 6.72, "elapsed_time": "4:50:02", "remaining_time": "2 days, 19:05:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 9627, "loss": 1.6907, "learning_rate": 9.888624703156918e-05, "epoch": 0.06731068868806482, "percentage": 6.73, "elapsed_time": "4:50:30", "remaining_time": "2 days, 19:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 649, "total_steps": 9627, "loss": 1.6967, "learning_rate": 9.888281973847138e-05, "epoch": 0.06741456320764516, "percentage": 6.74, "elapsed_time": "4:50:59", "remaining_time": "2 days, 19:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 9627, "loss": 1.7385, "learning_rate": 9.887938723973458e-05, "epoch": 0.06751843772722552, "percentage": 6.75, "elapsed_time": "4:51:27", "remaining_time": "2 days, 19:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 651, "total_steps": 9627, "loss": 1.6206, "learning_rate": 9.887594953572432e-05, "epoch": 0.06762231224680586, "percentage": 6.76, "elapsed_time": "4:51:56", "remaining_time": "2 days, 19:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 9627, "loss": 1.6185, "learning_rate": 9.887250662680667e-05, "epoch": 0.06772618676638621, "percentage": 6.77, "elapsed_time": "4:52:24", "remaining_time": "2 days, 19:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 653, "total_steps": 9627, "loss": 1.8004, "learning_rate": 9.886905851334829e-05, "epoch": 0.06783006128596655, "percentage": 6.78, "elapsed_time": "4:52:51", "remaining_time": "2 days, 19:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 9627, "loss": 1.7545, "learning_rate": 9.886560519571637e-05, "epoch": 0.0679339358055469, "percentage": 6.79, "elapsed_time": "4:53:20", "remaining_time": "2 days, 19:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 9627, "loss": 1.7991, "learning_rate": 9.886214667427867e-05, "epoch": 0.06803781032512725, "percentage": 6.8, "elapsed_time": "4:53:49", "remaining_time": "2 days, 19:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 9627, "loss": 1.7288, "learning_rate": 9.885868294940349e-05, "epoch": 0.06814168484470759, "percentage": 6.81, "elapsed_time": "4:54:17", "remaining_time": "2 days, 19:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 657, "total_steps": 9627, "loss": 1.7928, "learning_rate": 9.885521402145967e-05, "epoch": 0.06824555936428794, "percentage": 6.82, "elapsed_time": "4:54:45", "remaining_time": "2 days, 19:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 9627, "loss": 1.6569, "learning_rate": 9.885173989081664e-05, "epoch": 0.06834943388386829, "percentage": 6.83, "elapsed_time": "4:55:14", "remaining_time": "2 days, 19:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 659, "total_steps": 9627, "loss": 1.9213, "learning_rate": 9.88482605578444e-05, "epoch": 0.06845330840344864, "percentage": 6.85, "elapsed_time": "4:55:43", "remaining_time": "2 days, 19:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 9627, "loss": 1.6129, "learning_rate": 9.884477602291343e-05, "epoch": 0.06855718292302898, "percentage": 6.86, "elapsed_time": "4:56:11", "remaining_time": "2 days, 19:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 661, "total_steps": 9627, "loss": 1.8986, "learning_rate": 9.88412862863948e-05, "epoch": 0.06866105744260932, "percentage": 6.87, "elapsed_time": "4:56:38", "remaining_time": "2 days, 19:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 9627, "loss": 2.0618, "learning_rate": 9.883779134866016e-05, "epoch": 0.06876493196218968, "percentage": 6.88, "elapsed_time": "4:57:08", "remaining_time": "2 days, 19:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 663, "total_steps": 9627, "loss": 1.6847, "learning_rate": 9.883429121008169e-05, "epoch": 0.06886880648177002, "percentage": 6.89, "elapsed_time": "4:57:36", "remaining_time": "2 days, 19:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 9627, "loss": 1.7325, "learning_rate": 9.883078587103215e-05, "epoch": 0.06897268100135037, "percentage": 6.9, "elapsed_time": "4:58:03", "remaining_time": "2 days, 19:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 9627, "loss": 2.0511, "learning_rate": 9.882727533188481e-05, "epoch": 0.06907655552093071, "percentage": 6.91, "elapsed_time": "4:58:33", "remaining_time": "2 days, 19:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 9627, "loss": 1.7457, "learning_rate": 9.882375959301349e-05, "epoch": 0.06918043004051107, "percentage": 6.92, "elapsed_time": "4:59:00", "remaining_time": "2 days, 19:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 667, "total_steps": 9627, "loss": 1.9451, "learning_rate": 9.882023865479263e-05, "epoch": 0.06928430456009141, "percentage": 6.93, "elapsed_time": "4:59:30", "remaining_time": "2 days, 19:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 9627, "loss": 1.9018, "learning_rate": 9.881671251759717e-05, "epoch": 0.06938817907967175, "percentage": 6.94, "elapsed_time": "4:59:58", "remaining_time": "2 days, 19:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 669, "total_steps": 9627, "loss": 1.9383, "learning_rate": 9.881318118180258e-05, "epoch": 0.0694920535992521, "percentage": 6.95, "elapsed_time": "5:00:25", "remaining_time": "2 days, 19:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 9627, "loss": 1.6511, "learning_rate": 9.880964464778499e-05, "epoch": 0.06959592811883245, "percentage": 6.96, "elapsed_time": "5:00:55", "remaining_time": "2 days, 19:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 671, "total_steps": 9627, "loss": 1.7165, "learning_rate": 9.880610291592096e-05, "epoch": 0.0696998026384128, "percentage": 6.97, "elapsed_time": "5:01:23", "remaining_time": "2 days, 19:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 9627, "loss": 1.6612, "learning_rate": 9.880255598658767e-05, "epoch": 0.06980367715799314, "percentage": 6.98, "elapsed_time": "5:01:51", "remaining_time": "2 days, 19:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 673, "total_steps": 9627, "loss": 1.8946, "learning_rate": 9.879900386016284e-05, "epoch": 0.0699075516775735, "percentage": 6.99, "elapsed_time": "5:02:19", "remaining_time": "2 days, 19:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 9627, "loss": 1.8398, "learning_rate": 9.879544653702476e-05, "epoch": 0.07001142619715384, "percentage": 7.0, "elapsed_time": "5:02:48", "remaining_time": "2 days, 19:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 9627, "loss": 1.928, "learning_rate": 9.879188401755222e-05, "epoch": 0.07011530071673419, "percentage": 7.01, "elapsed_time": "5:03:16", "remaining_time": "2 days, 19:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 9627, "loss": 1.9605, "learning_rate": 9.878831630212465e-05, "epoch": 0.07021917523631453, "percentage": 7.02, "elapsed_time": "5:03:43", "remaining_time": "2 days, 19:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 677, "total_steps": 9627, "loss": 1.7933, "learning_rate": 9.878474339112193e-05, "epoch": 0.07032304975589487, "percentage": 7.03, "elapsed_time": "5:04:13", "remaining_time": "2 days, 19:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 9627, "loss": 1.7487, "learning_rate": 9.878116528492458e-05, "epoch": 0.07042692427547523, "percentage": 7.04, "elapsed_time": "5:04:41", "remaining_time": "2 days, 19:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 679, "total_steps": 9627, "loss": 1.8613, "learning_rate": 9.877758198391365e-05, "epoch": 0.07053079879505557, "percentage": 7.05, "elapsed_time": "5:05:08", "remaining_time": "2 days, 19:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 9627, "loss": 1.6381, "learning_rate": 9.87739934884707e-05, "epoch": 0.07063467331463592, "percentage": 7.06, "elapsed_time": "5:05:36", "remaining_time": "2 days, 19:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 681, "total_steps": 9627, "loss": 1.944, "learning_rate": 9.87703997989779e-05, "epoch": 0.07073854783421626, "percentage": 7.07, "elapsed_time": "5:06:05", "remaining_time": "2 days, 19:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 9627, "loss": 1.7308, "learning_rate": 9.876680091581796e-05, "epoch": 0.07084242235379662, "percentage": 7.08, "elapsed_time": "5:06:33", "remaining_time": "2 days, 19:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 683, "total_steps": 9627, "loss": 1.8055, "learning_rate": 9.876319683937412e-05, "epoch": 0.07094629687337696, "percentage": 7.09, "elapsed_time": "5:07:01", "remaining_time": "2 days, 19:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 9627, "loss": 1.7043, "learning_rate": 9.875958757003017e-05, "epoch": 0.0710501713929573, "percentage": 7.11, "elapsed_time": "5:07:30", "remaining_time": "2 days, 19:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 9627, "loss": 1.8259, "learning_rate": 9.875597310817049e-05, "epoch": 0.07115404591253766, "percentage": 7.12, "elapsed_time": "5:07:58", "remaining_time": "2 days, 19:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 9627, "loss": 1.7541, "learning_rate": 9.875235345417997e-05, "epoch": 0.071257920432118, "percentage": 7.13, "elapsed_time": "5:08:26", "remaining_time": "2 days, 19:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 687, "total_steps": 9627, "loss": 1.5966, "learning_rate": 9.874872860844411e-05, "epoch": 0.07136179495169835, "percentage": 7.14, "elapsed_time": "5:08:54", "remaining_time": "2 days, 18:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 9627, "loss": 1.7182, "learning_rate": 9.87450985713489e-05, "epoch": 0.07146566947127869, "percentage": 7.15, "elapsed_time": "5:09:23", "remaining_time": "2 days, 18:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 689, "total_steps": 9627, "loss": 1.553, "learning_rate": 9.874146334328092e-05, "epoch": 0.07156954399085905, "percentage": 7.16, "elapsed_time": "5:09:51", "remaining_time": "2 days, 18:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 9627, "loss": 1.9359, "learning_rate": 9.873782292462727e-05, "epoch": 0.07167341851043939, "percentage": 7.17, "elapsed_time": "5:10:19", "remaining_time": "2 days, 18:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 691, "total_steps": 9627, "loss": 1.9939, "learning_rate": 9.873417731577568e-05, "epoch": 0.07177729303001974, "percentage": 7.18, "elapsed_time": "5:10:48", "remaining_time": "2 days, 18:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 9627, "loss": 1.8192, "learning_rate": 9.873052651711434e-05, "epoch": 0.07188116754960008, "percentage": 7.19, "elapsed_time": "5:11:16", "remaining_time": "2 days, 18:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 693, "total_steps": 9627, "loss": 1.6569, "learning_rate": 9.872687052903203e-05, "epoch": 0.07198504206918042, "percentage": 7.2, "elapsed_time": "5:11:44", "remaining_time": "2 days, 18:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 9627, "loss": 1.743, "learning_rate": 9.87232093519181e-05, "epoch": 0.07208891658876078, "percentage": 7.21, "elapsed_time": "5:12:13", "remaining_time": "2 days, 18:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 9627, "loss": 1.7822, "learning_rate": 9.871954298616242e-05, "epoch": 0.07219279110834112, "percentage": 7.22, "elapsed_time": "5:12:41", "remaining_time": "2 days, 18:58:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 9627, "loss": 1.7646, "learning_rate": 9.871587143215545e-05, "epoch": 0.07229666562792147, "percentage": 7.23, "elapsed_time": "5:13:10", "remaining_time": "2 days, 18:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 697, "total_steps": 9627, "loss": 1.798, "learning_rate": 9.871219469028816e-05, "epoch": 0.07240054014750182, "percentage": 7.24, "elapsed_time": "5:13:37", "remaining_time": "2 days, 18:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 9627, "loss": 1.757, "learning_rate": 9.870851276095212e-05, "epoch": 0.07250441466708217, "percentage": 7.25, "elapsed_time": "5:14:07", "remaining_time": "2 days, 18:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 699, "total_steps": 9627, "loss": 1.6328, "learning_rate": 9.87048256445394e-05, "epoch": 0.07260828918666251, "percentage": 7.26, "elapsed_time": "5:14:35", "remaining_time": "2 days, 18:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 9627, "loss": 1.7512, "learning_rate": 9.870113334144267e-05, "epoch": 0.07271216370624285, "percentage": 7.27, "elapsed_time": "5:15:04", "remaining_time": "2 days, 18:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 701, "total_steps": 9627, "loss": 1.8032, "learning_rate": 9.869743585205511e-05, "epoch": 0.07281603822582321, "percentage": 7.28, "elapsed_time": "5:15:32", "remaining_time": "2 days, 18:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 9627, "loss": 1.8526, "learning_rate": 9.869373317677049e-05, "epoch": 0.07291991274540355, "percentage": 7.29, "elapsed_time": "5:16:01", "remaining_time": "2 days, 18:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 703, "total_steps": 9627, "loss": 1.8994, "learning_rate": 9.869002531598312e-05, "epoch": 0.0730237872649839, "percentage": 7.3, "elapsed_time": "5:16:29", "remaining_time": "2 days, 18:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 9627, "loss": 1.853, "learning_rate": 9.868631227008785e-05, "epoch": 0.07312766178456424, "percentage": 7.31, "elapsed_time": "5:16:57", "remaining_time": "2 days, 18:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 9627, "loss": 1.9527, "learning_rate": 9.868259403948008e-05, "epoch": 0.0732315363041446, "percentage": 7.32, "elapsed_time": "5:17:26", "remaining_time": "2 days, 18:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 9627, "loss": 1.7766, "learning_rate": 9.867887062455579e-05, "epoch": 0.07333541082372494, "percentage": 7.33, "elapsed_time": "5:17:53", "remaining_time": "2 days, 18:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 707, "total_steps": 9627, "loss": 1.5639, "learning_rate": 9.867514202571149e-05, "epoch": 0.0734392853433053, "percentage": 7.34, "elapsed_time": "5:18:21", "remaining_time": "2 days, 18:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 9627, "loss": 1.9035, "learning_rate": 9.867140824334424e-05, "epoch": 0.07354315986288563, "percentage": 7.35, "elapsed_time": "5:18:51", "remaining_time": "2 days, 18:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 709, "total_steps": 9627, "loss": 1.8442, "learning_rate": 9.866766927785167e-05, "epoch": 0.07364703438246598, "percentage": 7.36, "elapsed_time": "5:19:18", "remaining_time": "2 days, 18:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 9627, "loss": 1.6519, "learning_rate": 9.866392512963195e-05, "epoch": 0.07375090890204633, "percentage": 7.38, "elapsed_time": "5:19:48", "remaining_time": "2 days, 18:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 711, "total_steps": 9627, "loss": 1.8225, "learning_rate": 9.86601757990838e-05, "epoch": 0.07385478342162667, "percentage": 7.39, "elapsed_time": "5:20:16", "remaining_time": "2 days, 18:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 9627, "loss": 1.778, "learning_rate": 9.865642128660647e-05, "epoch": 0.07395865794120703, "percentage": 7.4, "elapsed_time": "5:20:44", "remaining_time": "2 days, 18:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 713, "total_steps": 9627, "loss": 1.9915, "learning_rate": 9.865266159259981e-05, "epoch": 0.07406253246078737, "percentage": 7.41, "elapsed_time": "5:21:13", "remaining_time": "2 days, 18:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 9627, "loss": 2.0117, "learning_rate": 9.864889671746421e-05, "epoch": 0.07416640698036772, "percentage": 7.42, "elapsed_time": "5:21:42", "remaining_time": "2 days, 18:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 9627, "loss": 2.2284, "learning_rate": 9.864512666160058e-05, "epoch": 0.07427028149994806, "percentage": 7.43, "elapsed_time": "5:22:09", "remaining_time": "2 days, 18:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 9627, "loss": 1.7284, "learning_rate": 9.86413514254104e-05, "epoch": 0.0743741560195284, "percentage": 7.44, "elapsed_time": "5:22:38", "remaining_time": "2 days, 18:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 717, "total_steps": 9627, "loss": 1.7128, "learning_rate": 9.863757100929573e-05, "epoch": 0.07447803053910876, "percentage": 7.45, "elapsed_time": "5:23:07", "remaining_time": "2 days, 18:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 9627, "loss": 1.8116, "learning_rate": 9.863378541365912e-05, "epoch": 0.0745819050586891, "percentage": 7.46, "elapsed_time": "5:23:34", "remaining_time": "2 days, 18:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 719, "total_steps": 9627, "loss": 1.9717, "learning_rate": 9.862999463890372e-05, "epoch": 0.07468577957826945, "percentage": 7.47, "elapsed_time": "5:24:04", "remaining_time": "2 days, 18:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 9627, "loss": 1.886, "learning_rate": 9.862619868543322e-05, "epoch": 0.0747896540978498, "percentage": 7.48, "elapsed_time": "5:24:32", "remaining_time": "2 days, 18:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 721, "total_steps": 9627, "loss": 1.7202, "learning_rate": 9.862239755365186e-05, "epoch": 0.07489352861743015, "percentage": 7.49, "elapsed_time": "5:25:02", "remaining_time": "2 days, 18:54:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 9627, "loss": 1.9074, "learning_rate": 9.861859124396444e-05, "epoch": 0.07499740313701049, "percentage": 7.5, "elapsed_time": "5:25:29", "remaining_time": "2 days, 18:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 723, "total_steps": 9627, "loss": 1.963, "learning_rate": 9.86147797567763e-05, "epoch": 0.07510127765659085, "percentage": 7.51, "elapsed_time": "5:25:58", "remaining_time": "2 days, 18:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 9627, "loss": 2.119, "learning_rate": 9.86109630924933e-05, "epoch": 0.07520515217617119, "percentage": 7.52, "elapsed_time": "5:26:27", "remaining_time": "2 days, 18:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 9627, "loss": 1.8536, "learning_rate": 9.860714125152191e-05, "epoch": 0.07530902669575153, "percentage": 7.53, "elapsed_time": "5:26:55", "remaining_time": "2 days, 18:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 9627, "loss": 1.7498, "learning_rate": 9.860331423426914e-05, "epoch": 0.07541290121533188, "percentage": 7.54, "elapsed_time": "5:27:24", "remaining_time": "2 days, 18:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 727, "total_steps": 9627, "loss": 1.9569, "learning_rate": 9.859948204114253e-05, "epoch": 0.07551677573491222, "percentage": 7.55, "elapsed_time": "5:27:52", "remaining_time": "2 days, 18:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 9627, "loss": 2.0232, "learning_rate": 9.859564467255015e-05, "epoch": 0.07562065025449258, "percentage": 7.56, "elapsed_time": "5:28:20", "remaining_time": "2 days, 18:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 729, "total_steps": 9627, "loss": 1.6597, "learning_rate": 9.859180212890069e-05, "epoch": 0.07572452477407292, "percentage": 7.57, "elapsed_time": "5:28:48", "remaining_time": "2 days, 18:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 9627, "loss": 1.8534, "learning_rate": 9.858795441060333e-05, "epoch": 0.07582839929365327, "percentage": 7.58, "elapsed_time": "5:29:17", "remaining_time": "2 days, 18:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 731, "total_steps": 9627, "loss": 1.8047, "learning_rate": 9.858410151806783e-05, "epoch": 0.07593227381323361, "percentage": 7.59, "elapsed_time": "5:29:45", "remaining_time": "2 days, 18:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 9627, "loss": 1.7222, "learning_rate": 9.85802434517045e-05, "epoch": 0.07603614833281395, "percentage": 7.6, "elapsed_time": "5:30:14", "remaining_time": "2 days, 18:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 733, "total_steps": 9627, "loss": 1.9158, "learning_rate": 9.857638021192417e-05, "epoch": 0.07614002285239431, "percentage": 7.61, "elapsed_time": "5:30:43", "remaining_time": "2 days, 18:52:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 9627, "loss": 2.1136, "learning_rate": 9.857251179913824e-05, "epoch": 0.07624389737197465, "percentage": 7.62, "elapsed_time": "5:31:10", "remaining_time": "2 days, 18:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 9627, "loss": 1.802, "learning_rate": 9.856863821375872e-05, "epoch": 0.076347771891555, "percentage": 7.63, "elapsed_time": "5:31:39", "remaining_time": "2 days, 18:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 9627, "loss": 1.8454, "learning_rate": 9.856475945619806e-05, "epoch": 0.07645164641113535, "percentage": 7.65, "elapsed_time": "5:32:08", "remaining_time": "2 days, 18:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 737, "total_steps": 9627, "loss": 1.7785, "learning_rate": 9.856087552686932e-05, "epoch": 0.0765555209307157, "percentage": 7.66, "elapsed_time": "5:32:36", "remaining_time": "2 days, 18:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 9627, "loss": 1.9353, "learning_rate": 9.855698642618616e-05, "epoch": 0.07665939545029604, "percentage": 7.67, "elapsed_time": "5:33:03", "remaining_time": "2 days, 18:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 739, "total_steps": 9627, "loss": 1.9781, "learning_rate": 9.855309215456268e-05, "epoch": 0.07676326996987638, "percentage": 7.68, "elapsed_time": "5:33:33", "remaining_time": "2 days, 18:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 9627, "loss": 1.917, "learning_rate": 9.854919271241363e-05, "epoch": 0.07686714448945674, "percentage": 7.69, "elapsed_time": "5:34:01", "remaining_time": "2 days, 18:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 741, "total_steps": 9627, "loss": 1.6168, "learning_rate": 9.854528810015425e-05, "epoch": 0.07697101900903708, "percentage": 7.7, "elapsed_time": "5:34:30", "remaining_time": "2 days, 18:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 9627, "loss": 1.7935, "learning_rate": 9.854137831820035e-05, "epoch": 0.07707489352861743, "percentage": 7.71, "elapsed_time": "5:34:58", "remaining_time": "2 days, 18:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 743, "total_steps": 9627, "loss": 1.7695, "learning_rate": 9.85374633669683e-05, "epoch": 0.07717876804819777, "percentage": 7.72, "elapsed_time": "5:35:27", "remaining_time": "2 days, 18:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 9627, "loss": 1.8163, "learning_rate": 9.8533543246875e-05, "epoch": 0.07728264256777813, "percentage": 7.73, "elapsed_time": "5:35:55", "remaining_time": "2 days, 18:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 9627, "loss": 1.7706, "learning_rate": 9.852961795833793e-05, "epoch": 0.07738651708735847, "percentage": 7.74, "elapsed_time": "5:36:25", "remaining_time": "2 days, 18:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 9627, "loss": 1.6099, "learning_rate": 9.852568750177508e-05, "epoch": 0.07749039160693882, "percentage": 7.75, "elapsed_time": "5:36:52", "remaining_time": "2 days, 18:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 747, "total_steps": 9627, "loss": 1.5333, "learning_rate": 9.852175187760504e-05, "epoch": 0.07759426612651917, "percentage": 7.76, "elapsed_time": "5:37:21", "remaining_time": "2 days, 18:50:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 9627, "loss": 1.7676, "learning_rate": 9.851781108624692e-05, "epoch": 0.0776981406460995, "percentage": 7.77, "elapsed_time": "5:37:49", "remaining_time": "2 days, 18:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 749, "total_steps": 9627, "loss": 1.8172, "learning_rate": 9.851386512812036e-05, "epoch": 0.07780201516567986, "percentage": 7.78, "elapsed_time": "5:38:18", "remaining_time": "2 days, 18:50:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 9627, "loss": 1.8644, "learning_rate": 9.850991400364557e-05, "epoch": 0.0779058896852602, "percentage": 7.79, "elapsed_time": "5:38:46", "remaining_time": "2 days, 18:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 751, "total_steps": 9627, "loss": 1.8879, "learning_rate": 9.850595771324335e-05, "epoch": 0.07800976420484056, "percentage": 7.8, "elapsed_time": "5:39:16", "remaining_time": "2 days, 18:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 9627, "loss": 1.9628, "learning_rate": 9.850199625733501e-05, "epoch": 0.0781136387244209, "percentage": 7.81, "elapsed_time": "5:39:43", "remaining_time": "2 days, 18:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 753, "total_steps": 9627, "loss": 1.8383, "learning_rate": 9.849802963634238e-05, "epoch": 0.07821751324400125, "percentage": 7.82, "elapsed_time": "5:40:12", "remaining_time": "2 days, 18:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 9627, "loss": 1.903, "learning_rate": 9.849405785068789e-05, "epoch": 0.07832138776358159, "percentage": 7.83, "elapsed_time": "5:40:41", "remaining_time": "2 days, 18:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 9627, "loss": 1.7703, "learning_rate": 9.84900809007945e-05, "epoch": 0.07842526228316193, "percentage": 7.84, "elapsed_time": "5:41:10", "remaining_time": "2 days, 18:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 9627, "loss": 2.017, "learning_rate": 9.848609878708575e-05, "epoch": 0.07852913680274229, "percentage": 7.85, "elapsed_time": "5:41:38", "remaining_time": "2 days, 18:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 757, "total_steps": 9627, "loss": 1.8528, "learning_rate": 9.848211150998568e-05, "epoch": 0.07863301132232263, "percentage": 7.86, "elapsed_time": "5:42:07", "remaining_time": "2 days, 18:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 9627, "loss": 1.8787, "learning_rate": 9.84781190699189e-05, "epoch": 0.07873688584190298, "percentage": 7.87, "elapsed_time": "5:42:35", "remaining_time": "2 days, 18:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 759, "total_steps": 9627, "loss": 2.0583, "learning_rate": 9.847412146731058e-05, "epoch": 0.07884076036148333, "percentage": 7.88, "elapsed_time": "5:43:04", "remaining_time": "2 days, 18:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 9627, "loss": 1.9294, "learning_rate": 9.847011870258644e-05, "epoch": 0.07894463488106368, "percentage": 7.89, "elapsed_time": "5:43:32", "remaining_time": "2 days, 18:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 761, "total_steps": 9627, "loss": 1.7817, "learning_rate": 9.846611077617274e-05, "epoch": 0.07904850940064402, "percentage": 7.9, "elapsed_time": "5:44:02", "remaining_time": "2 days, 18:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 9627, "loss": 1.8936, "learning_rate": 9.84620976884963e-05, "epoch": 0.07915238392022438, "percentage": 7.92, "elapsed_time": "5:44:30", "remaining_time": "2 days, 18:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 763, "total_steps": 9627, "loss": 1.6904, "learning_rate": 9.845807943998448e-05, "epoch": 0.07925625843980472, "percentage": 7.93, "elapsed_time": "5:44:58", "remaining_time": "2 days, 18:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 9627, "loss": 1.9056, "learning_rate": 9.845405603106518e-05, "epoch": 0.07936013295938506, "percentage": 7.94, "elapsed_time": "5:45:27", "remaining_time": "2 days, 18:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 9627, "loss": 1.8097, "learning_rate": 9.845002746216687e-05, "epoch": 0.07946400747896541, "percentage": 7.95, "elapsed_time": "5:45:55", "remaining_time": "2 days, 18:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 9627, "loss": 1.6326, "learning_rate": 9.844599373371855e-05, "epoch": 0.07956788199854575, "percentage": 7.96, "elapsed_time": "5:46:24", "remaining_time": "2 days, 18:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 767, "total_steps": 9627, "loss": 1.9049, "learning_rate": 9.84419548461498e-05, "epoch": 0.07967175651812611, "percentage": 7.97, "elapsed_time": "5:46:52", "remaining_time": "2 days, 18:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 9627, "loss": 1.7215, "learning_rate": 9.843791079989071e-05, "epoch": 0.07977563103770645, "percentage": 7.98, "elapsed_time": "5:47:22", "remaining_time": "2 days, 18:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 769, "total_steps": 9627, "loss": 1.6931, "learning_rate": 9.843386159537196e-05, "epoch": 0.0798795055572868, "percentage": 7.99, "elapsed_time": "5:47:49", "remaining_time": "2 days, 18:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 9627, "loss": 1.7751, "learning_rate": 9.842980723302476e-05, "epoch": 0.07998338007686714, "percentage": 8.0, "elapsed_time": "5:48:19", "remaining_time": "2 days, 18:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 771, "total_steps": 9627, "loss": 1.7259, "learning_rate": 9.842574771328084e-05, "epoch": 0.08008725459644749, "percentage": 8.01, "elapsed_time": "5:48:47", "remaining_time": "2 days, 18:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 9627, "loss": 1.8242, "learning_rate": 9.842168303657253e-05, "epoch": 0.08019112911602784, "percentage": 8.02, "elapsed_time": "5:49:15", "remaining_time": "2 days, 18:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 773, "total_steps": 9627, "loss": 1.7493, "learning_rate": 9.841761320333266e-05, "epoch": 0.08029500363560818, "percentage": 8.03, "elapsed_time": "5:49:45", "remaining_time": "2 days, 18:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 9627, "loss": 1.7955, "learning_rate": 9.841353821399469e-05, "epoch": 0.08039887815518854, "percentage": 8.04, "elapsed_time": "5:50:13", "remaining_time": "2 days, 18:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 9627, "loss": 1.9765, "learning_rate": 9.840945806899253e-05, "epoch": 0.08050275267476888, "percentage": 8.05, "elapsed_time": "5:50:42", "remaining_time": "2 days, 18:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 9627, "loss": 1.6581, "learning_rate": 9.840537276876069e-05, "epoch": 0.08060662719434923, "percentage": 8.06, "elapsed_time": "5:51:10", "remaining_time": "2 days, 18:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 777, "total_steps": 9627, "loss": 1.8436, "learning_rate": 9.840128231373422e-05, "epoch": 0.08071050171392957, "percentage": 8.07, "elapsed_time": "5:51:38", "remaining_time": "2 days, 18:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 9627, "loss": 1.8948, "learning_rate": 9.839718670434873e-05, "epoch": 0.08081437623350993, "percentage": 8.08, "elapsed_time": "5:52:07", "remaining_time": "2 days, 18:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 779, "total_steps": 9627, "loss": 1.7955, "learning_rate": 9.839308594104038e-05, "epoch": 0.08091825075309027, "percentage": 8.09, "elapsed_time": "5:52:35", "remaining_time": "2 days, 18:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 9627, "loss": 1.987, "learning_rate": 9.838898002424585e-05, "epoch": 0.08102212527267061, "percentage": 8.1, "elapsed_time": "5:53:04", "remaining_time": "2 days, 18:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 781, "total_steps": 9627, "loss": 1.959, "learning_rate": 9.83848689544024e-05, "epoch": 0.08112599979225096, "percentage": 8.11, "elapsed_time": "5:53:33", "remaining_time": "2 days, 18:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 9627, "loss": 1.8185, "learning_rate": 9.83807527319478e-05, "epoch": 0.0812298743118313, "percentage": 8.12, "elapsed_time": "5:54:02", "remaining_time": "2 days, 18:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 783, "total_steps": 9627, "loss": 1.8079, "learning_rate": 9.837663135732045e-05, "epoch": 0.08133374883141166, "percentage": 8.13, "elapsed_time": "5:54:31", "remaining_time": "2 days, 18:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 9627, "loss": 1.7167, "learning_rate": 9.83725048309592e-05, "epoch": 0.081437623350992, "percentage": 8.14, "elapsed_time": "5:54:59", "remaining_time": "2 days, 18:44:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 9627, "loss": 1.8118, "learning_rate": 9.83683731533035e-05, "epoch": 0.08154149787057235, "percentage": 8.15, "elapsed_time": "5:55:28", "remaining_time": "2 days, 18:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 9627, "loss": 1.7767, "learning_rate": 9.836423632479335e-05, "epoch": 0.0816453723901527, "percentage": 8.16, "elapsed_time": "5:55:56", "remaining_time": "2 days, 18:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 787, "total_steps": 9627, "loss": 1.9734, "learning_rate": 9.836009434586929e-05, "epoch": 0.08174924690973304, "percentage": 8.17, "elapsed_time": "5:56:25", "remaining_time": "2 days, 18:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 9627, "loss": 1.8049, "learning_rate": 9.835594721697241e-05, "epoch": 0.08185312142931339, "percentage": 8.19, "elapsed_time": "5:56:53", "remaining_time": "2 days, 18:43:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 789, "total_steps": 9627, "loss": 1.8358, "learning_rate": 9.835179493854433e-05, "epoch": 0.08195699594889373, "percentage": 8.2, "elapsed_time": "5:57:22", "remaining_time": "2 days, 18:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 9627, "loss": 1.6816, "learning_rate": 9.834763751102726e-05, "epoch": 0.08206087046847409, "percentage": 8.21, "elapsed_time": "5:57:50", "remaining_time": "2 days, 18:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 791, "total_steps": 9627, "loss": 1.8448, "learning_rate": 9.834347493486391e-05, "epoch": 0.08216474498805443, "percentage": 8.22, "elapsed_time": "5:58:20", "remaining_time": "2 days, 18:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 9627, "loss": 1.9219, "learning_rate": 9.833930721049758e-05, "epoch": 0.08226861950763478, "percentage": 8.23, "elapsed_time": "5:58:48", "remaining_time": "2 days, 18:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 793, "total_steps": 9627, "loss": 2.0203, "learning_rate": 9.833513433837209e-05, "epoch": 0.08237249402721512, "percentage": 8.24, "elapsed_time": "5:59:16", "remaining_time": "2 days, 18:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 9627, "loss": 1.5018, "learning_rate": 9.833095631893183e-05, "epoch": 0.08247636854679546, "percentage": 8.25, "elapsed_time": "5:59:46", "remaining_time": "2 days, 18:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 9627, "loss": 1.9229, "learning_rate": 9.832677315262171e-05, "epoch": 0.08258024306637582, "percentage": 8.26, "elapsed_time": "6:00:14", "remaining_time": "2 days, 18:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 9627, "loss": 1.8676, "learning_rate": 9.832258483988721e-05, "epoch": 0.08268411758595616, "percentage": 8.27, "elapsed_time": "6:00:44", "remaining_time": "2 days, 18:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 797, "total_steps": 9627, "loss": 1.8478, "learning_rate": 9.831839138117435e-05, "epoch": 0.08278799210553651, "percentage": 8.28, "elapsed_time": "6:01:11", "remaining_time": "2 days, 18:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 9627, "loss": 1.7087, "learning_rate": 9.831419277692972e-05, "epoch": 0.08289186662511686, "percentage": 8.29, "elapsed_time": "6:01:40", "remaining_time": "2 days, 18:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 799, "total_steps": 9627, "loss": 1.8661, "learning_rate": 9.830998902760043e-05, "epoch": 0.08299574114469721, "percentage": 8.3, "elapsed_time": "6:02:10", "remaining_time": "2 days, 18:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 9627, "loss": 1.8653, "learning_rate": 9.830578013363411e-05, "epoch": 0.08309961566427755, "percentage": 8.31, "elapsed_time": "6:02:37", "remaining_time": "2 days, 18:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 801, "total_steps": 9627, "loss": 1.8252, "learning_rate": 9.830156609547905e-05, "epoch": 0.0832034901838579, "percentage": 8.32, "elapsed_time": "6:03:06", "remaining_time": "2 days, 18:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 9627, "loss": 1.8055, "learning_rate": 9.829734691358393e-05, "epoch": 0.08330736470343825, "percentage": 8.33, "elapsed_time": "6:03:36", "remaining_time": "2 days, 18:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 803, "total_steps": 9627, "loss": 1.7022, "learning_rate": 9.829312258839811e-05, "epoch": 0.08341123922301859, "percentage": 8.34, "elapsed_time": "6:04:04", "remaining_time": "2 days, 18:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 9627, "loss": 2.0613, "learning_rate": 9.828889312037143e-05, "epoch": 0.08351511374259894, "percentage": 8.35, "elapsed_time": "6:04:32", "remaining_time": "2 days, 18:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 9627, "loss": 1.973, "learning_rate": 9.828465850995433e-05, "epoch": 0.08361898826217928, "percentage": 8.36, "elapsed_time": "6:05:02", "remaining_time": "2 days, 18:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 9627, "loss": 1.8557, "learning_rate": 9.82804187575977e-05, "epoch": 0.08372286278175964, "percentage": 8.37, "elapsed_time": "6:05:29", "remaining_time": "2 days, 18:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 807, "total_steps": 9627, "loss": 1.9153, "learning_rate": 9.827617386375307e-05, "epoch": 0.08382673730133998, "percentage": 8.38, "elapsed_time": "6:05:59", "remaining_time": "2 days, 18:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 9627, "loss": 1.8209, "learning_rate": 9.827192382887251e-05, "epoch": 0.08393061182092033, "percentage": 8.39, "elapsed_time": "6:06:28", "remaining_time": "2 days, 18:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 809, "total_steps": 9627, "loss": 1.6632, "learning_rate": 9.82676686534086e-05, "epoch": 0.08403448634050067, "percentage": 8.4, "elapsed_time": "6:06:58", "remaining_time": "2 days, 18:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 9627, "loss": 1.7217, "learning_rate": 9.826340833781447e-05, "epoch": 0.08413836086008102, "percentage": 8.41, "elapsed_time": "6:07:25", "remaining_time": "2 days, 18:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 811, "total_steps": 9627, "loss": 1.9889, "learning_rate": 9.825914288254383e-05, "epoch": 0.08424223537966137, "percentage": 8.42, "elapsed_time": "6:07:55", "remaining_time": "2 days, 18:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 9627, "loss": 1.7551, "learning_rate": 9.82548722880509e-05, "epoch": 0.08434610989924171, "percentage": 8.43, "elapsed_time": "6:08:23", "remaining_time": "2 days, 18:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 813, "total_steps": 9627, "loss": 1.5998, "learning_rate": 9.825059655479047e-05, "epoch": 0.08444998441882207, "percentage": 8.44, "elapsed_time": "6:08:53", "remaining_time": "2 days, 18:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 9627, "loss": 1.93, "learning_rate": 9.82463156832179e-05, "epoch": 0.08455385893840241, "percentage": 8.46, "elapsed_time": "6:09:20", "remaining_time": "2 days, 18:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 9627, "loss": 1.7851, "learning_rate": 9.824202967378903e-05, "epoch": 0.08465773345798276, "percentage": 8.47, "elapsed_time": "6:09:51", "remaining_time": "2 days, 18:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 9627, "loss": 1.7856, "learning_rate": 9.82377385269603e-05, "epoch": 0.0847616079775631, "percentage": 8.48, "elapsed_time": "6:10:20", "remaining_time": "2 days, 18:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 817, "total_steps": 9627, "loss": 1.7032, "learning_rate": 9.823344224318869e-05, "epoch": 0.08486548249714346, "percentage": 8.49, "elapsed_time": "6:10:48", "remaining_time": "2 days, 18:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 9627, "loss": 1.8525, "learning_rate": 9.822914082293171e-05, "epoch": 0.0849693570167238, "percentage": 8.5, "elapsed_time": "6:11:17", "remaining_time": "2 days, 18:38:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 819, "total_steps": 9627, "loss": 1.8626, "learning_rate": 9.822483426664744e-05, "epoch": 0.08507323153630414, "percentage": 8.51, "elapsed_time": "6:11:45", "remaining_time": "2 days, 18:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 9627, "loss": 1.7556, "learning_rate": 9.822052257479448e-05, "epoch": 0.0851771060558845, "percentage": 8.52, "elapsed_time": "6:12:13", "remaining_time": "2 days, 18:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 821, "total_steps": 9627, "loss": 1.713, "learning_rate": 9.821620574783202e-05, "epoch": 0.08528098057546483, "percentage": 8.53, "elapsed_time": "6:12:43", "remaining_time": "2 days, 18:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 9627, "loss": 2.0036, "learning_rate": 9.821188378621973e-05, "epoch": 0.08538485509504519, "percentage": 8.54, "elapsed_time": "6:13:11", "remaining_time": "2 days, 18:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 823, "total_steps": 9627, "loss": 1.8456, "learning_rate": 9.820755669041787e-05, "epoch": 0.08548872961462553, "percentage": 8.55, "elapsed_time": "6:13:40", "remaining_time": "2 days, 18:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 9627, "loss": 1.6277, "learning_rate": 9.820322446088729e-05, "epoch": 0.08559260413420589, "percentage": 8.56, "elapsed_time": "6:14:10", "remaining_time": "2 days, 18:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 9627, "loss": 1.8758, "learning_rate": 9.819888709808929e-05, "epoch": 0.08569647865378623, "percentage": 8.57, "elapsed_time": "6:14:38", "remaining_time": "2 days, 18:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 9627, "loss": 1.8693, "learning_rate": 9.819454460248578e-05, "epoch": 0.08580035317336657, "percentage": 8.58, "elapsed_time": "6:15:07", "remaining_time": "2 days, 18:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 827, "total_steps": 9627, "loss": 1.8883, "learning_rate": 9.81901969745392e-05, "epoch": 0.08590422769294692, "percentage": 8.59, "elapsed_time": "6:15:35", "remaining_time": "2 days, 18:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 9627, "loss": 1.7379, "learning_rate": 9.818584421471254e-05, "epoch": 0.08600810221252726, "percentage": 8.6, "elapsed_time": "6:16:05", "remaining_time": "2 days, 18:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 829, "total_steps": 9627, "loss": 1.67, "learning_rate": 9.818148632346934e-05, "epoch": 0.08611197673210762, "percentage": 8.61, "elapsed_time": "6:16:34", "remaining_time": "2 days, 18:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 9627, "loss": 1.9572, "learning_rate": 9.817712330127367e-05, "epoch": 0.08621585125168796, "percentage": 8.62, "elapsed_time": "6:17:03", "remaining_time": "2 days, 18:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 831, "total_steps": 9627, "loss": 1.7383, "learning_rate": 9.817275514859017e-05, "epoch": 0.08631972577126831, "percentage": 8.63, "elapsed_time": "6:17:31", "remaining_time": "2 days, 18:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 9627, "loss": 1.9483, "learning_rate": 9.8168381865884e-05, "epoch": 0.08642360029084865, "percentage": 8.64, "elapsed_time": "6:18:01", "remaining_time": "2 days, 18:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 833, "total_steps": 9627, "loss": 1.7132, "learning_rate": 9.81640034536209e-05, "epoch": 0.08652747481042901, "percentage": 8.65, "elapsed_time": "6:18:29", "remaining_time": "2 days, 18:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 9627, "loss": 2.0216, "learning_rate": 9.815961991226711e-05, "epoch": 0.08663134933000935, "percentage": 8.66, "elapsed_time": "6:18:58", "remaining_time": "2 days, 18:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 9627, "loss": 1.7324, "learning_rate": 9.815523124228949e-05, "epoch": 0.08673522384958969, "percentage": 8.67, "elapsed_time": "6:19:27", "remaining_time": "2 days, 18:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 9627, "loss": 1.7634, "learning_rate": 9.815083744415534e-05, "epoch": 0.08683909836917005, "percentage": 8.68, "elapsed_time": "6:19:56", "remaining_time": "2 days, 18:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 837, "total_steps": 9627, "loss": 1.4646, "learning_rate": 9.81464385183326e-05, "epoch": 0.08694297288875039, "percentage": 8.69, "elapsed_time": "6:20:25", "remaining_time": "2 days, 18:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 9627, "loss": 1.3127, "learning_rate": 9.814203446528971e-05, "epoch": 0.08704684740833074, "percentage": 8.7, "elapsed_time": "6:20:55", "remaining_time": "2 days, 18:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 839, "total_steps": 9627, "loss": 1.9647, "learning_rate": 9.813762528549568e-05, "epoch": 0.08715072192791108, "percentage": 8.72, "elapsed_time": "6:21:23", "remaining_time": "2 days, 18:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 9627, "loss": 1.7981, "learning_rate": 9.813321097942005e-05, "epoch": 0.08725459644749144, "percentage": 8.73, "elapsed_time": "6:21:53", "remaining_time": "2 days, 18:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 841, "total_steps": 9627, "loss": 1.8632, "learning_rate": 9.812879154753289e-05, "epoch": 0.08735847096707178, "percentage": 8.74, "elapsed_time": "6:22:22", "remaining_time": "2 days, 18:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 9627, "loss": 1.653, "learning_rate": 9.812436699030486e-05, "epoch": 0.08746234548665212, "percentage": 8.75, "elapsed_time": "6:22:52", "remaining_time": "2 days, 18:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 843, "total_steps": 9627, "loss": 1.798, "learning_rate": 9.811993730820712e-05, "epoch": 0.08756622000623247, "percentage": 8.76, "elapsed_time": "6:23:20", "remaining_time": "2 days, 18:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 9627, "loss": 1.7409, "learning_rate": 9.811550250171142e-05, "epoch": 0.08767009452581281, "percentage": 8.77, "elapsed_time": "6:23:49", "remaining_time": "2 days, 18:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 9627, "loss": 1.8968, "learning_rate": 9.811106257129001e-05, "epoch": 0.08777396904539317, "percentage": 8.78, "elapsed_time": "6:24:17", "remaining_time": "2 days, 18:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 9627, "loss": 1.7981, "learning_rate": 9.810661751741573e-05, "epoch": 0.08787784356497351, "percentage": 8.79, "elapsed_time": "6:24:47", "remaining_time": "2 days, 18:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 847, "total_steps": 9627, "loss": 1.5857, "learning_rate": 9.810216734056192e-05, "epoch": 0.08798171808455386, "percentage": 8.8, "elapsed_time": "6:25:15", "remaining_time": "2 days, 18:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 9627, "loss": 1.7766, "learning_rate": 9.809771204120248e-05, "epoch": 0.0880855926041342, "percentage": 8.81, "elapsed_time": "6:25:45", "remaining_time": "2 days, 18:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 849, "total_steps": 9627, "loss": 1.6296, "learning_rate": 9.809325161981191e-05, "epoch": 0.08818946712371455, "percentage": 8.82, "elapsed_time": "6:26:13", "remaining_time": "2 days, 18:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 9627, "loss": 1.8433, "learning_rate": 9.808878607686518e-05, "epoch": 0.0882933416432949, "percentage": 8.83, "elapsed_time": "6:26:43", "remaining_time": "2 days, 18:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 851, "total_steps": 9627, "loss": 1.8521, "learning_rate": 9.808431541283783e-05, "epoch": 0.08839721616287524, "percentage": 8.84, "elapsed_time": "6:27:12", "remaining_time": "2 days, 18:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 9627, "loss": 2.0822, "learning_rate": 9.807983962820597e-05, "epoch": 0.0885010906824556, "percentage": 8.85, "elapsed_time": "6:27:41", "remaining_time": "2 days, 18:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 853, "total_steps": 9627, "loss": 1.8393, "learning_rate": 9.807535872344622e-05, "epoch": 0.08860496520203594, "percentage": 8.86, "elapsed_time": "6:28:10", "remaining_time": "2 days, 18:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 9627, "loss": 1.921, "learning_rate": 9.807087269903577e-05, "epoch": 0.08870883972161629, "percentage": 8.87, "elapsed_time": "6:28:38", "remaining_time": "2 days, 18:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 9627, "loss": 2.0497, "learning_rate": 9.806638155545236e-05, "epoch": 0.08881271424119663, "percentage": 8.88, "elapsed_time": "6:29:08", "remaining_time": "2 days, 18:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 9627, "loss": 1.849, "learning_rate": 9.806188529317423e-05, "epoch": 0.08891658876077699, "percentage": 8.89, "elapsed_time": "6:29:37", "remaining_time": "2 days, 18:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 857, "total_steps": 9627, "loss": 1.6662, "learning_rate": 9.805738391268021e-05, "epoch": 0.08902046328035733, "percentage": 8.9, "elapsed_time": "6:30:05", "remaining_time": "2 days, 18:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 9627, "loss": 1.5148, "learning_rate": 9.805287741444968e-05, "epoch": 0.08912433779993767, "percentage": 8.91, "elapsed_time": "6:30:33", "remaining_time": "2 days, 18:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 859, "total_steps": 9627, "loss": 1.9624, "learning_rate": 9.804836579896253e-05, "epoch": 0.08922821231951802, "percentage": 8.92, "elapsed_time": "6:31:04", "remaining_time": "2 days, 18:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 9627, "loss": 1.7757, "learning_rate": 9.80438490666992e-05, "epoch": 0.08933208683909837, "percentage": 8.93, "elapsed_time": "6:31:32", "remaining_time": "2 days, 18:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 861, "total_steps": 9627, "loss": 1.692, "learning_rate": 9.803932721814071e-05, "epoch": 0.08943596135867872, "percentage": 8.94, "elapsed_time": "6:32:03", "remaining_time": "2 days, 18:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 9627, "loss": 1.8445, "learning_rate": 9.803480025376858e-05, "epoch": 0.08953983587825906, "percentage": 8.95, "elapsed_time": "6:32:30", "remaining_time": "2 days, 18:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 863, "total_steps": 9627, "loss": 1.8338, "learning_rate": 9.803026817406493e-05, "epoch": 0.08964371039783942, "percentage": 8.96, "elapsed_time": "6:33:01", "remaining_time": "2 days, 18:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 9627, "loss": 1.7572, "learning_rate": 9.802573097951235e-05, "epoch": 0.08974758491741976, "percentage": 8.97, "elapsed_time": "6:33:30", "remaining_time": "2 days, 18:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 9627, "loss": 1.8358, "learning_rate": 9.802118867059407e-05, "epoch": 0.0898514594370001, "percentage": 8.99, "elapsed_time": "6:33:58", "remaining_time": "2 days, 18:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 9627, "loss": 1.8347, "learning_rate": 9.801664124779373e-05, "epoch": 0.08995533395658045, "percentage": 9.0, "elapsed_time": "6:34:28", "remaining_time": "2 days, 18:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 867, "total_steps": 9627, "loss": 1.8158, "learning_rate": 9.801208871159567e-05, "epoch": 0.09005920847616079, "percentage": 9.01, "elapsed_time": "6:34:57", "remaining_time": "2 days, 18:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 9627, "loss": 1.9947, "learning_rate": 9.800753106248468e-05, "epoch": 0.09016308299574115, "percentage": 9.02, "elapsed_time": "6:35:26", "remaining_time": "2 days, 18:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 869, "total_steps": 9627, "loss": 1.7856, "learning_rate": 9.800296830094609e-05, "epoch": 0.09026695751532149, "percentage": 9.03, "elapsed_time": "6:35:56", "remaining_time": "2 days, 18:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 9627, "loss": 1.7665, "learning_rate": 9.79984004274658e-05, "epoch": 0.09037083203490184, "percentage": 9.04, "elapsed_time": "6:36:25", "remaining_time": "2 days, 18:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 871, "total_steps": 9627, "loss": 1.715, "learning_rate": 9.799382744253029e-05, "epoch": 0.09047470655448218, "percentage": 9.05, "elapsed_time": "6:36:53", "remaining_time": "2 days, 18:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 9627, "loss": 1.7945, "learning_rate": 9.79892493466265e-05, "epoch": 0.09057858107406254, "percentage": 9.06, "elapsed_time": "6:37:22", "remaining_time": "2 days, 18:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 873, "total_steps": 9627, "loss": 1.7249, "learning_rate": 9.7984666140242e-05, "epoch": 0.09068245559364288, "percentage": 9.07, "elapsed_time": "6:37:52", "remaining_time": "2 days, 18:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 9627, "loss": 1.6934, "learning_rate": 9.798007782386485e-05, "epoch": 0.09078633011322322, "percentage": 9.08, "elapsed_time": "6:38:21", "remaining_time": "2 days, 18:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 9627, "loss": 1.9192, "learning_rate": 9.797548439798368e-05, "epoch": 0.09089020463280358, "percentage": 9.09, "elapsed_time": "6:38:49", "remaining_time": "2 days, 18:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 9627, "loss": 1.9863, "learning_rate": 9.797088586308762e-05, "epoch": 0.09099407915238392, "percentage": 9.1, "elapsed_time": "6:39:19", "remaining_time": "2 days, 18:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 877, "total_steps": 9627, "loss": 1.6311, "learning_rate": 9.796628221966642e-05, "epoch": 0.09109795367196427, "percentage": 9.11, "elapsed_time": "6:39:47", "remaining_time": "2 days, 18:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 9627, "loss": 1.6965, "learning_rate": 9.796167346821032e-05, "epoch": 0.09120182819154461, "percentage": 9.12, "elapsed_time": "6:40:16", "remaining_time": "2 days, 18:28:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 879, "total_steps": 9627, "loss": 1.745, "learning_rate": 9.79570596092101e-05, "epoch": 0.09130570271112497, "percentage": 9.13, "elapsed_time": "6:40:46", "remaining_time": "2 days, 18:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 9627, "loss": 1.886, "learning_rate": 9.795244064315712e-05, "epoch": 0.09140957723070531, "percentage": 9.14, "elapsed_time": "6:41:14", "remaining_time": "2 days, 18:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 881, "total_steps": 9627, "loss": 1.8935, "learning_rate": 9.794781657054324e-05, "epoch": 0.09151345175028565, "percentage": 9.15, "elapsed_time": "6:41:44", "remaining_time": "2 days, 18:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 9627, "loss": 1.9279, "learning_rate": 9.794318739186092e-05, "epoch": 0.091617326269866, "percentage": 9.16, "elapsed_time": "6:42:12", "remaining_time": "2 days, 18:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 883, "total_steps": 9627, "loss": 1.9028, "learning_rate": 9.79385531076031e-05, "epoch": 0.09172120078944634, "percentage": 9.17, "elapsed_time": "6:42:41", "remaining_time": "2 days, 18:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 9627, "loss": 1.9369, "learning_rate": 9.793391371826332e-05, "epoch": 0.0918250753090267, "percentage": 9.18, "elapsed_time": "6:43:09", "remaining_time": "2 days, 18:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 9627, "loss": 1.9072, "learning_rate": 9.792926922433563e-05, "epoch": 0.09192894982860704, "percentage": 9.19, "elapsed_time": "6:43:39", "remaining_time": "2 days, 18:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 9627, "loss": 1.6753, "learning_rate": 9.792461962631462e-05, "epoch": 0.0920328243481874, "percentage": 9.2, "elapsed_time": "6:44:07", "remaining_time": "2 days, 18:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 887, "total_steps": 9627, "loss": 1.8044, "learning_rate": 9.791996492469544e-05, "epoch": 0.09213669886776774, "percentage": 9.21, "elapsed_time": "6:44:36", "remaining_time": "2 days, 18:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 9627, "loss": 1.6905, "learning_rate": 9.79153051199738e-05, "epoch": 0.09224057338734809, "percentage": 9.22, "elapsed_time": "6:45:05", "remaining_time": "2 days, 18:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 889, "total_steps": 9627, "loss": 1.9002, "learning_rate": 9.791064021264591e-05, "epoch": 0.09234444790692843, "percentage": 9.23, "elapsed_time": "6:45:33", "remaining_time": "2 days, 18:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 9627, "loss": 1.8316, "learning_rate": 9.790597020320856e-05, "epoch": 0.09244832242650877, "percentage": 9.24, "elapsed_time": "6:46:03", "remaining_time": "2 days, 18:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 891, "total_steps": 9627, "loss": 1.7874, "learning_rate": 9.790129509215907e-05, "epoch": 0.09255219694608913, "percentage": 9.26, "elapsed_time": "6:46:32", "remaining_time": "2 days, 18:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 9627, "loss": 1.8666, "learning_rate": 9.789661487999528e-05, "epoch": 0.09265607146566947, "percentage": 9.27, "elapsed_time": "6:47:00", "remaining_time": "2 days, 18:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 893, "total_steps": 9627, "loss": 2.0314, "learning_rate": 9.789192956721563e-05, "epoch": 0.09275994598524982, "percentage": 9.28, "elapsed_time": "6:47:29", "remaining_time": "2 days, 18:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 9627, "loss": 1.6938, "learning_rate": 9.788723915431905e-05, "epoch": 0.09286382050483016, "percentage": 9.29, "elapsed_time": "6:47:57", "remaining_time": "2 days, 18:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 9627, "loss": 1.9863, "learning_rate": 9.788254364180503e-05, "epoch": 0.09296769502441052, "percentage": 9.3, "elapsed_time": "6:48:26", "remaining_time": "2 days, 18:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 9627, "loss": 1.7899, "learning_rate": 9.78778430301736e-05, "epoch": 0.09307156954399086, "percentage": 9.31, "elapsed_time": "6:48:55", "remaining_time": "2 days, 18:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 897, "total_steps": 9627, "loss": 1.8823, "learning_rate": 9.787313731992537e-05, "epoch": 0.0931754440635712, "percentage": 9.32, "elapsed_time": "6:49:23", "remaining_time": "2 days, 18:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 9627, "loss": 1.8849, "learning_rate": 9.786842651156143e-05, "epoch": 0.09327931858315155, "percentage": 9.33, "elapsed_time": "6:49:51", "remaining_time": "2 days, 18:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 899, "total_steps": 9627, "loss": 1.7419, "learning_rate": 9.786371060558346e-05, "epoch": 0.0933831931027319, "percentage": 9.34, "elapsed_time": "6:50:21", "remaining_time": "2 days, 18:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 9627, "loss": 1.9191, "learning_rate": 9.785898960249364e-05, "epoch": 0.09348706762231225, "percentage": 9.35, "elapsed_time": "6:50:49", "remaining_time": "2 days, 18:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 901, "total_steps": 9627, "loss": 1.8023, "learning_rate": 9.785426350279477e-05, "epoch": 0.09359094214189259, "percentage": 9.36, "elapsed_time": "6:51:19", "remaining_time": "2 days, 18:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 9627, "loss": 1.9383, "learning_rate": 9.78495323069901e-05, "epoch": 0.09369481666147295, "percentage": 9.37, "elapsed_time": "6:51:47", "remaining_time": "2 days, 18:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 903, "total_steps": 9627, "loss": 1.8187, "learning_rate": 9.784479601558348e-05, "epoch": 0.09379869118105329, "percentage": 9.38, "elapsed_time": "6:52:15", "remaining_time": "2 days, 18:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 9627, "loss": 1.5762, "learning_rate": 9.78400546290793e-05, "epoch": 0.09390256570063363, "percentage": 9.39, "elapsed_time": "6:52:45", "remaining_time": "2 days, 18:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 9627, "loss": 1.8772, "learning_rate": 9.783530814798245e-05, "epoch": 0.09400644022021398, "percentage": 9.4, "elapsed_time": "6:53:12", "remaining_time": "2 days, 18:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 9627, "loss": 1.7432, "learning_rate": 9.783055657279843e-05, "epoch": 0.09411031473979432, "percentage": 9.41, "elapsed_time": "6:53:42", "remaining_time": "2 days, 18:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 907, "total_steps": 9627, "loss": 1.7051, "learning_rate": 9.782579990403321e-05, "epoch": 0.09421418925937468, "percentage": 9.42, "elapsed_time": "6:54:10", "remaining_time": "2 days, 18:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 9627, "loss": 1.7051, "learning_rate": 9.782103814219337e-05, "epoch": 0.09431806377895502, "percentage": 9.43, "elapsed_time": "6:54:38", "remaining_time": "2 days, 18:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 909, "total_steps": 9627, "loss": 2.0238, "learning_rate": 9.781627128778598e-05, "epoch": 0.09442193829853537, "percentage": 9.44, "elapsed_time": "6:55:08", "remaining_time": "2 days, 18:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 9627, "loss": 1.6112, "learning_rate": 9.781149934131868e-05, "epoch": 0.09452581281811571, "percentage": 9.45, "elapsed_time": "6:55:36", "remaining_time": "2 days, 18:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 911, "total_steps": 9627, "loss": 1.7238, "learning_rate": 9.780672230329964e-05, "epoch": 0.09462968733769607, "percentage": 9.46, "elapsed_time": "6:56:05", "remaining_time": "2 days, 18:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 9627, "loss": 1.8491, "learning_rate": 9.780194017423758e-05, "epoch": 0.09473356185727641, "percentage": 9.47, "elapsed_time": "6:56:33", "remaining_time": "2 days, 18:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 913, "total_steps": 9627, "loss": 1.666, "learning_rate": 9.779715295464178e-05, "epoch": 0.09483743637685675, "percentage": 9.48, "elapsed_time": "6:57:01", "remaining_time": "2 days, 18:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 9627, "loss": 1.8345, "learning_rate": 9.779236064502201e-05, "epoch": 0.0949413108964371, "percentage": 9.49, "elapsed_time": "6:57:31", "remaining_time": "2 days, 18:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 9627, "loss": 1.7373, "learning_rate": 9.778756324588863e-05, "epoch": 0.09504518541601745, "percentage": 9.5, "elapsed_time": "6:57:58", "remaining_time": "2 days, 18:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 9627, "loss": 1.9764, "learning_rate": 9.778276075775251e-05, "epoch": 0.0951490599355978, "percentage": 9.51, "elapsed_time": "6:58:28", "remaining_time": "2 days, 18:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 917, "total_steps": 9627, "loss": 1.8864, "learning_rate": 9.77779531811251e-05, "epoch": 0.09525293445517814, "percentage": 9.53, "elapsed_time": "6:58:56", "remaining_time": "2 days, 18:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 9627, "loss": 1.8929, "learning_rate": 9.777314051651836e-05, "epoch": 0.0953568089747585, "percentage": 9.54, "elapsed_time": "6:59:25", "remaining_time": "2 days, 18:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 919, "total_steps": 9627, "loss": 1.8455, "learning_rate": 9.776832276444479e-05, "epoch": 0.09546068349433884, "percentage": 9.55, "elapsed_time": "6:59:54", "remaining_time": "2 days, 18:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 9627, "loss": 1.7881, "learning_rate": 9.776349992541746e-05, "epoch": 0.09556455801391918, "percentage": 9.56, "elapsed_time": "7:00:22", "remaining_time": "2 days, 18:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 921, "total_steps": 9627, "loss": 1.9618, "learning_rate": 9.775867199994994e-05, "epoch": 0.09566843253349953, "percentage": 9.57, "elapsed_time": "7:00:52", "remaining_time": "2 days, 18:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 9627, "loss": 1.9835, "learning_rate": 9.775383898855641e-05, "epoch": 0.09577230705307987, "percentage": 9.58, "elapsed_time": "7:01:19", "remaining_time": "2 days, 18:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 923, "total_steps": 9627, "loss": 1.6711, "learning_rate": 9.77490008917515e-05, "epoch": 0.09587618157266023, "percentage": 9.59, "elapsed_time": "7:01:49", "remaining_time": "2 days, 18:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 9627, "loss": 1.7854, "learning_rate": 9.774415771005048e-05, "epoch": 0.09598005609224057, "percentage": 9.6, "elapsed_time": "7:02:17", "remaining_time": "2 days, 18:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 9627, "loss": 1.8105, "learning_rate": 9.773930944396905e-05, "epoch": 0.09608393061182093, "percentage": 9.61, "elapsed_time": "7:02:46", "remaining_time": "2 days, 18:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 9627, "loss": 1.8127, "learning_rate": 9.773445609402356e-05, "epoch": 0.09618780513140127, "percentage": 9.62, "elapsed_time": "7:03:14", "remaining_time": "2 days, 18:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 927, "total_steps": 9627, "loss": 1.8921, "learning_rate": 9.772959766073084e-05, "epoch": 0.09629167965098162, "percentage": 9.63, "elapsed_time": "7:03:43", "remaining_time": "2 days, 18:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 9627, "loss": 1.8411, "learning_rate": 9.772473414460828e-05, "epoch": 0.09639555417056196, "percentage": 9.64, "elapsed_time": "7:04:11", "remaining_time": "2 days, 18:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 929, "total_steps": 9627, "loss": 1.6894, "learning_rate": 9.77198655461738e-05, "epoch": 0.0964994286901423, "percentage": 9.65, "elapsed_time": "7:04:41", "remaining_time": "2 days, 18:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 9627, "loss": 1.8592, "learning_rate": 9.771499186594586e-05, "epoch": 0.09660330320972266, "percentage": 9.66, "elapsed_time": "7:05:09", "remaining_time": "2 days, 18:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 931, "total_steps": 9627, "loss": 1.6941, "learning_rate": 9.771011310444348e-05, "epoch": 0.096707177729303, "percentage": 9.67, "elapsed_time": "7:05:38", "remaining_time": "2 days, 18:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 9627, "loss": 1.7519, "learning_rate": 9.770522926218622e-05, "epoch": 0.09681105224888335, "percentage": 9.68, "elapsed_time": "7:06:06", "remaining_time": "2 days, 18:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 933, "total_steps": 9627, "loss": 1.9341, "learning_rate": 9.770034033969413e-05, "epoch": 0.0969149267684637, "percentage": 9.69, "elapsed_time": "7:06:36", "remaining_time": "2 days, 18:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 9627, "loss": 1.8773, "learning_rate": 9.769544633748789e-05, "epoch": 0.09701880128804405, "percentage": 9.7, "elapsed_time": "7:07:04", "remaining_time": "2 days, 18:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 9627, "loss": 1.9544, "learning_rate": 9.769054725608867e-05, "epoch": 0.09712267580762439, "percentage": 9.71, "elapsed_time": "7:07:33", "remaining_time": "2 days, 18:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 9627, "loss": 2.0178, "learning_rate": 9.768564309601813e-05, "epoch": 0.09722655032720473, "percentage": 9.72, "elapsed_time": "7:08:01", "remaining_time": "2 days, 18:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 937, "total_steps": 9627, "loss": 1.6323, "learning_rate": 9.768073385779859e-05, "epoch": 0.09733042484678509, "percentage": 9.73, "elapsed_time": "7:08:30", "remaining_time": "2 days, 18:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 9627, "loss": 1.8568, "learning_rate": 9.76758195419528e-05, "epoch": 0.09743429936636543, "percentage": 9.74, "elapsed_time": "7:08:58", "remaining_time": "2 days, 18:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 939, "total_steps": 9627, "loss": 1.6446, "learning_rate": 9.767090014900413e-05, "epoch": 0.09753817388594578, "percentage": 9.75, "elapsed_time": "7:09:28", "remaining_time": "2 days, 18:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 9627, "loss": 1.7432, "learning_rate": 9.766597567947644e-05, "epoch": 0.09764204840552612, "percentage": 9.76, "elapsed_time": "7:09:55", "remaining_time": "2 days, 18:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 941, "total_steps": 9627, "loss": 1.8066, "learning_rate": 9.766104613389413e-05, "epoch": 0.09774592292510648, "percentage": 9.77, "elapsed_time": "7:10:25", "remaining_time": "2 days, 18:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 9627, "loss": 1.8682, "learning_rate": 9.76561115127822e-05, "epoch": 0.09784979744468682, "percentage": 9.78, "elapsed_time": "7:10:52", "remaining_time": "2 days, 18:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 943, "total_steps": 9627, "loss": 1.8556, "learning_rate": 9.765117181666612e-05, "epoch": 0.09795367196426717, "percentage": 9.8, "elapsed_time": "7:11:22", "remaining_time": "2 days, 18:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 9627, "loss": 1.8249, "learning_rate": 9.764622704607193e-05, "epoch": 0.09805754648384751, "percentage": 9.81, "elapsed_time": "7:11:49", "remaining_time": "2 days, 18:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 9627, "loss": 1.7983, "learning_rate": 9.764127720152623e-05, "epoch": 0.09816142100342785, "percentage": 9.82, "elapsed_time": "7:12:19", "remaining_time": "2 days, 18:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 9627, "loss": 1.8482, "learning_rate": 9.763632228355611e-05, "epoch": 0.09826529552300821, "percentage": 9.83, "elapsed_time": "7:12:47", "remaining_time": "2 days, 18:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 947, "total_steps": 9627, "loss": 1.9735, "learning_rate": 9.763136229268924e-05, "epoch": 0.09836917004258855, "percentage": 9.84, "elapsed_time": "7:13:16", "remaining_time": "2 days, 18:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 9627, "loss": 1.8289, "learning_rate": 9.762639722945384e-05, "epoch": 0.0984730445621689, "percentage": 9.85, "elapsed_time": "7:13:44", "remaining_time": "2 days, 18:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 949, "total_steps": 9627, "loss": 1.6953, "learning_rate": 9.762142709437863e-05, "epoch": 0.09857691908174925, "percentage": 9.86, "elapsed_time": "7:14:13", "remaining_time": "2 days, 18:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 9627, "loss": 1.9994, "learning_rate": 9.76164518879929e-05, "epoch": 0.0986807936013296, "percentage": 9.87, "elapsed_time": "7:14:42", "remaining_time": "2 days, 18:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 951, "total_steps": 9627, "loss": 1.7591, "learning_rate": 9.761147161082644e-05, "epoch": 0.09878466812090994, "percentage": 9.88, "elapsed_time": "7:15:11", "remaining_time": "2 days, 18:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 9627, "loss": 1.8883, "learning_rate": 9.760648626340965e-05, "epoch": 0.09888854264049028, "percentage": 9.89, "elapsed_time": "7:15:39", "remaining_time": "2 days, 18:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 953, "total_steps": 9627, "loss": 1.7859, "learning_rate": 9.760149584627343e-05, "epoch": 0.09899241716007064, "percentage": 9.9, "elapsed_time": "7:16:08", "remaining_time": "2 days, 18:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 9627, "loss": 1.9948, "learning_rate": 9.759650035994921e-05, "epoch": 0.09909629167965098, "percentage": 9.91, "elapsed_time": "7:16:37", "remaining_time": "2 days, 18:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 9627, "loss": 1.8239, "learning_rate": 9.759149980496896e-05, "epoch": 0.09920016619923133, "percentage": 9.92, "elapsed_time": "7:17:05", "remaining_time": "2 days, 18:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 9627, "loss": 1.8389, "learning_rate": 9.758649418186521e-05, "epoch": 0.09930404071881167, "percentage": 9.93, "elapsed_time": "7:17:35", "remaining_time": "2 days, 18:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 957, "total_steps": 9627, "loss": 1.9304, "learning_rate": 9.758148349117101e-05, "epoch": 0.09940791523839203, "percentage": 9.94, "elapsed_time": "7:18:02", "remaining_time": "2 days, 18:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 9627, "loss": 1.9184, "learning_rate": 9.757646773341998e-05, "epoch": 0.09951178975797237, "percentage": 9.95, "elapsed_time": "7:18:32", "remaining_time": "2 days, 18:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 959, "total_steps": 9627, "loss": 1.8935, "learning_rate": 9.757144690914624e-05, "epoch": 0.09961566427755271, "percentage": 9.96, "elapsed_time": "7:19:00", "remaining_time": "2 days, 18:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 9627, "loss": 1.8969, "learning_rate": 9.756642101888448e-05, "epoch": 0.09971953879713306, "percentage": 9.97, "elapsed_time": "7:19:28", "remaining_time": "2 days, 18:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 961, "total_steps": 9627, "loss": 1.7702, "learning_rate": 9.756139006316991e-05, "epoch": 0.0998234133167134, "percentage": 9.98, "elapsed_time": "7:19:57", "remaining_time": "2 days, 18:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 9627, "loss": 1.6524, "learning_rate": 9.755635404253829e-05, "epoch": 0.09992728783629376, "percentage": 9.99, "elapsed_time": "7:20:25", "remaining_time": "2 days, 18:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 963, "total_steps": 9627, "loss": 1.701, "learning_rate": 9.755131295752593e-05, "epoch": 0.1000311623558741, "percentage": 10.0, "elapsed_time": "7:20:55", "remaining_time": "2 days, 18:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 9627, "loss": 1.8465, "learning_rate": 9.754626680866964e-05, "epoch": 0.10013503687545446, "percentage": 10.01, "elapsed_time": "7:21:23", "remaining_time": "2 days, 18:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 9627, "loss": 2.0038, "learning_rate": 9.754121559650681e-05, "epoch": 0.1002389113950348, "percentage": 10.02, "elapsed_time": "7:21:52", "remaining_time": "2 days, 18:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 9627, "loss": 2.1116, "learning_rate": 9.753615932157536e-05, "epoch": 0.10034278591461515, "percentage": 10.03, "elapsed_time": "7:22:20", "remaining_time": "2 days, 18:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 967, "total_steps": 9627, "loss": 1.9158, "learning_rate": 9.753109798441375e-05, "epoch": 0.10044666043419549, "percentage": 10.04, "elapsed_time": "7:22:49", "remaining_time": "2 days, 18:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 9627, "loss": 1.7587, "learning_rate": 9.752603158556095e-05, "epoch": 0.10055053495377583, "percentage": 10.06, "elapsed_time": "7:23:18", "remaining_time": "2 days, 18:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 969, "total_steps": 9627, "loss": 1.8125, "learning_rate": 9.752096012555652e-05, "epoch": 0.10065440947335619, "percentage": 10.07, "elapsed_time": "7:23:46", "remaining_time": "2 days, 18:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 9627, "loss": 1.9693, "learning_rate": 9.751588360494048e-05, "epoch": 0.10075828399293653, "percentage": 10.08, "elapsed_time": "7:24:16", "remaining_time": "2 days, 18:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 971, "total_steps": 9627, "loss": 1.7953, "learning_rate": 9.75108020242535e-05, "epoch": 0.10086215851251688, "percentage": 10.09, "elapsed_time": "7:24:43", "remaining_time": "2 days, 18:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 9627, "loss": 1.7753, "learning_rate": 9.75057153840367e-05, "epoch": 0.10096603303209722, "percentage": 10.1, "elapsed_time": "7:25:13", "remaining_time": "2 days, 18:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 973, "total_steps": 9627, "loss": 2.1136, "learning_rate": 9.750062368483176e-05, "epoch": 0.10106990755167758, "percentage": 10.11, "elapsed_time": "7:25:41", "remaining_time": "2 days, 18:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 9627, "loss": 1.7655, "learning_rate": 9.749552692718093e-05, "epoch": 0.10117378207125792, "percentage": 10.12, "elapsed_time": "7:26:10", "remaining_time": "2 days, 18:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 9627, "loss": 1.8326, "learning_rate": 9.749042511162696e-05, "epoch": 0.10127765659083826, "percentage": 10.13, "elapsed_time": "7:26:38", "remaining_time": "2 days, 18:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 9627, "loss": 1.7562, "learning_rate": 9.748531823871314e-05, "epoch": 0.10138153111041862, "percentage": 10.14, "elapsed_time": "7:27:07", "remaining_time": "2 days, 18:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 977, "total_steps": 9627, "loss": 1.7919, "learning_rate": 9.748020630898333e-05, "epoch": 0.10148540562999896, "percentage": 10.15, "elapsed_time": "7:27:36", "remaining_time": "2 days, 18:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 9627, "loss": 1.7349, "learning_rate": 9.747508932298192e-05, "epoch": 0.10158928014957931, "percentage": 10.16, "elapsed_time": "7:28:03", "remaining_time": "2 days, 18:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 979, "total_steps": 9627, "loss": 1.6836, "learning_rate": 9.746996728125382e-05, "epoch": 0.10169315466915965, "percentage": 10.17, "elapsed_time": "7:28:33", "remaining_time": "2 days, 18:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 9627, "loss": 1.6913, "learning_rate": 9.746484018434447e-05, "epoch": 0.10179702918874001, "percentage": 10.18, "elapsed_time": "7:29:01", "remaining_time": "2 days, 18:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 981, "total_steps": 9627, "loss": 2.2579, "learning_rate": 9.745970803279989e-05, "epoch": 0.10190090370832035, "percentage": 10.19, "elapsed_time": "7:29:30", "remaining_time": "2 days, 18:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 9627, "loss": 1.7616, "learning_rate": 9.74545708271666e-05, "epoch": 0.1020047782279007, "percentage": 10.2, "elapsed_time": "7:29:57", "remaining_time": "2 days, 18:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 983, "total_steps": 9627, "loss": 1.6341, "learning_rate": 9.744942856799169e-05, "epoch": 0.10210865274748104, "percentage": 10.21, "elapsed_time": "7:30:27", "remaining_time": "2 days, 18:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 9627, "loss": 2.0114, "learning_rate": 9.744428125582275e-05, "epoch": 0.10221252726706138, "percentage": 10.22, "elapsed_time": "7:30:55", "remaining_time": "2 days, 18:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 9627, "loss": 1.7651, "learning_rate": 9.743912889120791e-05, "epoch": 0.10231640178664174, "percentage": 10.23, "elapsed_time": "7:31:25", "remaining_time": "2 days, 18:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 9627, "loss": 2.0589, "learning_rate": 9.743397147469592e-05, "epoch": 0.10242027630622208, "percentage": 10.24, "elapsed_time": "7:31:53", "remaining_time": "2 days, 18:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 987, "total_steps": 9627, "loss": 1.8003, "learning_rate": 9.742880900683596e-05, "epoch": 0.10252415082580243, "percentage": 10.25, "elapsed_time": "7:32:21", "remaining_time": "2 days, 17:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 9627, "loss": 1.8546, "learning_rate": 9.742364148817777e-05, "epoch": 0.10262802534538278, "percentage": 10.26, "elapsed_time": "7:32:51", "remaining_time": "2 days, 17:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 989, "total_steps": 9627, "loss": 1.6446, "learning_rate": 9.74184689192717e-05, "epoch": 0.10273189986496313, "percentage": 10.27, "elapsed_time": "7:33:19", "remaining_time": "2 days, 17:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 9627, "loss": 2.0174, "learning_rate": 9.741329130066859e-05, "epoch": 0.10283577438454347, "percentage": 10.28, "elapsed_time": "7:33:49", "remaining_time": "2 days, 17:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 991, "total_steps": 9627, "loss": 1.9646, "learning_rate": 9.740810863291976e-05, "epoch": 0.10293964890412381, "percentage": 10.29, "elapsed_time": "7:34:17", "remaining_time": "2 days, 17:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 9627, "loss": 1.7112, "learning_rate": 9.740292091657718e-05, "epoch": 0.10304352342370417, "percentage": 10.3, "elapsed_time": "7:34:46", "remaining_time": "2 days, 17:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 993, "total_steps": 9627, "loss": 1.736, "learning_rate": 9.739772815219327e-05, "epoch": 0.10314739794328451, "percentage": 10.31, "elapsed_time": "7:35:14", "remaining_time": "2 days, 17:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 9627, "loss": 1.7482, "learning_rate": 9.739253034032103e-05, "epoch": 0.10325127246286486, "percentage": 10.33, "elapsed_time": "7:35:44", "remaining_time": "2 days, 17:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 9627, "loss": 1.9931, "learning_rate": 9.738732748151397e-05, "epoch": 0.1033551469824452, "percentage": 10.34, "elapsed_time": "7:36:12", "remaining_time": "2 days, 17:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 9627, "loss": 1.7324, "learning_rate": 9.738211957632619e-05, "epoch": 0.10345902150202556, "percentage": 10.35, "elapsed_time": "7:36:42", "remaining_time": "2 days, 17:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 997, "total_steps": 9627, "loss": 1.7277, "learning_rate": 9.737690662531227e-05, "epoch": 0.1035628960216059, "percentage": 10.36, "elapsed_time": "7:37:10", "remaining_time": "2 days, 17:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 9627, "loss": 1.8904, "learning_rate": 9.737168862902735e-05, "epoch": 0.10366677054118625, "percentage": 10.37, "elapsed_time": "7:37:39", "remaining_time": "2 days, 17:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 999, "total_steps": 9627, "loss": 1.898, "learning_rate": 9.736646558802709e-05, "epoch": 0.1037706450607666, "percentage": 10.38, "elapsed_time": "7:38:07", "remaining_time": "2 days, 17:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 9627, "loss": 1.9826, "learning_rate": 9.736123750286772e-05, "epoch": 0.10387451958034694, "percentage": 10.39, "elapsed_time": "7:38:37", "remaining_time": "2 days, 17:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1001, "total_steps": 9627, "loss": 1.6245, "learning_rate": 9.7356004374106e-05, "epoch": 0.10397839409992729, "percentage": 10.4, "elapsed_time": "7:39:06", "remaining_time": "2 days, 17:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 9627, "loss": 1.9813, "learning_rate": 9.735076620229919e-05, "epoch": 0.10408226861950763, "percentage": 10.41, "elapsed_time": "7:39:36", "remaining_time": "2 days, 17:56:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1003, "total_steps": 9627, "loss": 1.7119, "learning_rate": 9.734552298800513e-05, "epoch": 0.10418614313908799, "percentage": 10.42, "elapsed_time": "7:40:04", "remaining_time": "2 days, 17:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 9627, "loss": 1.8563, "learning_rate": 9.734027473178219e-05, "epoch": 0.10429001765866833, "percentage": 10.43, "elapsed_time": "7:40:33", "remaining_time": "2 days, 17:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 9627, "loss": 1.5552, "learning_rate": 9.733502143418925e-05, "epoch": 0.10439389217824868, "percentage": 10.44, "elapsed_time": "7:41:01", "remaining_time": "2 days, 17:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 9627, "loss": 1.6061, "learning_rate": 9.732976309578577e-05, "epoch": 0.10449776669782902, "percentage": 10.45, "elapsed_time": "7:41:32", "remaining_time": "2 days, 17:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1007, "total_steps": 9627, "loss": 2.0223, "learning_rate": 9.73244997171317e-05, "epoch": 0.10460164121740936, "percentage": 10.46, "elapsed_time": "7:42:00", "remaining_time": "2 days, 17:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 9627, "loss": 1.8512, "learning_rate": 9.731923129878754e-05, "epoch": 0.10470551573698972, "percentage": 10.47, "elapsed_time": "7:42:29", "remaining_time": "2 days, 17:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1009, "total_steps": 9627, "loss": 1.7601, "learning_rate": 9.731395784131437e-05, "epoch": 0.10480939025657006, "percentage": 10.48, "elapsed_time": "7:42:58", "remaining_time": "2 days, 17:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 9627, "loss": 1.7264, "learning_rate": 9.730867934527374e-05, "epoch": 0.10491326477615041, "percentage": 10.49, "elapsed_time": "7:43:27", "remaining_time": "2 days, 17:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1011, "total_steps": 9627, "loss": 1.8542, "learning_rate": 9.73033958112278e-05, "epoch": 0.10501713929573075, "percentage": 10.5, "elapsed_time": "7:43:56", "remaining_time": "2 days, 17:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 9627, "loss": 1.7967, "learning_rate": 9.729810723973917e-05, "epoch": 0.10512101381531111, "percentage": 10.51, "elapsed_time": "7:44:25", "remaining_time": "2 days, 17:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1013, "total_steps": 9627, "loss": 1.9559, "learning_rate": 9.729281363137106e-05, "epoch": 0.10522488833489145, "percentage": 10.52, "elapsed_time": "7:44:54", "remaining_time": "2 days, 17:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 9627, "loss": 1.8265, "learning_rate": 9.72875149866872e-05, "epoch": 0.10532876285447179, "percentage": 10.53, "elapsed_time": "7:45:23", "remaining_time": "2 days, 17:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 9627, "loss": 1.7892, "learning_rate": 9.728221130625186e-05, "epoch": 0.10543263737405215, "percentage": 10.54, "elapsed_time": "7:45:52", "remaining_time": "2 days, 17:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 9627, "loss": 1.7436, "learning_rate": 9.727690259062982e-05, "epoch": 0.10553651189363249, "percentage": 10.55, "elapsed_time": "7:46:20", "remaining_time": "2 days, 17:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1017, "total_steps": 9627, "loss": 2.0679, "learning_rate": 9.727158884038643e-05, "epoch": 0.10564038641321284, "percentage": 10.56, "elapsed_time": "7:46:49", "remaining_time": "2 days, 17:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 9627, "loss": 1.8322, "learning_rate": 9.726627005608756e-05, "epoch": 0.10574426093279318, "percentage": 10.57, "elapsed_time": "7:47:17", "remaining_time": "2 days, 17:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1019, "total_steps": 9627, "loss": 1.9986, "learning_rate": 9.726094623829962e-05, "epoch": 0.10584813545237354, "percentage": 10.58, "elapsed_time": "7:47:45", "remaining_time": "2 days, 17:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 9627, "loss": 1.8012, "learning_rate": 9.725561738758956e-05, "epoch": 0.10595200997195388, "percentage": 10.6, "elapsed_time": "7:48:15", "remaining_time": "2 days, 17:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1021, "total_steps": 9627, "loss": 1.859, "learning_rate": 9.725028350452485e-05, "epoch": 0.10605588449153423, "percentage": 10.61, "elapsed_time": "7:48:43", "remaining_time": "2 days, 17:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 9627, "loss": 1.6539, "learning_rate": 9.724494458967352e-05, "epoch": 0.10615975901111457, "percentage": 10.62, "elapsed_time": "7:49:13", "remaining_time": "2 days, 17:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1023, "total_steps": 9627, "loss": 1.6884, "learning_rate": 9.723960064360412e-05, "epoch": 0.10626363353069491, "percentage": 10.63, "elapsed_time": "7:49:41", "remaining_time": "2 days, 17:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 9627, "loss": 1.7554, "learning_rate": 9.72342516668857e-05, "epoch": 0.10636750805027527, "percentage": 10.64, "elapsed_time": "7:50:10", "remaining_time": "2 days, 17:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 9627, "loss": 1.7656, "learning_rate": 9.722889766008796e-05, "epoch": 0.10647138256985561, "percentage": 10.65, "elapsed_time": "7:50:39", "remaining_time": "2 days, 17:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1026, "total_steps": 9627, "loss": 1.8226, "learning_rate": 9.722353862378101e-05, "epoch": 0.10657525708943597, "percentage": 10.66, "elapsed_time": "7:51:07", "remaining_time": "2 days, 17:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1027, "total_steps": 9627, "loss": 1.6735, "learning_rate": 9.721817455853554e-05, "epoch": 0.1066791316090163, "percentage": 10.67, "elapsed_time": "7:51:37", "remaining_time": "2 days, 17:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1028, "total_steps": 9627, "loss": 1.6466, "learning_rate": 9.72128054649228e-05, "epoch": 0.10678300612859666, "percentage": 10.68, "elapsed_time": "7:52:04", "remaining_time": "2 days, 17:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1029, "total_steps": 9627, "loss": 1.8349, "learning_rate": 9.720743134351457e-05, "epoch": 0.106886880648177, "percentage": 10.69, "elapsed_time": "7:52:33", "remaining_time": "2 days, 17:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 9627, "loss": 1.7535, "learning_rate": 9.720205219488312e-05, "epoch": 0.10699075516775734, "percentage": 10.7, "elapsed_time": "7:53:01", "remaining_time": "2 days, 17:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1031, "total_steps": 9627, "loss": 1.7835, "learning_rate": 9.71966680196013e-05, "epoch": 0.1070946296873377, "percentage": 10.71, "elapsed_time": "7:53:31", "remaining_time": "2 days, 17:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1032, "total_steps": 9627, "loss": 1.7698, "learning_rate": 9.719127881824249e-05, "epoch": 0.10719850420691804, "percentage": 10.72, "elapsed_time": "7:53:58", "remaining_time": "2 days, 17:47:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1033, "total_steps": 9627, "loss": 1.8369, "learning_rate": 9.718588459138059e-05, "epoch": 0.10730237872649839, "percentage": 10.73, "elapsed_time": "7:54:28", "remaining_time": "2 days, 17:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1034, "total_steps": 9627, "loss": 1.8615, "learning_rate": 9.718048533959004e-05, "epoch": 0.10740625324607873, "percentage": 10.74, "elapsed_time": "7:54:55", "remaining_time": "2 days, 17:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1035, "total_steps": 9627, "loss": 1.9681, "learning_rate": 9.717508106344582e-05, "epoch": 0.10751012776565909, "percentage": 10.75, "elapsed_time": "7:55:25", "remaining_time": "2 days, 17:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1036, "total_steps": 9627, "loss": 1.8015, "learning_rate": 9.716967176352345e-05, "epoch": 0.10761400228523943, "percentage": 10.76, "elapsed_time": "7:55:53", "remaining_time": "2 days, 17:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1037, "total_steps": 9627, "loss": 1.9817, "learning_rate": 9.716425744039898e-05, "epoch": 0.10771787680481978, "percentage": 10.77, "elapsed_time": "7:56:21", "remaining_time": "2 days, 17:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1038, "total_steps": 9627, "loss": 1.7871, "learning_rate": 9.715883809464899e-05, "epoch": 0.10782175132440013, "percentage": 10.78, "elapsed_time": "7:56:50", "remaining_time": "2 days, 17:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1039, "total_steps": 9627, "loss": 1.9029, "learning_rate": 9.715341372685059e-05, "epoch": 0.10792562584398047, "percentage": 10.79, "elapsed_time": "7:57:18", "remaining_time": "2 days, 17:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 9627, "loss": 1.6931, "learning_rate": 9.714798433758144e-05, "epoch": 0.10802950036356082, "percentage": 10.8, "elapsed_time": "7:57:48", "remaining_time": "2 days, 17:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1041, "total_steps": 9627, "loss": 1.7422, "learning_rate": 9.714254992741971e-05, "epoch": 0.10813337488314116, "percentage": 10.81, "elapsed_time": "7:58:16", "remaining_time": "2 days, 17:44:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1042, "total_steps": 9627, "loss": 1.7005, "learning_rate": 9.713711049694416e-05, "epoch": 0.10823724940272152, "percentage": 10.82, "elapsed_time": "7:58:45", "remaining_time": "2 days, 17:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1043, "total_steps": 9627, "loss": 1.7248, "learning_rate": 9.713166604673403e-05, "epoch": 0.10834112392230186, "percentage": 10.83, "elapsed_time": "7:59:14", "remaining_time": "2 days, 17:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1044, "total_steps": 9627, "loss": 1.719, "learning_rate": 9.71262165773691e-05, "epoch": 0.10844499844188221, "percentage": 10.84, "elapsed_time": "7:59:42", "remaining_time": "2 days, 17:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1045, "total_steps": 9627, "loss": 1.7452, "learning_rate": 9.712076208942968e-05, "epoch": 0.10854887296146255, "percentage": 10.85, "elapsed_time": "8:00:11", "remaining_time": "2 days, 17:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1046, "total_steps": 9627, "loss": 1.7313, "learning_rate": 9.711530258349668e-05, "epoch": 0.1086527474810429, "percentage": 10.87, "elapsed_time": "8:00:39", "remaining_time": "2 days, 17:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1047, "total_steps": 9627, "loss": 1.7674, "learning_rate": 9.710983806015148e-05, "epoch": 0.10875662200062325, "percentage": 10.88, "elapsed_time": "8:01:07", "remaining_time": "2 days, 17:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1048, "total_steps": 9627, "loss": 1.964, "learning_rate": 9.710436851997598e-05, "epoch": 0.10886049652020359, "percentage": 10.89, "elapsed_time": "8:01:36", "remaining_time": "2 days, 17:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1049, "total_steps": 9627, "loss": 1.8366, "learning_rate": 9.709889396355265e-05, "epoch": 0.10896437103978394, "percentage": 10.9, "elapsed_time": "8:02:05", "remaining_time": "2 days, 17:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 9627, "loss": 1.8713, "learning_rate": 9.709341439146452e-05, "epoch": 0.10906824555936429, "percentage": 10.91, "elapsed_time": "8:02:34", "remaining_time": "2 days, 17:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1051, "total_steps": 9627, "loss": 1.988, "learning_rate": 9.708792980429508e-05, "epoch": 0.10917212007894464, "percentage": 10.92, "elapsed_time": "8:03:02", "remaining_time": "2 days, 17:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1052, "total_steps": 9627, "loss": 1.9337, "learning_rate": 9.708244020262842e-05, "epoch": 0.10927599459852498, "percentage": 10.93, "elapsed_time": "8:03:30", "remaining_time": "2 days, 17:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1053, "total_steps": 9627, "loss": 1.8026, "learning_rate": 9.707694558704914e-05, "epoch": 0.10937986911810534, "percentage": 10.94, "elapsed_time": "8:04:00", "remaining_time": "2 days, 17:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1054, "total_steps": 9627, "loss": 1.6728, "learning_rate": 9.707144595814237e-05, "epoch": 0.10948374363768568, "percentage": 10.95, "elapsed_time": "8:04:28", "remaining_time": "2 days, 17:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1055, "total_steps": 9627, "loss": 1.8825, "learning_rate": 9.706594131649378e-05, "epoch": 0.10958761815726602, "percentage": 10.96, "elapsed_time": "8:04:57", "remaining_time": "2 days, 17:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1056, "total_steps": 9627, "loss": 1.8012, "learning_rate": 9.706043166268957e-05, "epoch": 0.10969149267684637, "percentage": 10.97, "elapsed_time": "8:05:25", "remaining_time": "2 days, 17:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1057, "total_steps": 9627, "loss": 1.6768, "learning_rate": 9.705491699731646e-05, "epoch": 0.10979536719642671, "percentage": 10.98, "elapsed_time": "8:05:54", "remaining_time": "2 days, 17:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1058, "total_steps": 9627, "loss": 1.8888, "learning_rate": 9.704939732096175e-05, "epoch": 0.10989924171600707, "percentage": 10.99, "elapsed_time": "8:06:22", "remaining_time": "2 days, 17:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1059, "total_steps": 9627, "loss": 1.6474, "learning_rate": 9.704387263421322e-05, "epoch": 0.11000311623558741, "percentage": 11.0, "elapsed_time": "8:06:51", "remaining_time": "2 days, 17:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 9627, "loss": 1.9323, "learning_rate": 9.70383429376592e-05, "epoch": 0.11010699075516776, "percentage": 11.01, "elapsed_time": "8:07:20", "remaining_time": "2 days, 17:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1061, "total_steps": 9627, "loss": 1.8642, "learning_rate": 9.703280823188858e-05, "epoch": 0.1102108652747481, "percentage": 11.02, "elapsed_time": "8:07:48", "remaining_time": "2 days, 17:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1062, "total_steps": 9627, "loss": 1.7669, "learning_rate": 9.702726851749074e-05, "epoch": 0.11031473979432845, "percentage": 11.03, "elapsed_time": "8:08:17", "remaining_time": "2 days, 17:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1063, "total_steps": 9627, "loss": 1.6532, "learning_rate": 9.702172379505565e-05, "epoch": 0.1104186143139088, "percentage": 11.04, "elapsed_time": "8:08:46", "remaining_time": "2 days, 17:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1064, "total_steps": 9627, "loss": 1.6235, "learning_rate": 9.701617406517374e-05, "epoch": 0.11052248883348914, "percentage": 11.05, "elapsed_time": "8:09:14", "remaining_time": "2 days, 17:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1065, "total_steps": 9627, "loss": 1.9023, "learning_rate": 9.701061932843605e-05, "epoch": 0.1106263633530695, "percentage": 11.06, "elapsed_time": "8:09:42", "remaining_time": "2 days, 17:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1066, "total_steps": 9627, "loss": 1.6955, "learning_rate": 9.700505958543409e-05, "epoch": 0.11073023787264984, "percentage": 11.07, "elapsed_time": "8:10:11", "remaining_time": "2 days, 17:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1067, "total_steps": 9627, "loss": 1.7417, "learning_rate": 9.699949483675994e-05, "epoch": 0.11083411239223019, "percentage": 11.08, "elapsed_time": "8:10:40", "remaining_time": "2 days, 17:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1068, "total_steps": 9627, "loss": 1.7226, "learning_rate": 9.69939250830062e-05, "epoch": 0.11093798691181053, "percentage": 11.09, "elapsed_time": "8:11:08", "remaining_time": "2 days, 17:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1069, "total_steps": 9627, "loss": 1.7571, "learning_rate": 9.698835032476598e-05, "epoch": 0.11104186143139087, "percentage": 11.1, "elapsed_time": "8:11:37", "remaining_time": "2 days, 17:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 9627, "loss": 1.8685, "learning_rate": 9.6982770562633e-05, "epoch": 0.11114573595097123, "percentage": 11.11, "elapsed_time": "8:12:05", "remaining_time": "2 days, 17:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1071, "total_steps": 9627, "loss": 1.6949, "learning_rate": 9.697718579720144e-05, "epoch": 0.11124961047055157, "percentage": 11.12, "elapsed_time": "8:12:33", "remaining_time": "2 days, 17:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1072, "total_steps": 9627, "loss": 1.9906, "learning_rate": 9.697159602906603e-05, "epoch": 0.11135348499013192, "percentage": 11.14, "elapsed_time": "8:13:02", "remaining_time": "2 days, 17:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1073, "total_steps": 9627, "loss": 1.9341, "learning_rate": 9.696600125882202e-05, "epoch": 0.11145735950971226, "percentage": 11.15, "elapsed_time": "8:13:30", "remaining_time": "2 days, 17:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1074, "total_steps": 9627, "loss": 1.929, "learning_rate": 9.696040148706523e-05, "epoch": 0.11156123402929262, "percentage": 11.16, "elapsed_time": "8:13:59", "remaining_time": "2 days, 17:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1075, "total_steps": 9627, "loss": 1.8981, "learning_rate": 9.695479671439198e-05, "epoch": 0.11166510854887296, "percentage": 11.17, "elapsed_time": "8:14:28", "remaining_time": "2 days, 17:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1076, "total_steps": 9627, "loss": 1.689, "learning_rate": 9.694918694139915e-05, "epoch": 0.11176898306845331, "percentage": 11.18, "elapsed_time": "8:14:56", "remaining_time": "2 days, 17:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1077, "total_steps": 9627, "loss": 1.6753, "learning_rate": 9.694357216868413e-05, "epoch": 0.11187285758803366, "percentage": 11.19, "elapsed_time": "8:15:24", "remaining_time": "2 days, 17:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1078, "total_steps": 9627, "loss": 1.6901, "learning_rate": 9.693795239684484e-05, "epoch": 0.111976732107614, "percentage": 11.2, "elapsed_time": "8:15:53", "remaining_time": "2 days, 17:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1079, "total_steps": 9627, "loss": 1.6372, "learning_rate": 9.693232762647976e-05, "epoch": 0.11208060662719435, "percentage": 11.21, "elapsed_time": "8:16:22", "remaining_time": "2 days, 17:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 9627, "loss": 1.8587, "learning_rate": 9.692669785818786e-05, "epoch": 0.11218448114677469, "percentage": 11.22, "elapsed_time": "8:16:51", "remaining_time": "2 days, 17:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1081, "total_steps": 9627, "loss": 1.9017, "learning_rate": 9.69210630925687e-05, "epoch": 0.11228835566635505, "percentage": 11.23, "elapsed_time": "8:17:18", "remaining_time": "2 days, 17:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1082, "total_steps": 9627, "loss": 1.7744, "learning_rate": 9.69154233302223e-05, "epoch": 0.11239223018593539, "percentage": 11.24, "elapsed_time": "8:17:48", "remaining_time": "2 days, 17:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1083, "total_steps": 9627, "loss": 1.6596, "learning_rate": 9.690977857174927e-05, "epoch": 0.11249610470551574, "percentage": 11.25, "elapsed_time": "8:18:16", "remaining_time": "2 days, 17:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1084, "total_steps": 9627, "loss": 1.8651, "learning_rate": 9.690412881775076e-05, "epoch": 0.11259997922509608, "percentage": 11.26, "elapsed_time": "8:18:44", "remaining_time": "2 days, 17:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1085, "total_steps": 9627, "loss": 1.9878, "learning_rate": 9.689847406882838e-05, "epoch": 0.11270385374467642, "percentage": 11.27, "elapsed_time": "8:19:12", "remaining_time": "2 days, 17:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1086, "total_steps": 9627, "loss": 1.9459, "learning_rate": 9.689281432558432e-05, "epoch": 0.11280772826425678, "percentage": 11.28, "elapsed_time": "8:19:42", "remaining_time": "2 days, 17:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1087, "total_steps": 9627, "loss": 1.7604, "learning_rate": 9.688714958862133e-05, "epoch": 0.11291160278383712, "percentage": 11.29, "elapsed_time": "8:20:10", "remaining_time": "2 days, 17:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1088, "total_steps": 9627, "loss": 1.8102, "learning_rate": 9.688147985854264e-05, "epoch": 0.11301547730341747, "percentage": 11.3, "elapsed_time": "8:20:39", "remaining_time": "2 days, 17:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1089, "total_steps": 9627, "loss": 1.8611, "learning_rate": 9.687580513595202e-05, "epoch": 0.11311935182299782, "percentage": 11.31, "elapsed_time": "8:21:06", "remaining_time": "2 days, 17:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 9627, "loss": 1.962, "learning_rate": 9.687012542145382e-05, "epoch": 0.11322322634257817, "percentage": 11.32, "elapsed_time": "8:21:35", "remaining_time": "2 days, 17:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1091, "total_steps": 9627, "loss": 1.7224, "learning_rate": 9.686444071565285e-05, "epoch": 0.11332710086215851, "percentage": 11.33, "elapsed_time": "8:22:03", "remaining_time": "2 days, 17:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1092, "total_steps": 9627, "loss": 1.715, "learning_rate": 9.68587510191545e-05, "epoch": 0.11343097538173887, "percentage": 11.34, "elapsed_time": "8:22:30", "remaining_time": "2 days, 17:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1093, "total_steps": 9627, "loss": 1.6688, "learning_rate": 9.685305633256469e-05, "epoch": 0.11353484990131921, "percentage": 11.35, "elapsed_time": "8:22:59", "remaining_time": "2 days, 17:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1094, "total_steps": 9627, "loss": 1.851, "learning_rate": 9.684735665648983e-05, "epoch": 0.11363872442089955, "percentage": 11.36, "elapsed_time": "8:23:27", "remaining_time": "2 days, 17:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1095, "total_steps": 9627, "loss": 1.8039, "learning_rate": 9.684165199153692e-05, "epoch": 0.1137425989404799, "percentage": 11.37, "elapsed_time": "8:23:56", "remaining_time": "2 days, 17:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1096, "total_steps": 9627, "loss": 1.8317, "learning_rate": 9.683594233831345e-05, "epoch": 0.11384647346006024, "percentage": 11.38, "elapsed_time": "8:24:24", "remaining_time": "2 days, 17:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1097, "total_steps": 9627, "loss": 1.9756, "learning_rate": 9.683022769742746e-05, "epoch": 0.1139503479796406, "percentage": 11.4, "elapsed_time": "8:24:52", "remaining_time": "2 days, 17:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1098, "total_steps": 9627, "loss": 1.6867, "learning_rate": 9.68245080694875e-05, "epoch": 0.11405422249922094, "percentage": 11.41, "elapsed_time": "8:25:21", "remaining_time": "2 days, 17:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1099, "total_steps": 9627, "loss": 1.9397, "learning_rate": 9.68187834551027e-05, "epoch": 0.1141580970188013, "percentage": 11.42, "elapsed_time": "8:25:48", "remaining_time": "2 days, 17:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 9627, "loss": 1.7001, "learning_rate": 9.681305385488264e-05, "epoch": 0.11426197153838163, "percentage": 11.43, "elapsed_time": "8:26:18", "remaining_time": "2 days, 17:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1101, "total_steps": 9627, "loss": 1.774, "learning_rate": 9.680731926943752e-05, "epoch": 0.11436584605796198, "percentage": 11.44, "elapsed_time": "8:26:45", "remaining_time": "2 days, 17:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1102, "total_steps": 9627, "loss": 1.7585, "learning_rate": 9.680157969937799e-05, "epoch": 0.11446972057754233, "percentage": 11.45, "elapsed_time": "8:27:13", "remaining_time": "2 days, 17:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1103, "total_steps": 9627, "loss": 1.8175, "learning_rate": 9.67958351453153e-05, "epoch": 0.11457359509712267, "percentage": 11.46, "elapsed_time": "8:27:42", "remaining_time": "2 days, 17:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1104, "total_steps": 9627, "loss": 1.7941, "learning_rate": 9.679008560786117e-05, "epoch": 0.11467746961670303, "percentage": 11.47, "elapsed_time": "8:28:10", "remaining_time": "2 days, 17:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1105, "total_steps": 9627, "loss": 1.7144, "learning_rate": 9.678433108762791e-05, "epoch": 0.11478134413628337, "percentage": 11.48, "elapsed_time": "8:28:38", "remaining_time": "2 days, 17:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1106, "total_steps": 9627, "loss": 1.9284, "learning_rate": 9.677857158522833e-05, "epoch": 0.11488521865586372, "percentage": 11.49, "elapsed_time": "8:29:06", "remaining_time": "2 days, 17:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1107, "total_steps": 9627, "loss": 1.5077, "learning_rate": 9.677280710127575e-05, "epoch": 0.11498909317544406, "percentage": 11.5, "elapsed_time": "8:29:35", "remaining_time": "2 days, 17:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1108, "total_steps": 9627, "loss": 2.0279, "learning_rate": 9.676703763638406e-05, "epoch": 0.11509296769502442, "percentage": 11.51, "elapsed_time": "8:30:04", "remaining_time": "2 days, 17:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1109, "total_steps": 9627, "loss": 1.9437, "learning_rate": 9.676126319116766e-05, "epoch": 0.11519684221460476, "percentage": 11.52, "elapsed_time": "8:30:31", "remaining_time": "2 days, 17:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 9627, "loss": 1.8091, "learning_rate": 9.675548376624148e-05, "epoch": 0.1153007167341851, "percentage": 11.53, "elapsed_time": "8:31:00", "remaining_time": "2 days, 17:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1111, "total_steps": 9627, "loss": 1.7403, "learning_rate": 9.674969936222099e-05, "epoch": 0.11540459125376545, "percentage": 11.54, "elapsed_time": "8:31:27", "remaining_time": "2 days, 17:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1112, "total_steps": 9627, "loss": 1.9467, "learning_rate": 9.674390997972218e-05, "epoch": 0.1155084657733458, "percentage": 11.55, "elapsed_time": "8:31:55", "remaining_time": "2 days, 17:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1113, "total_steps": 9627, "loss": 1.8208, "learning_rate": 9.673811561936157e-05, "epoch": 0.11561234029292615, "percentage": 11.56, "elapsed_time": "8:32:25", "remaining_time": "2 days, 17:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1114, "total_steps": 9627, "loss": 1.7336, "learning_rate": 9.673231628175622e-05, "epoch": 0.11571621481250649, "percentage": 11.57, "elapsed_time": "8:32:53", "remaining_time": "2 days, 17:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1115, "total_steps": 9627, "loss": 1.9191, "learning_rate": 9.672651196752371e-05, "epoch": 0.11582008933208685, "percentage": 11.58, "elapsed_time": "8:33:21", "remaining_time": "2 days, 17:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1116, "total_steps": 9627, "loss": 1.7849, "learning_rate": 9.672070267728215e-05, "epoch": 0.11592396385166719, "percentage": 11.59, "elapsed_time": "8:33:49", "remaining_time": "2 days, 17:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1117, "total_steps": 9627, "loss": 2.076, "learning_rate": 9.67148884116502e-05, "epoch": 0.11602783837124753, "percentage": 11.6, "elapsed_time": "8:34:17", "remaining_time": "2 days, 17:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1118, "total_steps": 9627, "loss": 1.7839, "learning_rate": 9.670906917124703e-05, "epoch": 0.11613171289082788, "percentage": 11.61, "elapsed_time": "8:34:45", "remaining_time": "2 days, 17:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1119, "total_steps": 9627, "loss": 1.7778, "learning_rate": 9.670324495669231e-05, "epoch": 0.11623558741040822, "percentage": 11.62, "elapsed_time": "8:35:13", "remaining_time": "2 days, 17:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 9627, "loss": 1.8653, "learning_rate": 9.669741576860634e-05, "epoch": 0.11633946192998858, "percentage": 11.63, "elapsed_time": "8:35:42", "remaining_time": "2 days, 17:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1121, "total_steps": 9627, "loss": 1.9041, "learning_rate": 9.669158160760982e-05, "epoch": 0.11644333644956892, "percentage": 11.64, "elapsed_time": "8:36:10", "remaining_time": "2 days, 17:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1122, "total_steps": 9627, "loss": 1.5888, "learning_rate": 9.668574247432407e-05, "epoch": 0.11654721096914927, "percentage": 11.65, "elapsed_time": "8:36:38", "remaining_time": "2 days, 17:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1123, "total_steps": 9627, "loss": 1.8802, "learning_rate": 9.667989836937092e-05, "epoch": 0.11665108548872961, "percentage": 11.67, "elapsed_time": "8:37:06", "remaining_time": "2 days, 17:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1124, "total_steps": 9627, "loss": 1.8201, "learning_rate": 9.66740492933727e-05, "epoch": 0.11675496000830995, "percentage": 11.68, "elapsed_time": "8:37:34", "remaining_time": "2 days, 17:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1125, "total_steps": 9627, "loss": 1.758, "learning_rate": 9.66681952469523e-05, "epoch": 0.11685883452789031, "percentage": 11.69, "elapsed_time": "8:38:04", "remaining_time": "2 days, 17:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1126, "total_steps": 9627, "loss": 1.8567, "learning_rate": 9.666233623073315e-05, "epoch": 0.11696270904747065, "percentage": 11.7, "elapsed_time": "8:38:31", "remaining_time": "2 days, 17:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1127, "total_steps": 9627, "loss": 1.8514, "learning_rate": 9.665647224533915e-05, "epoch": 0.117066583567051, "percentage": 11.71, "elapsed_time": "8:39:00", "remaining_time": "2 days, 17:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1128, "total_steps": 9627, "loss": 1.9686, "learning_rate": 9.665060329139479e-05, "epoch": 0.11717045808663135, "percentage": 11.72, "elapsed_time": "8:39:28", "remaining_time": "2 days, 17:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1129, "total_steps": 9627, "loss": 1.6642, "learning_rate": 9.66447293695251e-05, "epoch": 0.1172743326062117, "percentage": 11.73, "elapsed_time": "8:39:56", "remaining_time": "2 days, 17:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 9627, "loss": 1.6711, "learning_rate": 9.663885048035555e-05, "epoch": 0.11737820712579204, "percentage": 11.74, "elapsed_time": "8:40:25", "remaining_time": "2 days, 17:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1131, "total_steps": 9627, "loss": 1.7615, "learning_rate": 9.663296662451221e-05, "epoch": 0.1174820816453724, "percentage": 11.75, "elapsed_time": "8:40:52", "remaining_time": "2 days, 17:12:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1132, "total_steps": 9627, "loss": 1.6615, "learning_rate": 9.66270778026217e-05, "epoch": 0.11758595616495274, "percentage": 11.76, "elapsed_time": "8:41:21", "remaining_time": "2 days, 17:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1133, "total_steps": 9627, "loss": 1.8592, "learning_rate": 9.662118401531108e-05, "epoch": 0.11768983068453308, "percentage": 11.77, "elapsed_time": "8:41:49", "remaining_time": "2 days, 17:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1134, "total_steps": 9627, "loss": 1.8253, "learning_rate": 9.661528526320804e-05, "epoch": 0.11779370520411343, "percentage": 11.78, "elapsed_time": "8:42:18", "remaining_time": "2 days, 17:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1135, "total_steps": 9627, "loss": 1.592, "learning_rate": 9.660938154694075e-05, "epoch": 0.11789757972369377, "percentage": 11.79, "elapsed_time": "8:42:46", "remaining_time": "2 days, 17:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1136, "total_steps": 9627, "loss": 1.6502, "learning_rate": 9.660347286713787e-05, "epoch": 0.11800145424327413, "percentage": 11.8, "elapsed_time": "8:43:15", "remaining_time": "2 days, 17:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1137, "total_steps": 9627, "loss": 1.6945, "learning_rate": 9.659755922442866e-05, "epoch": 0.11810532876285447, "percentage": 11.81, "elapsed_time": "8:43:42", "remaining_time": "2 days, 17:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1138, "total_steps": 9627, "loss": 1.7614, "learning_rate": 9.659164061944285e-05, "epoch": 0.11820920328243482, "percentage": 11.82, "elapsed_time": "8:44:10", "remaining_time": "2 days, 17:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1139, "total_steps": 9627, "loss": 1.8105, "learning_rate": 9.658571705281076e-05, "epoch": 0.11831307780201517, "percentage": 11.83, "elapsed_time": "8:44:40", "remaining_time": "2 days, 17:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 9627, "loss": 1.6527, "learning_rate": 9.657978852516319e-05, "epoch": 0.1184169523215955, "percentage": 11.84, "elapsed_time": "8:45:08", "remaining_time": "2 days, 17:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1141, "total_steps": 9627, "loss": 1.8393, "learning_rate": 9.657385503713146e-05, "epoch": 0.11852082684117586, "percentage": 11.85, "elapsed_time": "8:45:37", "remaining_time": "2 days, 17:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1142, "total_steps": 9627, "loss": 1.7833, "learning_rate": 9.656791658934747e-05, "epoch": 0.1186247013607562, "percentage": 11.86, "elapsed_time": "8:46:04", "remaining_time": "2 days, 17:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1143, "total_steps": 9627, "loss": 1.9837, "learning_rate": 9.656197318244359e-05, "epoch": 0.11872857588033656, "percentage": 11.87, "elapsed_time": "8:46:34", "remaining_time": "2 days, 17:08:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1144, "total_steps": 9627, "loss": 1.8836, "learning_rate": 9.655602481705279e-05, "epoch": 0.1188324503999169, "percentage": 11.88, "elapsed_time": "8:47:01", "remaining_time": "2 days, 17:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1145, "total_steps": 9627, "loss": 1.7552, "learning_rate": 9.655007149380849e-05, "epoch": 0.11893632491949725, "percentage": 11.89, "elapsed_time": "8:47:29", "remaining_time": "2 days, 17:07:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1146, "total_steps": 9627, "loss": 1.6319, "learning_rate": 9.654411321334468e-05, "epoch": 0.11904019943907759, "percentage": 11.9, "elapsed_time": "8:47:57", "remaining_time": "2 days, 17:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1147, "total_steps": 9627, "loss": 1.6788, "learning_rate": 9.653814997629587e-05, "epoch": 0.11914407395865795, "percentage": 11.91, "elapsed_time": "8:48:26", "remaining_time": "2 days, 17:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1148, "total_steps": 9627, "loss": 1.8694, "learning_rate": 9.653218178329709e-05, "epoch": 0.11924794847823829, "percentage": 11.92, "elapsed_time": "8:48:54", "remaining_time": "2 days, 17:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1149, "total_steps": 9627, "loss": 1.7641, "learning_rate": 9.652620863498393e-05, "epoch": 0.11935182299781863, "percentage": 11.94, "elapsed_time": "8:49:23", "remaining_time": "2 days, 17:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 9627, "loss": 1.8416, "learning_rate": 9.652023053199247e-05, "epoch": 0.11945569751739898, "percentage": 11.95, "elapsed_time": "8:49:51", "remaining_time": "2 days, 17:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1151, "total_steps": 9627, "loss": 1.9727, "learning_rate": 9.651424747495931e-05, "epoch": 0.11955957203697933, "percentage": 11.96, "elapsed_time": "8:50:18", "remaining_time": "2 days, 17:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1152, "total_steps": 9627, "loss": 1.6429, "learning_rate": 9.650825946452164e-05, "epoch": 0.11966344655655968, "percentage": 11.97, "elapsed_time": "8:50:46", "remaining_time": "2 days, 17:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1153, "total_steps": 9627, "loss": 1.7789, "learning_rate": 9.65022665013171e-05, "epoch": 0.11976732107614002, "percentage": 11.98, "elapsed_time": "8:51:14", "remaining_time": "2 days, 17:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1154, "total_steps": 9627, "loss": 1.8482, "learning_rate": 9.64962685859839e-05, "epoch": 0.11987119559572038, "percentage": 11.99, "elapsed_time": "8:51:43", "remaining_time": "2 days, 17:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1155, "total_steps": 9627, "loss": 1.621, "learning_rate": 9.64902657191608e-05, "epoch": 0.11997507011530072, "percentage": 12.0, "elapsed_time": "8:52:10", "remaining_time": "2 days, 17:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1156, "total_steps": 9627, "loss": 1.869, "learning_rate": 9.648425790148704e-05, "epoch": 0.12007894463488106, "percentage": 12.01, "elapsed_time": "8:52:39", "remaining_time": "2 days, 17:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1157, "total_steps": 9627, "loss": 1.8155, "learning_rate": 9.64782451336024e-05, "epoch": 0.12018281915446141, "percentage": 12.02, "elapsed_time": "8:53:06", "remaining_time": "2 days, 17:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1158, "total_steps": 9627, "loss": 1.6419, "learning_rate": 9.64722274161472e-05, "epoch": 0.12028669367404175, "percentage": 12.03, "elapsed_time": "8:53:34", "remaining_time": "2 days, 17:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1159, "total_steps": 9627, "loss": 1.8969, "learning_rate": 9.646620474976226e-05, "epoch": 0.12039056819362211, "percentage": 12.04, "elapsed_time": "8:54:02", "remaining_time": "2 days, 17:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 9627, "loss": 1.7814, "learning_rate": 9.6460177135089e-05, "epoch": 0.12049444271320245, "percentage": 12.05, "elapsed_time": "8:54:30", "remaining_time": "2 days, 17:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1161, "total_steps": 9627, "loss": 1.8611, "learning_rate": 9.645414457276925e-05, "epoch": 0.1205983172327828, "percentage": 12.06, "elapsed_time": "8:54:58", "remaining_time": "2 days, 17:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1162, "total_steps": 9627, "loss": 1.838, "learning_rate": 9.644810706344547e-05, "epoch": 0.12070219175236314, "percentage": 12.07, "elapsed_time": "8:55:25", "remaining_time": "2 days, 17:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1163, "total_steps": 9627, "loss": 1.7295, "learning_rate": 9.644206460776058e-05, "epoch": 0.1208060662719435, "percentage": 12.08, "elapsed_time": "8:55:53", "remaining_time": "2 days, 17:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1164, "total_steps": 9627, "loss": 1.8078, "learning_rate": 9.643601720635809e-05, "epoch": 0.12090994079152384, "percentage": 12.09, "elapsed_time": "8:56:21", "remaining_time": "2 days, 16:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1165, "total_steps": 9627, "loss": 1.8958, "learning_rate": 9.642996485988198e-05, "epoch": 0.12101381531110418, "percentage": 12.1, "elapsed_time": "8:56:48", "remaining_time": "2 days, 16:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1166, "total_steps": 9627, "loss": 1.7418, "learning_rate": 9.642390756897677e-05, "epoch": 0.12111768983068454, "percentage": 12.11, "elapsed_time": "8:57:17", "remaining_time": "2 days, 16:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1167, "total_steps": 9627, "loss": 1.6745, "learning_rate": 9.641784533428754e-05, "epoch": 0.12122156435026488, "percentage": 12.12, "elapsed_time": "8:57:45", "remaining_time": "2 days, 16:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1168, "total_steps": 9627, "loss": 2.0477, "learning_rate": 9.641177815645984e-05, "epoch": 0.12132543886984523, "percentage": 12.13, "elapsed_time": "8:58:12", "remaining_time": "2 days, 16:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1169, "total_steps": 9627, "loss": 1.8097, "learning_rate": 9.64057060361398e-05, "epoch": 0.12142931338942557, "percentage": 12.14, "elapsed_time": "8:58:39", "remaining_time": "2 days, 16:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 9627, "loss": 1.921, "learning_rate": 9.639962897397404e-05, "epoch": 0.12153318790900593, "percentage": 12.15, "elapsed_time": "8:59:07", "remaining_time": "2 days, 16:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1171, "total_steps": 9627, "loss": 1.9793, "learning_rate": 9.639354697060974e-05, "epoch": 0.12163706242858627, "percentage": 12.16, "elapsed_time": "8:59:35", "remaining_time": "2 days, 16:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1172, "total_steps": 9627, "loss": 1.685, "learning_rate": 9.638746002669455e-05, "epoch": 0.12174093694816661, "percentage": 12.17, "elapsed_time": "9:00:03", "remaining_time": "2 days, 16:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1173, "total_steps": 9627, "loss": 1.6935, "learning_rate": 9.638136814287672e-05, "epoch": 0.12184481146774696, "percentage": 12.18, "elapsed_time": "9:00:31", "remaining_time": "2 days, 16:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1174, "total_steps": 9627, "loss": 1.6975, "learning_rate": 9.637527131980496e-05, "epoch": 0.1219486859873273, "percentage": 12.19, "elapsed_time": "9:00:58", "remaining_time": "2 days, 16:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1175, "total_steps": 9627, "loss": 1.982, "learning_rate": 9.636916955812856e-05, "epoch": 0.12205256050690766, "percentage": 12.21, "elapsed_time": "9:01:25", "remaining_time": "2 days, 16:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1176, "total_steps": 9627, "loss": 1.8531, "learning_rate": 9.636306285849728e-05, "epoch": 0.122156435026488, "percentage": 12.22, "elapsed_time": "9:01:54", "remaining_time": "2 days, 16:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1177, "total_steps": 9627, "loss": 1.9038, "learning_rate": 9.635695122156145e-05, "epoch": 0.12226030954606835, "percentage": 12.23, "elapsed_time": "9:02:21", "remaining_time": "2 days, 16:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1178, "total_steps": 9627, "loss": 2.0153, "learning_rate": 9.635083464797192e-05, "epoch": 0.1223641840656487, "percentage": 12.24, "elapsed_time": "9:02:50", "remaining_time": "2 days, 16:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1179, "total_steps": 9627, "loss": 1.743, "learning_rate": 9.634471313838005e-05, "epoch": 0.12246805858522904, "percentage": 12.25, "elapsed_time": "9:03:16", "remaining_time": "2 days, 16:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 9627, "loss": 1.7878, "learning_rate": 9.633858669343774e-05, "epoch": 0.12257193310480939, "percentage": 12.26, "elapsed_time": "9:03:45", "remaining_time": "2 days, 16:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1181, "total_steps": 9627, "loss": 1.9123, "learning_rate": 9.633245531379739e-05, "epoch": 0.12267580762438973, "percentage": 12.27, "elapsed_time": "9:04:12", "remaining_time": "2 days, 16:51:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1182, "total_steps": 9627, "loss": 1.8383, "learning_rate": 9.632631900011197e-05, "epoch": 0.12277968214397009, "percentage": 12.28, "elapsed_time": "9:04:41", "remaining_time": "2 days, 16:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1183, "total_steps": 9627, "loss": 1.817, "learning_rate": 9.632017775303492e-05, "epoch": 0.12288355666355043, "percentage": 12.29, "elapsed_time": "9:05:09", "remaining_time": "2 days, 16:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 9627, "loss": 1.9845, "learning_rate": 9.631403157322026e-05, "epoch": 0.12298743118313078, "percentage": 12.3, "elapsed_time": "9:05:35", "remaining_time": "2 days, 16:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1185, "total_steps": 9627, "loss": 1.904, "learning_rate": 9.630788046132251e-05, "epoch": 0.12309130570271112, "percentage": 12.31, "elapsed_time": "9:06:03", "remaining_time": "2 days, 16:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1186, "total_steps": 9627, "loss": 1.7073, "learning_rate": 9.63017244179967e-05, "epoch": 0.12319518022229148, "percentage": 12.32, "elapsed_time": "9:06:31", "remaining_time": "2 days, 16:49:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1187, "total_steps": 9627, "loss": 1.7045, "learning_rate": 9.629556344389839e-05, "epoch": 0.12329905474187182, "percentage": 12.33, "elapsed_time": "9:07:00", "remaining_time": "2 days, 16:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1188, "total_steps": 9627, "loss": 1.7442, "learning_rate": 9.628939753968371e-05, "epoch": 0.12340292926145216, "percentage": 12.34, "elapsed_time": "9:07:27", "remaining_time": "2 days, 16:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1189, "total_steps": 9627, "loss": 1.7656, "learning_rate": 9.628322670600926e-05, "epoch": 0.12350680378103251, "percentage": 12.35, "elapsed_time": "9:07:54", "remaining_time": "2 days, 16:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 9627, "loss": 2.0144, "learning_rate": 9.627705094353219e-05, "epoch": 0.12361067830061286, "percentage": 12.36, "elapsed_time": "9:08:23", "remaining_time": "2 days, 16:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1191, "total_steps": 9627, "loss": 1.8333, "learning_rate": 9.627087025291015e-05, "epoch": 0.12371455282019321, "percentage": 12.37, "elapsed_time": "9:08:50", "remaining_time": "2 days, 16:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1192, "total_steps": 9627, "loss": 1.5966, "learning_rate": 9.626468463480138e-05, "epoch": 0.12381842733977355, "percentage": 12.38, "elapsed_time": "9:09:18", "remaining_time": "2 days, 16:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1193, "total_steps": 9627, "loss": 1.7578, "learning_rate": 9.625849408986456e-05, "epoch": 0.1239223018593539, "percentage": 12.39, "elapsed_time": "9:09:46", "remaining_time": "2 days, 16:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1194, "total_steps": 9627, "loss": 1.6883, "learning_rate": 9.625229861875897e-05, "epoch": 0.12402617637893425, "percentage": 12.4, "elapsed_time": "9:10:13", "remaining_time": "2 days, 16:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1195, "total_steps": 9627, "loss": 1.534, "learning_rate": 9.624609822214434e-05, "epoch": 0.12413005089851459, "percentage": 12.41, "elapsed_time": "9:10:41", "remaining_time": "2 days, 16:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1196, "total_steps": 9627, "loss": 1.804, "learning_rate": 9.623989290068099e-05, "epoch": 0.12423392541809494, "percentage": 12.42, "elapsed_time": "9:11:09", "remaining_time": "2 days, 16:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1197, "total_steps": 9627, "loss": 1.8282, "learning_rate": 9.623368265502973e-05, "epoch": 0.12433779993767528, "percentage": 12.43, "elapsed_time": "9:11:36", "remaining_time": "2 days, 16:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1198, "total_steps": 9627, "loss": 1.748, "learning_rate": 9.62274674858519e-05, "epoch": 0.12444167445725564, "percentage": 12.44, "elapsed_time": "9:12:04", "remaining_time": "2 days, 16:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1199, "total_steps": 9627, "loss": 1.9086, "learning_rate": 9.622124739380936e-05, "epoch": 0.12454554897683598, "percentage": 12.45, "elapsed_time": "9:12:32", "remaining_time": "2 days, 16:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 9627, "loss": 1.7812, "learning_rate": 9.621502237956452e-05, "epoch": 0.12464942349641633, "percentage": 12.46, "elapsed_time": "9:13:00", "remaining_time": "2 days, 16:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1201, "total_steps": 9627, "loss": 1.6562, "learning_rate": 9.62087924437803e-05, "epoch": 0.12475329801599667, "percentage": 12.48, "elapsed_time": "9:13:27", "remaining_time": "2 days, 16:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1202, "total_steps": 9627, "loss": 1.743, "learning_rate": 9.620255758712012e-05, "epoch": 0.12485717253557703, "percentage": 12.49, "elapsed_time": "9:13:55", "remaining_time": "2 days, 16:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1203, "total_steps": 9627, "loss": 1.7807, "learning_rate": 9.619631781024797e-05, "epoch": 0.12496104705515737, "percentage": 12.5, "elapsed_time": "9:14:22", "remaining_time": "2 days, 16:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1204, "total_steps": 9627, "loss": 1.8727, "learning_rate": 9.619007311382828e-05, "epoch": 0.12506492157473773, "percentage": 12.51, "elapsed_time": "9:14:51", "remaining_time": "2 days, 16:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1205, "total_steps": 9627, "loss": 1.6474, "learning_rate": 9.618382349852612e-05, "epoch": 0.12516879609431805, "percentage": 12.52, "elapsed_time": "9:15:18", "remaining_time": "2 days, 16:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1206, "total_steps": 9627, "loss": 1.7651, "learning_rate": 9.617756896500701e-05, "epoch": 0.1252726706138984, "percentage": 12.53, "elapsed_time": "9:15:45", "remaining_time": "2 days, 16:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1207, "total_steps": 9627, "loss": 1.6898, "learning_rate": 9.6171309513937e-05, "epoch": 0.12537654513347876, "percentage": 12.54, "elapsed_time": "9:16:14", "remaining_time": "2 days, 16:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1208, "total_steps": 9627, "loss": 1.5825, "learning_rate": 9.616504514598267e-05, "epoch": 0.12548041965305912, "percentage": 12.55, "elapsed_time": "9:16:41", "remaining_time": "2 days, 16:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1209, "total_steps": 9627, "loss": 1.7711, "learning_rate": 9.615877586181114e-05, "epoch": 0.12558429417263944, "percentage": 12.56, "elapsed_time": "9:17:08", "remaining_time": "2 days, 16:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 9627, "loss": 1.8772, "learning_rate": 9.615250166209003e-05, "epoch": 0.1256881686922198, "percentage": 12.57, "elapsed_time": "9:17:37", "remaining_time": "2 days, 16:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1211, "total_steps": 9627, "loss": 1.6718, "learning_rate": 9.614622254748749e-05, "epoch": 0.12579204321180015, "percentage": 12.58, "elapsed_time": "9:18:03", "remaining_time": "2 days, 16:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1212, "total_steps": 9627, "loss": 1.7133, "learning_rate": 9.613993851867221e-05, "epoch": 0.12589591773138048, "percentage": 12.59, "elapsed_time": "9:18:32", "remaining_time": "2 days, 16:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1213, "total_steps": 9627, "loss": 1.8524, "learning_rate": 9.613364957631339e-05, "epoch": 0.12599979225096083, "percentage": 12.6, "elapsed_time": "9:18:59", "remaining_time": "2 days, 16:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1214, "total_steps": 9627, "loss": 1.7747, "learning_rate": 9.612735572108073e-05, "epoch": 0.1261036667705412, "percentage": 12.61, "elapsed_time": "9:19:28", "remaining_time": "2 days, 16:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1215, "total_steps": 9627, "loss": 1.7503, "learning_rate": 9.61210569536445e-05, "epoch": 0.12620754129012154, "percentage": 12.62, "elapsed_time": "9:19:54", "remaining_time": "2 days, 16:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1216, "total_steps": 9627, "loss": 1.8134, "learning_rate": 9.611475327467547e-05, "epoch": 0.12631141580970187, "percentage": 12.63, "elapsed_time": "9:20:22", "remaining_time": "2 days, 16:36:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1217, "total_steps": 9627, "loss": 1.9043, "learning_rate": 9.610844468484492e-05, "epoch": 0.12641529032928223, "percentage": 12.64, "elapsed_time": "9:20:49", "remaining_time": "2 days, 16:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1218, "total_steps": 9627, "loss": 1.6922, "learning_rate": 9.610213118482468e-05, "epoch": 0.12651916484886258, "percentage": 12.65, "elapsed_time": "9:21:18", "remaining_time": "2 days, 16:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1219, "total_steps": 9627, "loss": 1.8249, "learning_rate": 9.609581277528708e-05, "epoch": 0.1266230393684429, "percentage": 12.66, "elapsed_time": "9:21:44", "remaining_time": "2 days, 16:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 9627, "loss": 1.6571, "learning_rate": 9.608948945690496e-05, "epoch": 0.12672691388802326, "percentage": 12.67, "elapsed_time": "9:22:13", "remaining_time": "2 days, 16:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1221, "total_steps": 9627, "loss": 1.8308, "learning_rate": 9.608316123035172e-05, "epoch": 0.12683078840760362, "percentage": 12.68, "elapsed_time": "9:22:40", "remaining_time": "2 days, 16:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1222, "total_steps": 9627, "loss": 1.8263, "learning_rate": 9.60768280963013e-05, "epoch": 0.12693466292718397, "percentage": 12.69, "elapsed_time": "9:23:07", "remaining_time": "2 days, 16:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1223, "total_steps": 9627, "loss": 1.8465, "learning_rate": 9.60704900554281e-05, "epoch": 0.1270385374467643, "percentage": 12.7, "elapsed_time": "9:23:36", "remaining_time": "2 days, 16:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1224, "total_steps": 9627, "loss": 1.9523, "learning_rate": 9.606414710840706e-05, "epoch": 0.12714241196634465, "percentage": 12.71, "elapsed_time": "9:24:03", "remaining_time": "2 days, 16:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1225, "total_steps": 9627, "loss": 1.8436, "learning_rate": 9.605779925591366e-05, "epoch": 0.127246286485925, "percentage": 12.72, "elapsed_time": "9:24:31", "remaining_time": "2 days, 16:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1226, "total_steps": 9627, "loss": 1.8095, "learning_rate": 9.605144649862391e-05, "epoch": 0.12735016100550534, "percentage": 12.74, "elapsed_time": "9:24:59", "remaining_time": "2 days, 16:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1227, "total_steps": 9627, "loss": 1.9452, "learning_rate": 9.604508883721432e-05, "epoch": 0.1274540355250857, "percentage": 12.75, "elapsed_time": "9:25:26", "remaining_time": "2 days, 16:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1228, "total_steps": 9627, "loss": 1.8987, "learning_rate": 9.603872627236194e-05, "epoch": 0.12755791004466605, "percentage": 12.76, "elapsed_time": "9:25:54", "remaining_time": "2 days, 16:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1229, "total_steps": 9627, "loss": 1.6107, "learning_rate": 9.603235880474433e-05, "epoch": 0.1276617845642464, "percentage": 12.77, "elapsed_time": "9:26:21", "remaining_time": "2 days, 16:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 9627, "loss": 1.5594, "learning_rate": 9.602598643503957e-05, "epoch": 0.12776565908382673, "percentage": 12.78, "elapsed_time": "9:26:50", "remaining_time": "2 days, 16:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1231, "total_steps": 9627, "loss": 2.082, "learning_rate": 9.601960916392627e-05, "epoch": 0.12786953360340708, "percentage": 12.79, "elapsed_time": "9:27:17", "remaining_time": "2 days, 16:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1232, "total_steps": 9627, "loss": 1.7435, "learning_rate": 9.601322699208357e-05, "epoch": 0.12797340812298744, "percentage": 12.8, "elapsed_time": "9:27:45", "remaining_time": "2 days, 16:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1233, "total_steps": 9627, "loss": 1.7594, "learning_rate": 9.60068399201911e-05, "epoch": 0.1280772826425678, "percentage": 12.81, "elapsed_time": "9:28:13", "remaining_time": "2 days, 16:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1234, "total_steps": 9627, "loss": 1.8354, "learning_rate": 9.600044794892905e-05, "epoch": 0.12818115716214812, "percentage": 12.82, "elapsed_time": "9:28:40", "remaining_time": "2 days, 16:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1235, "total_steps": 9627, "loss": 1.7715, "learning_rate": 9.599405107897811e-05, "epoch": 0.12828503168172847, "percentage": 12.83, "elapsed_time": "9:29:08", "remaining_time": "2 days, 16:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1236, "total_steps": 9627, "loss": 1.6034, "learning_rate": 9.598764931101949e-05, "epoch": 0.12838890620130883, "percentage": 12.84, "elapsed_time": "9:29:35", "remaining_time": "2 days, 16:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1237, "total_steps": 9627, "loss": 1.6561, "learning_rate": 9.598124264573495e-05, "epoch": 0.12849278072088915, "percentage": 12.85, "elapsed_time": "9:30:04", "remaining_time": "2 days, 16:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1238, "total_steps": 9627, "loss": 1.8149, "learning_rate": 9.597483108380674e-05, "epoch": 0.1285966552404695, "percentage": 12.86, "elapsed_time": "9:30:31", "remaining_time": "2 days, 16:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1239, "total_steps": 9627, "loss": 1.8963, "learning_rate": 9.596841462591761e-05, "epoch": 0.12870052976004986, "percentage": 12.87, "elapsed_time": "9:30:57", "remaining_time": "2 days, 16:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 9627, "loss": 1.7161, "learning_rate": 9.596199327275091e-05, "epoch": 0.12880440427963022, "percentage": 12.88, "elapsed_time": "9:31:26", "remaining_time": "2 days, 16:25:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1241, "total_steps": 9627, "loss": 1.86, "learning_rate": 9.595556702499045e-05, "epoch": 0.12890827879921055, "percentage": 12.89, "elapsed_time": "9:31:54", "remaining_time": "2 days, 16:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1242, "total_steps": 9627, "loss": 1.5897, "learning_rate": 9.594913588332055e-05, "epoch": 0.1290121533187909, "percentage": 12.9, "elapsed_time": "9:32:21", "remaining_time": "2 days, 16:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1243, "total_steps": 9627, "loss": 1.8549, "learning_rate": 9.594269984842612e-05, "epoch": 0.12911602783837126, "percentage": 12.91, "elapsed_time": "9:32:50", "remaining_time": "2 days, 16:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1244, "total_steps": 9627, "loss": 1.8379, "learning_rate": 9.59362589209925e-05, "epoch": 0.12921990235795158, "percentage": 12.92, "elapsed_time": "9:33:16", "remaining_time": "2 days, 16:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1245, "total_steps": 9627, "loss": 1.8592, "learning_rate": 9.592981310170563e-05, "epoch": 0.12932377687753194, "percentage": 12.93, "elapsed_time": "9:33:45", "remaining_time": "2 days, 16:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1246, "total_steps": 9627, "loss": 1.7502, "learning_rate": 9.592336239125193e-05, "epoch": 0.1294276513971123, "percentage": 12.94, "elapsed_time": "9:34:12", "remaining_time": "2 days, 16:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1247, "total_steps": 9627, "loss": 1.8981, "learning_rate": 9.591690679031835e-05, "epoch": 0.12953152591669265, "percentage": 12.95, "elapsed_time": "9:34:40", "remaining_time": "2 days, 16:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1248, "total_steps": 9627, "loss": 1.913, "learning_rate": 9.591044629959236e-05, "epoch": 0.12963540043627297, "percentage": 12.96, "elapsed_time": "9:35:07", "remaining_time": "2 days, 16:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1249, "total_steps": 9627, "loss": 1.6886, "learning_rate": 9.590398091976195e-05, "epoch": 0.12973927495585333, "percentage": 12.97, "elapsed_time": "9:35:35", "remaining_time": "2 days, 16:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 9627, "loss": 1.7328, "learning_rate": 9.589751065151567e-05, "epoch": 0.12984314947543368, "percentage": 12.98, "elapsed_time": "9:36:03", "remaining_time": "2 days, 16:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1251, "total_steps": 9627, "loss": 1.9107, "learning_rate": 9.589103549554248e-05, "epoch": 0.129947023995014, "percentage": 12.99, "elapsed_time": "9:36:30", "remaining_time": "2 days, 16:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1252, "total_steps": 9627, "loss": 1.7693, "learning_rate": 9.5884555452532e-05, "epoch": 0.13005089851459437, "percentage": 13.01, "elapsed_time": "9:36:58", "remaining_time": "2 days, 16:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1253, "total_steps": 9627, "loss": 1.696, "learning_rate": 9.587807052317426e-05, "epoch": 0.13015477303417472, "percentage": 13.02, "elapsed_time": "9:37:25", "remaining_time": "2 days, 16:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1254, "total_steps": 9627, "loss": 1.9454, "learning_rate": 9.587158070815988e-05, "epoch": 0.13025864755375507, "percentage": 13.03, "elapsed_time": "9:37:53", "remaining_time": "2 days, 16:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1255, "total_steps": 9627, "loss": 1.8159, "learning_rate": 9.586508600817997e-05, "epoch": 0.1303625220733354, "percentage": 13.04, "elapsed_time": "9:38:21", "remaining_time": "2 days, 16:18:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1256, "total_steps": 9627, "loss": 1.7915, "learning_rate": 9.585858642392616e-05, "epoch": 0.13046639659291576, "percentage": 13.05, "elapsed_time": "9:38:49", "remaining_time": "2 days, 16:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1257, "total_steps": 9627, "loss": 1.754, "learning_rate": 9.585208195609059e-05, "epoch": 0.1305702711124961, "percentage": 13.06, "elapsed_time": "9:39:17", "remaining_time": "2 days, 16:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1258, "total_steps": 9627, "loss": 1.8592, "learning_rate": 9.584557260536597e-05, "epoch": 0.13067414563207644, "percentage": 13.07, "elapsed_time": "9:39:44", "remaining_time": "2 days, 16:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1259, "total_steps": 9627, "loss": 1.814, "learning_rate": 9.583905837244547e-05, "epoch": 0.1307780201516568, "percentage": 13.08, "elapsed_time": "9:40:12", "remaining_time": "2 days, 16:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 9627, "loss": 1.7968, "learning_rate": 9.583253925802283e-05, "epoch": 0.13088189467123715, "percentage": 13.09, "elapsed_time": "9:40:39", "remaining_time": "2 days, 16:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1261, "total_steps": 9627, "loss": 2.0191, "learning_rate": 9.582601526279225e-05, "epoch": 0.1309857691908175, "percentage": 13.1, "elapsed_time": "9:41:07", "remaining_time": "2 days, 16:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1262, "total_steps": 9627, "loss": 1.7923, "learning_rate": 9.581948638744849e-05, "epoch": 0.13108964371039783, "percentage": 13.11, "elapsed_time": "9:41:34", "remaining_time": "2 days, 16:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1263, "total_steps": 9627, "loss": 1.6561, "learning_rate": 9.581295263268684e-05, "epoch": 0.13119351822997818, "percentage": 13.12, "elapsed_time": "9:42:01", "remaining_time": "2 days, 16:14:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1264, "total_steps": 9627, "loss": 1.8836, "learning_rate": 9.580641399920311e-05, "epoch": 0.13129739274955854, "percentage": 13.13, "elapsed_time": "9:42:30", "remaining_time": "2 days, 16:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1265, "total_steps": 9627, "loss": 1.7498, "learning_rate": 9.579987048769356e-05, "epoch": 0.1314012672691389, "percentage": 13.14, "elapsed_time": "9:42:57", "remaining_time": "2 days, 16:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1266, "total_steps": 9627, "loss": 1.6476, "learning_rate": 9.579332209885508e-05, "epoch": 0.13150514178871922, "percentage": 13.15, "elapsed_time": "9:43:25", "remaining_time": "2 days, 16:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1267, "total_steps": 9627, "loss": 1.7795, "learning_rate": 9.5786768833385e-05, "epoch": 0.13160901630829958, "percentage": 13.16, "elapsed_time": "9:43:52", "remaining_time": "2 days, 16:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1268, "total_steps": 9627, "loss": 1.718, "learning_rate": 9.578021069198118e-05, "epoch": 0.13171289082787993, "percentage": 13.17, "elapsed_time": "9:44:20", "remaining_time": "2 days, 16:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1269, "total_steps": 9627, "loss": 1.7214, "learning_rate": 9.577364767534202e-05, "epoch": 0.13181676534746026, "percentage": 13.18, "elapsed_time": "9:44:48", "remaining_time": "2 days, 16:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 9627, "loss": 1.6402, "learning_rate": 9.576707978416644e-05, "epoch": 0.1319206398670406, "percentage": 13.19, "elapsed_time": "9:45:15", "remaining_time": "2 days, 16:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1271, "total_steps": 9627, "loss": 1.8282, "learning_rate": 9.576050701915385e-05, "epoch": 0.13202451438662097, "percentage": 13.2, "elapsed_time": "9:45:43", "remaining_time": "2 days, 16:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1272, "total_steps": 9627, "loss": 2.0049, "learning_rate": 9.575392938100422e-05, "epoch": 0.13212838890620132, "percentage": 13.21, "elapsed_time": "9:46:11", "remaining_time": "2 days, 16:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1273, "total_steps": 9627, "loss": 1.678, "learning_rate": 9.5747346870418e-05, "epoch": 0.13223226342578165, "percentage": 13.22, "elapsed_time": "9:46:37", "remaining_time": "2 days, 16:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1274, "total_steps": 9627, "loss": 1.7132, "learning_rate": 9.574075948809618e-05, "epoch": 0.132336137945362, "percentage": 13.23, "elapsed_time": "9:47:06", "remaining_time": "2 days, 16:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1275, "total_steps": 9627, "loss": 1.7306, "learning_rate": 9.573416723474026e-05, "epoch": 0.13244001246494236, "percentage": 13.24, "elapsed_time": "9:47:34", "remaining_time": "2 days, 16:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1276, "total_steps": 9627, "loss": 1.8486, "learning_rate": 9.572757011105227e-05, "epoch": 0.13254388698452269, "percentage": 13.25, "elapsed_time": "9:48:01", "remaining_time": "2 days, 16:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1277, "total_steps": 9627, "loss": 1.7497, "learning_rate": 9.572096811773477e-05, "epoch": 0.13264776150410304, "percentage": 13.26, "elapsed_time": "9:48:29", "remaining_time": "2 days, 16:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1278, "total_steps": 9627, "loss": 1.6892, "learning_rate": 9.571436125549078e-05, "epoch": 0.1327516360236834, "percentage": 13.28, "elapsed_time": "9:48:56", "remaining_time": "2 days, 16:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1279, "total_steps": 9627, "loss": 1.77, "learning_rate": 9.57077495250239e-05, "epoch": 0.13285551054326375, "percentage": 13.29, "elapsed_time": "9:49:24", "remaining_time": "2 days, 16:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 9627, "loss": 1.8936, "learning_rate": 9.570113292703826e-05, "epoch": 0.13295938506284408, "percentage": 13.3, "elapsed_time": "9:49:51", "remaining_time": "2 days, 16:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1281, "total_steps": 9627, "loss": 1.7727, "learning_rate": 9.569451146223843e-05, "epoch": 0.13306325958242443, "percentage": 13.31, "elapsed_time": "9:50:18", "remaining_time": "2 days, 16:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1282, "total_steps": 9627, "loss": 1.8763, "learning_rate": 9.568788513132955e-05, "epoch": 0.13316713410200479, "percentage": 13.32, "elapsed_time": "9:50:47", "remaining_time": "2 days, 16:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1283, "total_steps": 9627, "loss": 1.864, "learning_rate": 9.568125393501728e-05, "epoch": 0.1332710086215851, "percentage": 13.33, "elapsed_time": "9:51:14", "remaining_time": "2 days, 16:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1284, "total_steps": 9627, "loss": 1.7884, "learning_rate": 9.567461787400781e-05, "epoch": 0.13337488314116547, "percentage": 13.34, "elapsed_time": "9:51:41", "remaining_time": "2 days, 16:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1285, "total_steps": 9627, "loss": 1.7951, "learning_rate": 9.566797694900779e-05, "epoch": 0.13347875766074582, "percentage": 13.35, "elapsed_time": "9:52:09", "remaining_time": "2 days, 16:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1286, "total_steps": 9627, "loss": 1.602, "learning_rate": 9.566133116072447e-05, "epoch": 0.13358263218032618, "percentage": 13.36, "elapsed_time": "9:52:36", "remaining_time": "2 days, 16:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1287, "total_steps": 9627, "loss": 1.7799, "learning_rate": 9.565468050986556e-05, "epoch": 0.1336865066999065, "percentage": 13.37, "elapsed_time": "9:53:04", "remaining_time": "2 days, 16:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1288, "total_steps": 9627, "loss": 1.7055, "learning_rate": 9.564802499713928e-05, "epoch": 0.13379038121948686, "percentage": 13.38, "elapsed_time": "9:53:31", "remaining_time": "2 days, 16:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1289, "total_steps": 9627, "loss": 1.8803, "learning_rate": 9.564136462325442e-05, "epoch": 0.13389425573906721, "percentage": 13.39, "elapsed_time": "9:53:59", "remaining_time": "2 days, 16:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 9627, "loss": 1.8929, "learning_rate": 9.563469938892022e-05, "epoch": 0.13399813025864754, "percentage": 13.4, "elapsed_time": "9:54:26", "remaining_time": "2 days, 16:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1291, "total_steps": 9627, "loss": 1.6864, "learning_rate": 9.562802929484651e-05, "epoch": 0.1341020047782279, "percentage": 13.41, "elapsed_time": "9:54:54", "remaining_time": "2 days, 16:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1292, "total_steps": 9627, "loss": 1.7724, "learning_rate": 9.56213543417436e-05, "epoch": 0.13420587929780825, "percentage": 13.42, "elapsed_time": "9:55:20", "remaining_time": "2 days, 16:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1293, "total_steps": 9627, "loss": 1.794, "learning_rate": 9.561467453032231e-05, "epoch": 0.1343097538173886, "percentage": 13.43, "elapsed_time": "9:55:47", "remaining_time": "2 days, 16:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1294, "total_steps": 9627, "loss": 1.7469, "learning_rate": 9.560798986129399e-05, "epoch": 0.13441362833696893, "percentage": 13.44, "elapsed_time": "9:56:16", "remaining_time": "2 days, 15:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1295, "total_steps": 9627, "loss": 1.7181, "learning_rate": 9.56013003353705e-05, "epoch": 0.1345175028565493, "percentage": 13.45, "elapsed_time": "9:56:43", "remaining_time": "2 days, 15:59:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1296, "total_steps": 9627, "loss": 1.6823, "learning_rate": 9.559460595326424e-05, "epoch": 0.13462137737612964, "percentage": 13.46, "elapsed_time": "9:57:10", "remaining_time": "2 days, 15:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1297, "total_steps": 9627, "loss": 1.8669, "learning_rate": 9.558790671568809e-05, "epoch": 0.13472525189570997, "percentage": 13.47, "elapsed_time": "9:57:38", "remaining_time": "2 days, 15:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1298, "total_steps": 9627, "loss": 1.6597, "learning_rate": 9.558120262335546e-05, "epoch": 0.13482912641529032, "percentage": 13.48, "elapsed_time": "9:58:06", "remaining_time": "2 days, 15:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1299, "total_steps": 9627, "loss": 1.8582, "learning_rate": 9.557449367698032e-05, "epoch": 0.13493300093487068, "percentage": 13.49, "elapsed_time": "9:58:33", "remaining_time": "2 days, 15:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 9627, "loss": 1.8483, "learning_rate": 9.55677798772771e-05, "epoch": 0.13503687545445103, "percentage": 13.5, "elapsed_time": "9:59:01", "remaining_time": "2 days, 15:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1301, "total_steps": 9627, "loss": 1.6194, "learning_rate": 9.556106122496076e-05, "epoch": 0.13514074997403136, "percentage": 13.51, "elapsed_time": "9:59:27", "remaining_time": "2 days, 15:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1302, "total_steps": 9627, "loss": 1.8113, "learning_rate": 9.555433772074678e-05, "epoch": 0.13524462449361171, "percentage": 13.52, "elapsed_time": "9:59:56", "remaining_time": "2 days, 15:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1303, "total_steps": 9627, "loss": 1.9416, "learning_rate": 9.554760936535116e-05, "epoch": 0.13534849901319207, "percentage": 13.53, "elapsed_time": "10:00:23", "remaining_time": "2 days, 15:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1304, "total_steps": 9627, "loss": 1.6847, "learning_rate": 9.554087615949046e-05, "epoch": 0.13545237353277242, "percentage": 13.55, "elapsed_time": "10:00:51", "remaining_time": "2 days, 15:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1305, "total_steps": 9627, "loss": 1.8235, "learning_rate": 9.553413810388165e-05, "epoch": 0.13555624805235275, "percentage": 13.56, "elapsed_time": "10:01:18", "remaining_time": "2 days, 15:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1306, "total_steps": 9627, "loss": 1.6378, "learning_rate": 9.552739519924235e-05, "epoch": 0.1356601225719331, "percentage": 13.57, "elapsed_time": "10:01:46", "remaining_time": "2 days, 15:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1307, "total_steps": 9627, "loss": 1.8144, "learning_rate": 9.552064744629054e-05, "epoch": 0.13576399709151346, "percentage": 13.58, "elapsed_time": "10:02:12", "remaining_time": "2 days, 15:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1308, "total_steps": 9627, "loss": 1.6885, "learning_rate": 9.551389484574489e-05, "epoch": 0.1358678716110938, "percentage": 13.59, "elapsed_time": "10:02:39", "remaining_time": "2 days, 15:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1309, "total_steps": 9627, "loss": 2.0096, "learning_rate": 9.550713739832444e-05, "epoch": 0.13597174613067414, "percentage": 13.6, "elapsed_time": "10:03:08", "remaining_time": "2 days, 15:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 9627, "loss": 1.7002, "learning_rate": 9.550037510474883e-05, "epoch": 0.1360756206502545, "percentage": 13.61, "elapsed_time": "10:03:34", "remaining_time": "2 days, 15:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1311, "total_steps": 9627, "loss": 1.7883, "learning_rate": 9.549360796573821e-05, "epoch": 0.13617949516983485, "percentage": 13.62, "elapsed_time": "10:04:03", "remaining_time": "2 days, 15:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1312, "total_steps": 9627, "loss": 1.7193, "learning_rate": 9.548683598201317e-05, "epoch": 0.13628336968941518, "percentage": 13.63, "elapsed_time": "10:04:30", "remaining_time": "2 days, 15:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1313, "total_steps": 9627, "loss": 1.8664, "learning_rate": 9.548005915429495e-05, "epoch": 0.13638724420899553, "percentage": 13.64, "elapsed_time": "10:04:58", "remaining_time": "2 days, 15:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1314, "total_steps": 9627, "loss": 1.7827, "learning_rate": 9.547327748330514e-05, "epoch": 0.1364911187285759, "percentage": 13.65, "elapsed_time": "10:05:25", "remaining_time": "2 days, 15:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1315, "total_steps": 9627, "loss": 1.7287, "learning_rate": 9.5466490969766e-05, "epoch": 0.13659499324815622, "percentage": 13.66, "elapsed_time": "10:05:52", "remaining_time": "2 days, 15:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1316, "total_steps": 9627, "loss": 1.7565, "learning_rate": 9.545969961440025e-05, "epoch": 0.13669886776773657, "percentage": 13.67, "elapsed_time": "10:06:19", "remaining_time": "2 days, 15:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1317, "total_steps": 9627, "loss": 1.8727, "learning_rate": 9.545290341793107e-05, "epoch": 0.13680274228731693, "percentage": 13.68, "elapsed_time": "10:06:48", "remaining_time": "2 days, 15:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1318, "total_steps": 9627, "loss": 1.8201, "learning_rate": 9.544610238108223e-05, "epoch": 0.13690661680689728, "percentage": 13.69, "elapsed_time": "10:07:14", "remaining_time": "2 days, 15:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1319, "total_steps": 9627, "loss": 1.8134, "learning_rate": 9.543929650457796e-05, "epoch": 0.1370104913264776, "percentage": 13.7, "elapsed_time": "10:07:42", "remaining_time": "2 days, 15:47:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 9627, "loss": 1.6867, "learning_rate": 9.543248578914307e-05, "epoch": 0.13711436584605796, "percentage": 13.71, "elapsed_time": "10:08:09", "remaining_time": "2 days, 15:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1321, "total_steps": 9627, "loss": 1.9418, "learning_rate": 9.542567023550283e-05, "epoch": 0.13721824036563832, "percentage": 13.72, "elapsed_time": "10:08:36", "remaining_time": "2 days, 15:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1322, "total_steps": 9627, "loss": 1.6986, "learning_rate": 9.541884984438304e-05, "epoch": 0.13732211488521864, "percentage": 13.73, "elapsed_time": "10:09:03", "remaining_time": "2 days, 15:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1323, "total_steps": 9627, "loss": 1.6953, "learning_rate": 9.541202461651002e-05, "epoch": 0.137425989404799, "percentage": 13.74, "elapsed_time": "10:09:32", "remaining_time": "2 days, 15:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1324, "total_steps": 9627, "loss": 1.6347, "learning_rate": 9.54051945526106e-05, "epoch": 0.13752986392437935, "percentage": 13.75, "elapsed_time": "10:09:59", "remaining_time": "2 days, 15:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1325, "total_steps": 9627, "loss": 2.0321, "learning_rate": 9.539835965341215e-05, "epoch": 0.1376337384439597, "percentage": 13.76, "elapsed_time": "10:10:27", "remaining_time": "2 days, 15:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1326, "total_steps": 9627, "loss": 1.7978, "learning_rate": 9.539151991964253e-05, "epoch": 0.13773761296354003, "percentage": 13.77, "elapsed_time": "10:10:54", "remaining_time": "2 days, 15:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1327, "total_steps": 9627, "loss": 2.0113, "learning_rate": 9.538467535203007e-05, "epoch": 0.1378414874831204, "percentage": 13.78, "elapsed_time": "10:11:22", "remaining_time": "2 days, 15:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1328, "total_steps": 9627, "loss": 1.7936, "learning_rate": 9.537782595130371e-05, "epoch": 0.13794536200270074, "percentage": 13.79, "elapsed_time": "10:11:48", "remaining_time": "2 days, 15:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1329, "total_steps": 9627, "loss": 1.8352, "learning_rate": 9.537097171819287e-05, "epoch": 0.13804923652228107, "percentage": 13.8, "elapsed_time": "10:12:17", "remaining_time": "2 days, 15:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 9627, "loss": 1.9648, "learning_rate": 9.536411265342742e-05, "epoch": 0.13815311104186143, "percentage": 13.82, "elapsed_time": "10:12:44", "remaining_time": "2 days, 15:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1331, "total_steps": 9627, "loss": 1.6804, "learning_rate": 9.535724875773784e-05, "epoch": 0.13825698556144178, "percentage": 13.83, "elapsed_time": "10:13:11", "remaining_time": "2 days, 15:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1332, "total_steps": 9627, "loss": 1.697, "learning_rate": 9.535038003185507e-05, "epoch": 0.13836086008102214, "percentage": 13.84, "elapsed_time": "10:13:38", "remaining_time": "2 days, 15:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1333, "total_steps": 9627, "loss": 1.8382, "learning_rate": 9.534350647651056e-05, "epoch": 0.13846473460060246, "percentage": 13.85, "elapsed_time": "10:14:06", "remaining_time": "2 days, 15:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1334, "total_steps": 9627, "loss": 1.8386, "learning_rate": 9.533662809243632e-05, "epoch": 0.13856860912018282, "percentage": 13.86, "elapsed_time": "10:14:33", "remaining_time": "2 days, 15:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1335, "total_steps": 9627, "loss": 1.701, "learning_rate": 9.532974488036481e-05, "epoch": 0.13867248363976317, "percentage": 13.87, "elapsed_time": "10:14:59", "remaining_time": "2 days, 15:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1336, "total_steps": 9627, "loss": 1.9953, "learning_rate": 9.532285684102907e-05, "epoch": 0.1387763581593435, "percentage": 13.88, "elapsed_time": "10:15:27", "remaining_time": "2 days, 15:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1337, "total_steps": 9627, "loss": 1.7335, "learning_rate": 9.53159639751626e-05, "epoch": 0.13888023267892385, "percentage": 13.89, "elapsed_time": "10:15:54", "remaining_time": "2 days, 15:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1338, "total_steps": 9627, "loss": 1.929, "learning_rate": 9.530906628349945e-05, "epoch": 0.1389841071985042, "percentage": 13.9, "elapsed_time": "10:16:21", "remaining_time": "2 days, 15:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1339, "total_steps": 9627, "loss": 1.7699, "learning_rate": 9.530216376677417e-05, "epoch": 0.13908798171808456, "percentage": 13.91, "elapsed_time": "10:16:49", "remaining_time": "2 days, 15:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 9627, "loss": 1.8501, "learning_rate": 9.529525642572182e-05, "epoch": 0.1391918562376649, "percentage": 13.92, "elapsed_time": "10:17:15", "remaining_time": "2 days, 15:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1341, "total_steps": 9627, "loss": 1.9139, "learning_rate": 9.528834426107795e-05, "epoch": 0.13929573075724525, "percentage": 13.93, "elapsed_time": "10:17:42", "remaining_time": "2 days, 15:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1342, "total_steps": 9627, "loss": 1.7613, "learning_rate": 9.52814272735787e-05, "epoch": 0.1393996052768256, "percentage": 13.94, "elapsed_time": "10:18:11", "remaining_time": "2 days, 15:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1343, "total_steps": 9627, "loss": 1.7897, "learning_rate": 9.527450546396067e-05, "epoch": 0.13950347979640595, "percentage": 13.95, "elapsed_time": "10:18:37", "remaining_time": "2 days, 15:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1344, "total_steps": 9627, "loss": 1.782, "learning_rate": 9.526757883296094e-05, "epoch": 0.13960735431598628, "percentage": 13.96, "elapsed_time": "10:19:06", "remaining_time": "2 days, 15:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1345, "total_steps": 9627, "loss": 1.7047, "learning_rate": 9.526064738131717e-05, "epoch": 0.13971122883556664, "percentage": 13.97, "elapsed_time": "10:19:32", "remaining_time": "2 days, 15:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1346, "total_steps": 9627, "loss": 1.8108, "learning_rate": 9.52537111097675e-05, "epoch": 0.139815103355147, "percentage": 13.98, "elapsed_time": "10:20:00", "remaining_time": "2 days, 15:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1347, "total_steps": 9627, "loss": 1.7674, "learning_rate": 9.524677001905059e-05, "epoch": 0.13991897787472732, "percentage": 13.99, "elapsed_time": "10:20:27", "remaining_time": "2 days, 15:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1348, "total_steps": 9627, "loss": 1.7181, "learning_rate": 9.52398241099056e-05, "epoch": 0.14002285239430767, "percentage": 14.0, "elapsed_time": "10:20:55", "remaining_time": "2 days, 15:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1349, "total_steps": 9627, "loss": 1.8431, "learning_rate": 9.523287338307224e-05, "epoch": 0.14012672691388803, "percentage": 14.01, "elapsed_time": "10:21:21", "remaining_time": "2 days, 15:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 9627, "loss": 1.6761, "learning_rate": 9.522591783929069e-05, "epoch": 0.14023060143346838, "percentage": 14.02, "elapsed_time": "10:21:49", "remaining_time": "2 days, 15:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1351, "total_steps": 9627, "loss": 1.7923, "learning_rate": 9.521895747930168e-05, "epoch": 0.1403344759530487, "percentage": 14.03, "elapsed_time": "10:22:16", "remaining_time": "2 days, 15:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1352, "total_steps": 9627, "loss": 1.9424, "learning_rate": 9.521199230384641e-05, "epoch": 0.14043835047262906, "percentage": 14.04, "elapsed_time": "10:22:43", "remaining_time": "2 days, 15:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1353, "total_steps": 9627, "loss": 1.7709, "learning_rate": 9.520502231366661e-05, "epoch": 0.14054222499220942, "percentage": 14.05, "elapsed_time": "10:23:11", "remaining_time": "2 days, 15:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1354, "total_steps": 9627, "loss": 1.8535, "learning_rate": 9.519804750950457e-05, "epoch": 0.14064609951178975, "percentage": 14.06, "elapsed_time": "10:23:38", "remaining_time": "2 days, 15:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1355, "total_steps": 9627, "loss": 1.6418, "learning_rate": 9.519106789210301e-05, "epoch": 0.1407499740313701, "percentage": 14.07, "elapsed_time": "10:24:04", "remaining_time": "2 days, 15:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1356, "total_steps": 9627, "loss": 1.7506, "learning_rate": 9.518408346220525e-05, "epoch": 0.14085384855095046, "percentage": 14.09, "elapsed_time": "10:24:33", "remaining_time": "2 days, 15:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1357, "total_steps": 9627, "loss": 1.756, "learning_rate": 9.517709422055502e-05, "epoch": 0.1409577230705308, "percentage": 14.1, "elapsed_time": "10:24:59", "remaining_time": "2 days, 15:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1358, "total_steps": 9627, "loss": 1.7849, "learning_rate": 9.517010016789667e-05, "epoch": 0.14106159759011114, "percentage": 14.11, "elapsed_time": "10:25:27", "remaining_time": "2 days, 15:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1359, "total_steps": 9627, "loss": 2.191, "learning_rate": 9.516310130497498e-05, "epoch": 0.1411654721096915, "percentage": 14.12, "elapsed_time": "10:25:53", "remaining_time": "2 days, 15:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 9627, "loss": 1.6468, "learning_rate": 9.51560976325353e-05, "epoch": 0.14126934662927185, "percentage": 14.13, "elapsed_time": "10:26:21", "remaining_time": "2 days, 15:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1361, "total_steps": 9627, "loss": 1.5898, "learning_rate": 9.514908915132346e-05, "epoch": 0.14137322114885217, "percentage": 14.14, "elapsed_time": "10:26:49", "remaining_time": "2 days, 15:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1362, "total_steps": 9627, "loss": 1.5243, "learning_rate": 9.514207586208578e-05, "epoch": 0.14147709566843253, "percentage": 14.15, "elapsed_time": "10:27:16", "remaining_time": "2 days, 15:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1363, "total_steps": 9627, "loss": 1.8003, "learning_rate": 9.513505776556915e-05, "epoch": 0.14158097018801288, "percentage": 14.16, "elapsed_time": "10:27:43", "remaining_time": "2 days, 15:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1364, "total_steps": 9627, "loss": 1.7633, "learning_rate": 9.512803486252093e-05, "epoch": 0.14168484470759324, "percentage": 14.17, "elapsed_time": "10:28:10", "remaining_time": "2 days, 15:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1365, "total_steps": 9627, "loss": 1.8179, "learning_rate": 9.512100715368902e-05, "epoch": 0.14178871922717357, "percentage": 14.18, "elapsed_time": "10:28:37", "remaining_time": "2 days, 15:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1366, "total_steps": 9627, "loss": 1.8105, "learning_rate": 9.511397463982181e-05, "epoch": 0.14189259374675392, "percentage": 14.19, "elapsed_time": "10:29:05", "remaining_time": "2 days, 15:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1367, "total_steps": 9627, "loss": 1.9222, "learning_rate": 9.510693732166819e-05, "epoch": 0.14199646826633427, "percentage": 14.2, "elapsed_time": "10:29:32", "remaining_time": "2 days, 15:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1368, "total_steps": 9627, "loss": 1.6662, "learning_rate": 9.50998951999776e-05, "epoch": 0.1421003427859146, "percentage": 14.21, "elapsed_time": "10:30:00", "remaining_time": "2 days, 15:23:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1369, "total_steps": 9627, "loss": 1.6714, "learning_rate": 9.509284827549996e-05, "epoch": 0.14220421730549496, "percentage": 14.22, "elapsed_time": "10:30:26", "remaining_time": "2 days, 15:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 9627, "loss": 1.8606, "learning_rate": 9.508579654898571e-05, "epoch": 0.1423080918250753, "percentage": 14.23, "elapsed_time": "10:30:53", "remaining_time": "2 days, 15:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1371, "total_steps": 9627, "loss": 1.8999, "learning_rate": 9.507874002118582e-05, "epoch": 0.14241196634465567, "percentage": 14.24, "elapsed_time": "10:31:20", "remaining_time": "2 days, 15:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1372, "total_steps": 9627, "loss": 1.9342, "learning_rate": 9.507167869285174e-05, "epoch": 0.142515840864236, "percentage": 14.25, "elapsed_time": "10:31:48", "remaining_time": "2 days, 15:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1373, "total_steps": 9627, "loss": 1.8062, "learning_rate": 9.506461256473545e-05, "epoch": 0.14261971538381635, "percentage": 14.26, "elapsed_time": "10:32:15", "remaining_time": "2 days, 15:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1374, "total_steps": 9627, "loss": 1.8751, "learning_rate": 9.505754163758946e-05, "epoch": 0.1427235899033967, "percentage": 14.27, "elapsed_time": "10:32:43", "remaining_time": "2 days, 15:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1375, "total_steps": 9627, "loss": 1.6707, "learning_rate": 9.505046591216674e-05, "epoch": 0.14282746442297706, "percentage": 14.28, "elapsed_time": "10:33:09", "remaining_time": "2 days, 15:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1376, "total_steps": 9627, "loss": 1.8434, "learning_rate": 9.504338538922078e-05, "epoch": 0.14293133894255738, "percentage": 14.29, "elapsed_time": "10:33:38", "remaining_time": "2 days, 15:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1377, "total_steps": 9627, "loss": 1.9281, "learning_rate": 9.503630006950566e-05, "epoch": 0.14303521346213774, "percentage": 14.3, "elapsed_time": "10:34:04", "remaining_time": "2 days, 15:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1378, "total_steps": 9627, "loss": 1.6748, "learning_rate": 9.502920995377587e-05, "epoch": 0.1431390879817181, "percentage": 14.31, "elapsed_time": "10:34:31", "remaining_time": "2 days, 15:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1379, "total_steps": 9627, "loss": 1.767, "learning_rate": 9.502211504278644e-05, "epoch": 0.14324296250129842, "percentage": 14.32, "elapsed_time": "10:34:58", "remaining_time": "2 days, 15:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 9627, "loss": 1.5963, "learning_rate": 9.501501533729297e-05, "epoch": 0.14334683702087878, "percentage": 14.33, "elapsed_time": "10:35:25", "remaining_time": "2 days, 15:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1381, "total_steps": 9627, "loss": 1.7736, "learning_rate": 9.50079108380515e-05, "epoch": 0.14345071154045913, "percentage": 14.35, "elapsed_time": "10:35:53", "remaining_time": "2 days, 15:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1382, "total_steps": 9627, "loss": 1.8277, "learning_rate": 9.500080154581859e-05, "epoch": 0.14355458606003949, "percentage": 14.36, "elapsed_time": "10:36:20", "remaining_time": "2 days, 15:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1383, "total_steps": 9627, "loss": 1.7244, "learning_rate": 9.499368746135133e-05, "epoch": 0.1436584605796198, "percentage": 14.37, "elapsed_time": "10:36:47", "remaining_time": "2 days, 15:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1384, "total_steps": 9627, "loss": 1.8232, "learning_rate": 9.498656858540731e-05, "epoch": 0.14376233509920017, "percentage": 14.38, "elapsed_time": "10:37:14", "remaining_time": "2 days, 15:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1385, "total_steps": 9627, "loss": 1.7515, "learning_rate": 9.497944491874467e-05, "epoch": 0.14386620961878052, "percentage": 14.39, "elapsed_time": "10:37:40", "remaining_time": "2 days, 15:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1386, "total_steps": 9627, "loss": 1.8021, "learning_rate": 9.4972316462122e-05, "epoch": 0.14397008413836085, "percentage": 14.4, "elapsed_time": "10:38:07", "remaining_time": "2 days, 15:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1387, "total_steps": 9627, "loss": 1.8813, "learning_rate": 9.49651832162984e-05, "epoch": 0.1440739586579412, "percentage": 14.41, "elapsed_time": "10:38:34", "remaining_time": "2 days, 15:13:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1388, "total_steps": 9627, "loss": 1.7155, "learning_rate": 9.495804518203355e-05, "epoch": 0.14417783317752156, "percentage": 14.42, "elapsed_time": "10:39:01", "remaining_time": "2 days, 15:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1389, "total_steps": 9627, "loss": 1.8771, "learning_rate": 9.495090236008756e-05, "epoch": 0.1442817076971019, "percentage": 14.43, "elapsed_time": "10:39:28", "remaining_time": "2 days, 15:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 9627, "loss": 1.894, "learning_rate": 9.49437547512211e-05, "epoch": 0.14438558221668224, "percentage": 14.44, "elapsed_time": "10:39:56", "remaining_time": "2 days, 15:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1391, "total_steps": 9627, "loss": 1.7673, "learning_rate": 9.493660235619535e-05, "epoch": 0.1444894567362626, "percentage": 14.45, "elapsed_time": "10:40:22", "remaining_time": "2 days, 15:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1392, "total_steps": 9627, "loss": 2.0935, "learning_rate": 9.492944517577196e-05, "epoch": 0.14459333125584295, "percentage": 14.46, "elapsed_time": "10:40:48", "remaining_time": "2 days, 15:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1393, "total_steps": 9627, "loss": 1.6482, "learning_rate": 9.492228321071311e-05, "epoch": 0.14469720577542328, "percentage": 14.47, "elapsed_time": "10:41:17", "remaining_time": "2 days, 15:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1394, "total_steps": 9627, "loss": 1.6859, "learning_rate": 9.491511646178151e-05, "epoch": 0.14480108029500363, "percentage": 14.48, "elapsed_time": "10:41:43", "remaining_time": "2 days, 15:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1395, "total_steps": 9627, "loss": 1.6268, "learning_rate": 9.490794492974038e-05, "epoch": 0.14490495481458399, "percentage": 14.49, "elapsed_time": "10:42:11", "remaining_time": "2 days, 15:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1396, "total_steps": 9627, "loss": 1.8217, "learning_rate": 9.490076861535339e-05, "epoch": 0.14500882933416434, "percentage": 14.5, "elapsed_time": "10:42:37", "remaining_time": "2 days, 15:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1397, "total_steps": 9627, "loss": 1.7979, "learning_rate": 9.489358751938477e-05, "epoch": 0.14511270385374467, "percentage": 14.51, "elapsed_time": "10:43:06", "remaining_time": "2 days, 15:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1398, "total_steps": 9627, "loss": 1.7041, "learning_rate": 9.488640164259929e-05, "epoch": 0.14521657837332502, "percentage": 14.52, "elapsed_time": "10:43:32", "remaining_time": "2 days, 15:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1399, "total_steps": 9627, "loss": 1.8746, "learning_rate": 9.487921098576216e-05, "epoch": 0.14532045289290538, "percentage": 14.53, "elapsed_time": "10:44:00", "remaining_time": "2 days, 15:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 9627, "loss": 1.9115, "learning_rate": 9.487201554963911e-05, "epoch": 0.1454243274124857, "percentage": 14.54, "elapsed_time": "10:44:26", "remaining_time": "2 days, 15:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1401, "total_steps": 9627, "loss": 1.6462, "learning_rate": 9.486481533499642e-05, "epoch": 0.14552820193206606, "percentage": 14.55, "elapsed_time": "10:44:54", "remaining_time": "2 days, 15:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1402, "total_steps": 9627, "loss": 1.5963, "learning_rate": 9.485761034260087e-05, "epoch": 0.14563207645164641, "percentage": 14.56, "elapsed_time": "10:45:20", "remaining_time": "2 days, 15:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1403, "total_steps": 9627, "loss": 1.7931, "learning_rate": 9.485040057321972e-05, "epoch": 0.14573595097122677, "percentage": 14.57, "elapsed_time": "10:45:48", "remaining_time": "2 days, 15:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1404, "total_steps": 9627, "loss": 2.0324, "learning_rate": 9.484318602762077e-05, "epoch": 0.1458398254908071, "percentage": 14.58, "elapsed_time": "10:46:14", "remaining_time": "2 days, 15:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1405, "total_steps": 9627, "loss": 1.5949, "learning_rate": 9.483596670657228e-05, "epoch": 0.14594370001038745, "percentage": 14.59, "elapsed_time": "10:46:42", "remaining_time": "2 days, 15:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1406, "total_steps": 9627, "loss": 1.6486, "learning_rate": 9.482874261084307e-05, "epoch": 0.1460475745299678, "percentage": 14.6, "elapsed_time": "10:47:09", "remaining_time": "2 days, 15:03:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1407, "total_steps": 9627, "loss": 1.7674, "learning_rate": 9.482151374120244e-05, "epoch": 0.14615144904954813, "percentage": 14.62, "elapsed_time": "10:47:36", "remaining_time": "2 days, 15:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1408, "total_steps": 9627, "loss": 1.6668, "learning_rate": 9.481428009842024e-05, "epoch": 0.1462553235691285, "percentage": 14.63, "elapsed_time": "10:48:02", "remaining_time": "2 days, 15:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1409, "total_steps": 9627, "loss": 1.7319, "learning_rate": 9.480704168326676e-05, "epoch": 0.14635919808870884, "percentage": 14.64, "elapsed_time": "10:48:29", "remaining_time": "2 days, 15:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 9627, "loss": 1.7501, "learning_rate": 9.479979849651286e-05, "epoch": 0.1464630726082892, "percentage": 14.65, "elapsed_time": "10:48:57", "remaining_time": "2 days, 15:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1411, "total_steps": 9627, "loss": 1.7739, "learning_rate": 9.479255053892986e-05, "epoch": 0.14656694712786952, "percentage": 14.66, "elapsed_time": "10:49:24", "remaining_time": "2 days, 15:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1412, "total_steps": 9627, "loss": 1.8712, "learning_rate": 9.478529781128962e-05, "epoch": 0.14667082164744988, "percentage": 14.67, "elapsed_time": "10:49:50", "remaining_time": "2 days, 15:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1413, "total_steps": 9627, "loss": 1.7262, "learning_rate": 9.477804031436451e-05, "epoch": 0.14677469616703023, "percentage": 14.68, "elapsed_time": "10:50:18", "remaining_time": "2 days, 15:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1414, "total_steps": 9627, "loss": 1.68, "learning_rate": 9.47707780489274e-05, "epoch": 0.1468785706866106, "percentage": 14.69, "elapsed_time": "10:50:45", "remaining_time": "2 days, 14:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1415, "total_steps": 9627, "loss": 1.7192, "learning_rate": 9.476351101575163e-05, "epoch": 0.14698244520619091, "percentage": 14.7, "elapsed_time": "10:51:12", "remaining_time": "2 days, 14:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1416, "total_steps": 9627, "loss": 1.8355, "learning_rate": 9.475623921561112e-05, "epoch": 0.14708631972577127, "percentage": 14.71, "elapsed_time": "10:51:38", "remaining_time": "2 days, 14:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1417, "total_steps": 9627, "loss": 1.5081, "learning_rate": 9.474896264928024e-05, "epoch": 0.14719019424535162, "percentage": 14.72, "elapsed_time": "10:52:06", "remaining_time": "2 days, 14:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1418, "total_steps": 9627, "loss": 1.7609, "learning_rate": 9.47416813175339e-05, "epoch": 0.14729406876493195, "percentage": 14.73, "elapsed_time": "10:52:33", "remaining_time": "2 days, 14:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1419, "total_steps": 9627, "loss": 1.9254, "learning_rate": 9.47343952211475e-05, "epoch": 0.1473979432845123, "percentage": 14.74, "elapsed_time": "10:52:59", "remaining_time": "2 days, 14:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 9627, "loss": 1.8976, "learning_rate": 9.472710436089693e-05, "epoch": 0.14750181780409266, "percentage": 14.75, "elapsed_time": "10:53:28", "remaining_time": "2 days, 14:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1421, "total_steps": 9627, "loss": 1.989, "learning_rate": 9.471980873755865e-05, "epoch": 0.14760569232367302, "percentage": 14.76, "elapsed_time": "10:53:54", "remaining_time": "2 days, 14:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1422, "total_steps": 9627, "loss": 1.7134, "learning_rate": 9.471250835190957e-05, "epoch": 0.14770956684325334, "percentage": 14.77, "elapsed_time": "10:54:21", "remaining_time": "2 days, 14:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1423, "total_steps": 9627, "loss": 1.722, "learning_rate": 9.470520320472712e-05, "epoch": 0.1478134413628337, "percentage": 14.78, "elapsed_time": "10:54:48", "remaining_time": "2 days, 14:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1424, "total_steps": 9627, "loss": 1.5907, "learning_rate": 9.469789329678922e-05, "epoch": 0.14791731588241405, "percentage": 14.79, "elapsed_time": "10:55:15", "remaining_time": "2 days, 14:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1425, "total_steps": 9627, "loss": 1.7298, "learning_rate": 9.469057862887436e-05, "epoch": 0.14802119040199438, "percentage": 14.8, "elapsed_time": "10:55:42", "remaining_time": "2 days, 14:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1426, "total_steps": 9627, "loss": 1.9391, "learning_rate": 9.468325920176148e-05, "epoch": 0.14812506492157473, "percentage": 14.81, "elapsed_time": "10:56:09", "remaining_time": "2 days, 14:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1427, "total_steps": 9627, "loss": 1.7072, "learning_rate": 9.467593501623003e-05, "epoch": 0.1482289394411551, "percentage": 14.82, "elapsed_time": "10:56:36", "remaining_time": "2 days, 14:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1428, "total_steps": 9627, "loss": 1.7929, "learning_rate": 9.466860607305998e-05, "epoch": 0.14833281396073544, "percentage": 14.83, "elapsed_time": "10:57:02", "remaining_time": "2 days, 14:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1429, "total_steps": 9627, "loss": 1.8288, "learning_rate": 9.466127237303182e-05, "epoch": 0.14843668848031577, "percentage": 14.84, "elapsed_time": "10:57:30", "remaining_time": "2 days, 14:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 9627, "loss": 1.7313, "learning_rate": 9.465393391692653e-05, "epoch": 0.14854056299989613, "percentage": 14.85, "elapsed_time": "10:57:58", "remaining_time": "2 days, 14:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1431, "total_steps": 9627, "loss": 1.7905, "learning_rate": 9.464659070552558e-05, "epoch": 0.14864443751947648, "percentage": 14.86, "elapsed_time": "10:58:23", "remaining_time": "2 days, 14:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1432, "total_steps": 9627, "loss": 1.8856, "learning_rate": 9.463924273961099e-05, "epoch": 0.1487483120390568, "percentage": 14.87, "elapsed_time": "10:58:51", "remaining_time": "2 days, 14:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1433, "total_steps": 9627, "loss": 1.7671, "learning_rate": 9.463189001996525e-05, "epoch": 0.14885218655863716, "percentage": 14.89, "elapsed_time": "10:59:18", "remaining_time": "2 days, 14:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1434, "total_steps": 9627, "loss": 1.7791, "learning_rate": 9.462453254737133e-05, "epoch": 0.14895606107821752, "percentage": 14.9, "elapsed_time": "10:59:45", "remaining_time": "2 days, 14:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1435, "total_steps": 9627, "loss": 1.6404, "learning_rate": 9.461717032261282e-05, "epoch": 0.14905993559779787, "percentage": 14.91, "elapsed_time": "11:00:13", "remaining_time": "2 days, 14:48:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1436, "total_steps": 9627, "loss": 1.8078, "learning_rate": 9.460980334647367e-05, "epoch": 0.1491638101173782, "percentage": 14.92, "elapsed_time": "11:00:39", "remaining_time": "2 days, 14:48:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1437, "total_steps": 9627, "loss": 1.6382, "learning_rate": 9.460243161973846e-05, "epoch": 0.14926768463695855, "percentage": 14.93, "elapsed_time": "11:01:07", "remaining_time": "2 days, 14:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1438, "total_steps": 9627, "loss": 1.8884, "learning_rate": 9.459505514319216e-05, "epoch": 0.1493715591565389, "percentage": 14.94, "elapsed_time": "11:01:33", "remaining_time": "2 days, 14:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1439, "total_steps": 9627, "loss": 1.9866, "learning_rate": 9.458767391762038e-05, "epoch": 0.14947543367611923, "percentage": 14.95, "elapsed_time": "11:02:01", "remaining_time": "2 days, 14:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 9627, "loss": 1.8562, "learning_rate": 9.45802879438091e-05, "epoch": 0.1495793081956996, "percentage": 14.96, "elapsed_time": "11:02:27", "remaining_time": "2 days, 14:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1441, "total_steps": 9627, "loss": 1.8974, "learning_rate": 9.457289722254489e-05, "epoch": 0.14968318271527994, "percentage": 14.97, "elapsed_time": "11:02:55", "remaining_time": "2 days, 14:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1442, "total_steps": 9627, "loss": 1.878, "learning_rate": 9.456550175461483e-05, "epoch": 0.1497870572348603, "percentage": 14.98, "elapsed_time": "11:03:21", "remaining_time": "2 days, 14:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1443, "total_steps": 9627, "loss": 1.7597, "learning_rate": 9.455810154080644e-05, "epoch": 0.14989093175444063, "percentage": 14.99, "elapsed_time": "11:03:49", "remaining_time": "2 days, 14:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1444, "total_steps": 9627, "loss": 1.7119, "learning_rate": 9.45506965819078e-05, "epoch": 0.14999480627402098, "percentage": 15.0, "elapsed_time": "11:04:15", "remaining_time": "2 days, 14:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1445, "total_steps": 9627, "loss": 1.7925, "learning_rate": 9.45432868787075e-05, "epoch": 0.15009868079360134, "percentage": 15.01, "elapsed_time": "11:04:43", "remaining_time": "2 days, 14:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1446, "total_steps": 9627, "loss": 1.8274, "learning_rate": 9.453587243199458e-05, "epoch": 0.1502025553131817, "percentage": 15.02, "elapsed_time": "11:05:10", "remaining_time": "2 days, 14:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1447, "total_steps": 9627, "loss": 1.6782, "learning_rate": 9.452845324255865e-05, "epoch": 0.15030642983276202, "percentage": 15.03, "elapsed_time": "11:05:37", "remaining_time": "2 days, 14:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1448, "total_steps": 9627, "loss": 1.8381, "learning_rate": 9.452102931118979e-05, "epoch": 0.15041030435234237, "percentage": 15.04, "elapsed_time": "11:06:03", "remaining_time": "2 days, 14:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1449, "total_steps": 9627, "loss": 1.8949, "learning_rate": 9.451360063867857e-05, "epoch": 0.15051417887192273, "percentage": 15.05, "elapsed_time": "11:06:31", "remaining_time": "2 days, 14:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 9627, "loss": 1.7087, "learning_rate": 9.450616722581611e-05, "epoch": 0.15061805339150305, "percentage": 15.06, "elapsed_time": "11:06:57", "remaining_time": "2 days, 14:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1451, "total_steps": 9627, "loss": 1.7222, "learning_rate": 9.449872907339401e-05, "epoch": 0.1507219279110834, "percentage": 15.07, "elapsed_time": "11:07:25", "remaining_time": "2 days, 14:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1452, "total_steps": 9627, "loss": 1.7871, "learning_rate": 9.449128618220436e-05, "epoch": 0.15082580243066376, "percentage": 15.08, "elapsed_time": "11:07:51", "remaining_time": "2 days, 14:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1453, "total_steps": 9627, "loss": 1.7017, "learning_rate": 9.448383855303977e-05, "epoch": 0.15092967695024412, "percentage": 15.09, "elapsed_time": "11:08:18", "remaining_time": "2 days, 14:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1454, "total_steps": 9627, "loss": 1.9229, "learning_rate": 9.447638618669336e-05, "epoch": 0.15103355146982445, "percentage": 15.1, "elapsed_time": "11:08:45", "remaining_time": "2 days, 14:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1455, "total_steps": 9627, "loss": 1.8912, "learning_rate": 9.446892908395877e-05, "epoch": 0.1511374259894048, "percentage": 15.11, "elapsed_time": "11:09:11", "remaining_time": "2 days, 14:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1456, "total_steps": 9627, "loss": 1.8665, "learning_rate": 9.446146724563009e-05, "epoch": 0.15124130050898515, "percentage": 15.12, "elapsed_time": "11:09:39", "remaining_time": "2 days, 14:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1457, "total_steps": 9627, "loss": 1.6188, "learning_rate": 9.445400067250196e-05, "epoch": 0.15134517502856548, "percentage": 15.13, "elapsed_time": "11:10:05", "remaining_time": "2 days, 14:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1458, "total_steps": 9627, "loss": 1.7484, "learning_rate": 9.44465293653695e-05, "epoch": 0.15144904954814584, "percentage": 15.14, "elapsed_time": "11:10:33", "remaining_time": "2 days, 14:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1459, "total_steps": 9627, "loss": 1.6957, "learning_rate": 9.443905332502837e-05, "epoch": 0.1515529240677262, "percentage": 15.16, "elapsed_time": "11:10:59", "remaining_time": "2 days, 14:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 9627, "loss": 1.866, "learning_rate": 9.443157255227472e-05, "epoch": 0.15165679858730655, "percentage": 15.17, "elapsed_time": "11:11:26", "remaining_time": "2 days, 14:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1461, "total_steps": 9627, "loss": 1.8885, "learning_rate": 9.442408704790516e-05, "epoch": 0.15176067310688687, "percentage": 15.18, "elapsed_time": "11:11:53", "remaining_time": "2 days, 14:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1462, "total_steps": 9627, "loss": 1.5994, "learning_rate": 9.441659681271684e-05, "epoch": 0.15186454762646723, "percentage": 15.19, "elapsed_time": "11:12:20", "remaining_time": "2 days, 14:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1463, "total_steps": 9627, "loss": 1.741, "learning_rate": 9.440910184750743e-05, "epoch": 0.15196842214604758, "percentage": 15.2, "elapsed_time": "11:12:47", "remaining_time": "2 days, 14:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1464, "total_steps": 9627, "loss": 1.7756, "learning_rate": 9.440160215307508e-05, "epoch": 0.1520722966656279, "percentage": 15.21, "elapsed_time": "11:13:14", "remaining_time": "2 days, 14:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1465, "total_steps": 9627, "loss": 1.877, "learning_rate": 9.439409773021844e-05, "epoch": 0.15217617118520826, "percentage": 15.22, "elapsed_time": "11:13:40", "remaining_time": "2 days, 14:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1466, "total_steps": 9627, "loss": 1.7585, "learning_rate": 9.438658857973668e-05, "epoch": 0.15228004570478862, "percentage": 15.23, "elapsed_time": "11:14:06", "remaining_time": "2 days, 14:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1467, "total_steps": 9627, "loss": 1.7805, "learning_rate": 9.437907470242946e-05, "epoch": 0.15238392022436897, "percentage": 15.24, "elapsed_time": "11:14:35", "remaining_time": "2 days, 14:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1468, "total_steps": 9627, "loss": 1.7271, "learning_rate": 9.437155609909696e-05, "epoch": 0.1524877947439493, "percentage": 15.25, "elapsed_time": "11:15:00", "remaining_time": "2 days, 14:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1469, "total_steps": 9627, "loss": 1.858, "learning_rate": 9.436403277053984e-05, "epoch": 0.15259166926352966, "percentage": 15.26, "elapsed_time": "11:15:29", "remaining_time": "2 days, 14:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 9627, "loss": 1.8507, "learning_rate": 9.435650471755931e-05, "epoch": 0.15269554378311, "percentage": 15.27, "elapsed_time": "11:15:54", "remaining_time": "2 days, 14:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1471, "total_steps": 9627, "loss": 1.7086, "learning_rate": 9.4348971940957e-05, "epoch": 0.15279941830269034, "percentage": 15.28, "elapsed_time": "11:16:22", "remaining_time": "2 days, 14:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1472, "total_steps": 9627, "loss": 1.936, "learning_rate": 9.434143444153511e-05, "epoch": 0.1529032928222707, "percentage": 15.29, "elapsed_time": "11:16:48", "remaining_time": "2 days, 14:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1473, "total_steps": 9627, "loss": 1.7736, "learning_rate": 9.433389222009633e-05, "epoch": 0.15300716734185105, "percentage": 15.3, "elapsed_time": "11:17:15", "remaining_time": "2 days, 14:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1474, "total_steps": 9627, "loss": 1.7176, "learning_rate": 9.432634527744386e-05, "epoch": 0.1531110418614314, "percentage": 15.31, "elapsed_time": "11:17:42", "remaining_time": "2 days, 14:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1475, "total_steps": 9627, "loss": 1.9448, "learning_rate": 9.431879361438137e-05, "epoch": 0.15321491638101173, "percentage": 15.32, "elapsed_time": "11:18:09", "remaining_time": "2 days, 14:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1476, "total_steps": 9627, "loss": 1.7773, "learning_rate": 9.431123723171305e-05, "epoch": 0.15331879090059208, "percentage": 15.33, "elapsed_time": "11:18:36", "remaining_time": "2 days, 14:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1477, "total_steps": 9627, "loss": 1.9316, "learning_rate": 9.430367613024361e-05, "epoch": 0.15342266542017244, "percentage": 15.34, "elapsed_time": "11:19:02", "remaining_time": "2 days, 14:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1478, "total_steps": 9627, "loss": 1.5443, "learning_rate": 9.429611031077825e-05, "epoch": 0.15352653993975277, "percentage": 15.35, "elapsed_time": "11:19:30", "remaining_time": "2 days, 14:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1479, "total_steps": 9627, "loss": 1.8619, "learning_rate": 9.428853977412266e-05, "epoch": 0.15363041445933312, "percentage": 15.36, "elapsed_time": "11:19:56", "remaining_time": "2 days, 14:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 9627, "loss": 1.7752, "learning_rate": 9.428096452108305e-05, "epoch": 0.15373428897891347, "percentage": 15.37, "elapsed_time": "11:20:23", "remaining_time": "2 days, 14:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1481, "total_steps": 9627, "loss": 1.7397, "learning_rate": 9.427338455246612e-05, "epoch": 0.15383816349849383, "percentage": 15.38, "elapsed_time": "11:20:50", "remaining_time": "2 days, 14:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1482, "total_steps": 9627, "loss": 1.7385, "learning_rate": 9.426579986907909e-05, "epoch": 0.15394203801807416, "percentage": 15.39, "elapsed_time": "11:21:16", "remaining_time": "2 days, 14:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1483, "total_steps": 9627, "loss": 1.8288, "learning_rate": 9.425821047172965e-05, "epoch": 0.1540459125376545, "percentage": 15.4, "elapsed_time": "11:21:43", "remaining_time": "2 days, 14:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1484, "total_steps": 9627, "loss": 1.9567, "learning_rate": 9.425061636122603e-05, "epoch": 0.15414978705723487, "percentage": 15.41, "elapsed_time": "11:22:09", "remaining_time": "2 days, 14:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1485, "total_steps": 9627, "loss": 1.7383, "learning_rate": 9.424301753837692e-05, "epoch": 0.15425366157681522, "percentage": 15.43, "elapsed_time": "11:22:38", "remaining_time": "2 days, 14:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1486, "total_steps": 9627, "loss": 1.8508, "learning_rate": 9.423541400399157e-05, "epoch": 0.15435753609639555, "percentage": 15.44, "elapsed_time": "11:23:03", "remaining_time": "2 days, 14:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1487, "total_steps": 9627, "loss": 1.9329, "learning_rate": 9.422780575887967e-05, "epoch": 0.1544614106159759, "percentage": 15.45, "elapsed_time": "11:23:31", "remaining_time": "2 days, 14:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1488, "total_steps": 9627, "loss": 1.9418, "learning_rate": 9.422019280385145e-05, "epoch": 0.15456528513555626, "percentage": 15.46, "elapsed_time": "11:23:57", "remaining_time": "2 days, 14:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1489, "total_steps": 9627, "loss": 1.8998, "learning_rate": 9.421257513971762e-05, "epoch": 0.15466915965513658, "percentage": 15.47, "elapsed_time": "11:24:25", "remaining_time": "2 days, 14:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 9627, "loss": 1.8042, "learning_rate": 9.420495276728943e-05, "epoch": 0.15477303417471694, "percentage": 15.48, "elapsed_time": "11:24:51", "remaining_time": "2 days, 14:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1491, "total_steps": 9627, "loss": 1.9044, "learning_rate": 9.419732568737856e-05, "epoch": 0.1548769086942973, "percentage": 15.49, "elapsed_time": "11:25:18", "remaining_time": "2 days, 14:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1492, "total_steps": 9627, "loss": 2.098, "learning_rate": 9.418969390079726e-05, "epoch": 0.15498078321387765, "percentage": 15.5, "elapsed_time": "11:25:44", "remaining_time": "2 days, 14:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1493, "total_steps": 9627, "loss": 1.7396, "learning_rate": 9.418205740835825e-05, "epoch": 0.15508465773345798, "percentage": 15.51, "elapsed_time": "11:26:11", "remaining_time": "2 days, 14:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1494, "total_steps": 9627, "loss": 1.7114, "learning_rate": 9.417441621087476e-05, "epoch": 0.15518853225303833, "percentage": 15.52, "elapsed_time": "11:26:38", "remaining_time": "2 days, 14:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1495, "total_steps": 9627, "loss": 1.828, "learning_rate": 9.416677030916053e-05, "epoch": 0.15529240677261869, "percentage": 15.53, "elapsed_time": "11:27:04", "remaining_time": "2 days, 14:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1496, "total_steps": 9627, "loss": 1.7821, "learning_rate": 9.415911970402976e-05, "epoch": 0.155396281292199, "percentage": 15.54, "elapsed_time": "11:27:31", "remaining_time": "2 days, 14:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1497, "total_steps": 9627, "loss": 1.8746, "learning_rate": 9.41514643962972e-05, "epoch": 0.15550015581177937, "percentage": 15.55, "elapsed_time": "11:27:58", "remaining_time": "2 days, 14:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1498, "total_steps": 9627, "loss": 1.9818, "learning_rate": 9.414380438677808e-05, "epoch": 0.15560403033135972, "percentage": 15.56, "elapsed_time": "11:28:25", "remaining_time": "2 days, 14:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1499, "total_steps": 9627, "loss": 1.7178, "learning_rate": 9.413613967628814e-05, "epoch": 0.15570790485094008, "percentage": 15.57, "elapsed_time": "11:28:51", "remaining_time": "2 days, 14:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 9627, "loss": 1.5971, "learning_rate": 9.412847026564357e-05, "epoch": 0.1558117793705204, "percentage": 15.58, "elapsed_time": "11:29:18", "remaining_time": "2 days, 14:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1501, "total_steps": 9627, "loss": 1.8022, "learning_rate": 9.412079615566116e-05, "epoch": 0.15591565389010076, "percentage": 15.59, "elapsed_time": "11:29:44", "remaining_time": "2 days, 14:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1502, "total_steps": 9627, "loss": 1.8473, "learning_rate": 9.411311734715811e-05, "epoch": 0.1560195284096811, "percentage": 15.6, "elapsed_time": "11:30:11", "remaining_time": "2 days, 14:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1503, "total_steps": 9627, "loss": 1.7718, "learning_rate": 9.410543384095214e-05, "epoch": 0.15612340292926144, "percentage": 15.61, "elapsed_time": "11:30:38", "remaining_time": "2 days, 14:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1504, "total_steps": 9627, "loss": 1.8614, "learning_rate": 9.409774563786152e-05, "epoch": 0.1562272774488418, "percentage": 15.62, "elapsed_time": "11:31:05", "remaining_time": "2 days, 14:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1505, "total_steps": 9627, "loss": 2.1187, "learning_rate": 9.409005273870495e-05, "epoch": 0.15633115196842215, "percentage": 15.63, "elapsed_time": "11:31:31", "remaining_time": "2 days, 14:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1506, "total_steps": 9627, "loss": 1.7244, "learning_rate": 9.40823551443017e-05, "epoch": 0.1564350264880025, "percentage": 15.64, "elapsed_time": "11:31:59", "remaining_time": "2 days, 14:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1507, "total_steps": 9627, "loss": 1.8046, "learning_rate": 9.407465285547147e-05, "epoch": 0.15653890100758283, "percentage": 15.65, "elapsed_time": "11:32:26", "remaining_time": "2 days, 14:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1508, "total_steps": 9627, "loss": 1.7574, "learning_rate": 9.406694587303451e-05, "epoch": 0.15664277552716319, "percentage": 15.66, "elapsed_time": "11:32:52", "remaining_time": "2 days, 14:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1509, "total_steps": 9627, "loss": 1.8895, "learning_rate": 9.405923419781154e-05, "epoch": 0.15674665004674354, "percentage": 15.67, "elapsed_time": "11:33:18", "remaining_time": "2 days, 14:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 9627, "loss": 1.6415, "learning_rate": 9.405151783062381e-05, "epoch": 0.15685052456632387, "percentage": 15.69, "elapsed_time": "11:33:46", "remaining_time": "2 days, 14:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1511, "total_steps": 9627, "loss": 1.7707, "learning_rate": 9.404379677229305e-05, "epoch": 0.15695439908590422, "percentage": 15.7, "elapsed_time": "11:34:12", "remaining_time": "2 days, 14:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1512, "total_steps": 9627, "loss": 1.7814, "learning_rate": 9.403607102364148e-05, "epoch": 0.15705827360548458, "percentage": 15.71, "elapsed_time": "11:34:40", "remaining_time": "2 days, 14:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1513, "total_steps": 9627, "loss": 2.0017, "learning_rate": 9.402834058549184e-05, "epoch": 0.15716214812506493, "percentage": 15.72, "elapsed_time": "11:35:06", "remaining_time": "2 days, 14:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1514, "total_steps": 9627, "loss": 1.8552, "learning_rate": 9.402060545866737e-05, "epoch": 0.15726602264464526, "percentage": 15.73, "elapsed_time": "11:35:33", "remaining_time": "2 days, 14:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1515, "total_steps": 9627, "loss": 1.8447, "learning_rate": 9.401286564399178e-05, "epoch": 0.15736989716422561, "percentage": 15.74, "elapsed_time": "11:36:00", "remaining_time": "2 days, 14:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1516, "total_steps": 9627, "loss": 1.6783, "learning_rate": 9.400512114228935e-05, "epoch": 0.15747377168380597, "percentage": 15.75, "elapsed_time": "11:36:27", "remaining_time": "2 days, 14:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1517, "total_steps": 9627, "loss": 1.7901, "learning_rate": 9.399737195438473e-05, "epoch": 0.1575776462033863, "percentage": 15.76, "elapsed_time": "11:36:53", "remaining_time": "2 days, 14:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1518, "total_steps": 9627, "loss": 1.6647, "learning_rate": 9.398961808110321e-05, "epoch": 0.15768152072296665, "percentage": 15.77, "elapsed_time": "11:37:21", "remaining_time": "2 days, 14:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1519, "total_steps": 9627, "loss": 1.7797, "learning_rate": 9.398185952327048e-05, "epoch": 0.157785395242547, "percentage": 15.78, "elapsed_time": "11:37:47", "remaining_time": "2 days, 14:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 9627, "loss": 1.6302, "learning_rate": 9.397409628171279e-05, "epoch": 0.15788926976212736, "percentage": 15.79, "elapsed_time": "11:38:14", "remaining_time": "2 days, 14:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1521, "total_steps": 9627, "loss": 1.9296, "learning_rate": 9.396632835725687e-05, "epoch": 0.1579931442817077, "percentage": 15.8, "elapsed_time": "11:38:41", "remaining_time": "2 days, 14:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1522, "total_steps": 9627, "loss": 1.9748, "learning_rate": 9.395855575072991e-05, "epoch": 0.15809701880128804, "percentage": 15.81, "elapsed_time": "11:39:07", "remaining_time": "2 days, 14:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1523, "total_steps": 9627, "loss": 1.9662, "learning_rate": 9.395077846295967e-05, "epoch": 0.1582008933208684, "percentage": 15.82, "elapsed_time": "11:39:33", "remaining_time": "2 days, 14:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1524, "total_steps": 9627, "loss": 1.7051, "learning_rate": 9.394299649477434e-05, "epoch": 0.15830476784044875, "percentage": 15.83, "elapsed_time": "11:39:59", "remaining_time": "2 days, 14:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1525, "total_steps": 9627, "loss": 1.8365, "learning_rate": 9.393520984700266e-05, "epoch": 0.15840864236002908, "percentage": 15.84, "elapsed_time": "11:40:27", "remaining_time": "2 days, 14:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1526, "total_steps": 9627, "loss": 1.8812, "learning_rate": 9.392741852047385e-05, "epoch": 0.15851251687960943, "percentage": 15.85, "elapsed_time": "11:40:53", "remaining_time": "2 days, 14:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1527, "total_steps": 9627, "loss": 1.8, "learning_rate": 9.391962251601758e-05, "epoch": 0.1586163913991898, "percentage": 15.86, "elapsed_time": "11:41:20", "remaining_time": "2 days, 14:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1528, "total_steps": 9627, "loss": 1.5527, "learning_rate": 9.391182183446413e-05, "epoch": 0.15872026591877011, "percentage": 15.87, "elapsed_time": "11:41:46", "remaining_time": "2 days, 13:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1529, "total_steps": 9627, "loss": 1.9147, "learning_rate": 9.390401647664417e-05, "epoch": 0.15882414043835047, "percentage": 15.88, "elapsed_time": "11:42:12", "remaining_time": "2 days, 13:59:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 9627, "loss": 1.7478, "learning_rate": 9.389620644338892e-05, "epoch": 0.15892801495793082, "percentage": 15.89, "elapsed_time": "11:42:40", "remaining_time": "2 days, 13:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1531, "total_steps": 9627, "loss": 1.5696, "learning_rate": 9.388839173553007e-05, "epoch": 0.15903188947751118, "percentage": 15.9, "elapsed_time": "11:43:06", "remaining_time": "2 days, 13:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1532, "total_steps": 9627, "loss": 1.6998, "learning_rate": 9.388057235389986e-05, "epoch": 0.1591357639970915, "percentage": 15.91, "elapsed_time": "11:43:34", "remaining_time": "2 days, 13:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1533, "total_steps": 9627, "loss": 1.8103, "learning_rate": 9.3872748299331e-05, "epoch": 0.15923963851667186, "percentage": 15.92, "elapsed_time": "11:43:59", "remaining_time": "2 days, 13:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1534, "total_steps": 9627, "loss": 1.7707, "learning_rate": 9.386491957265662e-05, "epoch": 0.15934351303625222, "percentage": 15.93, "elapsed_time": "11:44:26", "remaining_time": "2 days, 13:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1535, "total_steps": 9627, "loss": 1.8373, "learning_rate": 9.38570861747105e-05, "epoch": 0.15944738755583254, "percentage": 15.94, "elapsed_time": "11:44:53", "remaining_time": "2 days, 13:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1536, "total_steps": 9627, "loss": 1.7374, "learning_rate": 9.384924810632679e-05, "epoch": 0.1595512620754129, "percentage": 15.96, "elapsed_time": "11:45:20", "remaining_time": "2 days, 13:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1537, "total_steps": 9627, "loss": 2.0285, "learning_rate": 9.384140536834018e-05, "epoch": 0.15965513659499325, "percentage": 15.97, "elapsed_time": "11:45:46", "remaining_time": "2 days, 13:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1538, "total_steps": 9627, "loss": 1.8455, "learning_rate": 9.383355796158588e-05, "epoch": 0.1597590111145736, "percentage": 15.98, "elapsed_time": "11:46:13", "remaining_time": "2 days, 13:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1539, "total_steps": 9627, "loss": 1.8248, "learning_rate": 9.382570588689958e-05, "epoch": 0.15986288563415393, "percentage": 15.99, "elapsed_time": "11:46:39", "remaining_time": "2 days, 13:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 9627, "loss": 2.1518, "learning_rate": 9.381784914511746e-05, "epoch": 0.1599667601537343, "percentage": 16.0, "elapsed_time": "11:47:07", "remaining_time": "2 days, 13:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1541, "total_steps": 9627, "loss": 1.7234, "learning_rate": 9.38099877370762e-05, "epoch": 0.16007063467331464, "percentage": 16.01, "elapsed_time": "11:47:33", "remaining_time": "2 days, 13:52:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1542, "total_steps": 9627, "loss": 1.7744, "learning_rate": 9.380212166361298e-05, "epoch": 0.16017450919289497, "percentage": 16.02, "elapsed_time": "11:48:00", "remaining_time": "2 days, 13:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1543, "total_steps": 9627, "loss": 2.0752, "learning_rate": 9.379425092556545e-05, "epoch": 0.16027838371247533, "percentage": 16.03, "elapsed_time": "11:48:26", "remaining_time": "2 days, 13:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1544, "total_steps": 9627, "loss": 1.7362, "learning_rate": 9.378637552377181e-05, "epoch": 0.16038225823205568, "percentage": 16.04, "elapsed_time": "11:48:53", "remaining_time": "2 days, 13:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1545, "total_steps": 9627, "loss": 1.9631, "learning_rate": 9.377849545907074e-05, "epoch": 0.16048613275163603, "percentage": 16.05, "elapsed_time": "11:49:20", "remaining_time": "2 days, 13:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1546, "total_steps": 9627, "loss": 1.955, "learning_rate": 9.377061073230138e-05, "epoch": 0.16059000727121636, "percentage": 16.06, "elapsed_time": "11:49:46", "remaining_time": "2 days, 13:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1547, "total_steps": 9627, "loss": 1.5817, "learning_rate": 9.37627213443034e-05, "epoch": 0.16069388179079672, "percentage": 16.07, "elapsed_time": "11:50:14", "remaining_time": "2 days, 13:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1548, "total_steps": 9627, "loss": 1.7563, "learning_rate": 9.375482729591696e-05, "epoch": 0.16079775631037707, "percentage": 16.08, "elapsed_time": "11:50:39", "remaining_time": "2 days, 13:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1549, "total_steps": 9627, "loss": 1.7638, "learning_rate": 9.37469285879827e-05, "epoch": 0.1609016308299574, "percentage": 16.09, "elapsed_time": "11:51:07", "remaining_time": "2 days, 13:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 9627, "loss": 1.6821, "learning_rate": 9.373902522134181e-05, "epoch": 0.16100550534953775, "percentage": 16.1, "elapsed_time": "11:51:33", "remaining_time": "2 days, 13:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1551, "total_steps": 9627, "loss": 1.6423, "learning_rate": 9.37311171968359e-05, "epoch": 0.1611093798691181, "percentage": 16.11, "elapsed_time": "11:51:59", "remaining_time": "2 days, 13:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1552, "total_steps": 9627, "loss": 1.7089, "learning_rate": 9.372320451530711e-05, "epoch": 0.16121325438869846, "percentage": 16.12, "elapsed_time": "11:52:27", "remaining_time": "2 days, 13:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1553, "total_steps": 9627, "loss": 1.801, "learning_rate": 9.371528717759811e-05, "epoch": 0.1613171289082788, "percentage": 16.13, "elapsed_time": "11:52:54", "remaining_time": "2 days, 13:46:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1554, "total_steps": 9627, "loss": 1.7258, "learning_rate": 9.370736518455203e-05, "epoch": 0.16142100342785914, "percentage": 16.14, "elapsed_time": "11:53:20", "remaining_time": "2 days, 13:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1555, "total_steps": 9627, "loss": 1.8522, "learning_rate": 9.369943853701246e-05, "epoch": 0.1615248779474395, "percentage": 16.15, "elapsed_time": "11:53:47", "remaining_time": "2 days, 13:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1556, "total_steps": 9627, "loss": 1.6075, "learning_rate": 9.369150723582358e-05, "epoch": 0.16162875246701985, "percentage": 16.16, "elapsed_time": "11:54:14", "remaining_time": "2 days, 13:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1557, "total_steps": 9627, "loss": 1.7797, "learning_rate": 9.368357128182998e-05, "epoch": 0.16173262698660018, "percentage": 16.17, "elapsed_time": "11:54:39", "remaining_time": "2 days, 13:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1558, "total_steps": 9627, "loss": 1.8579, "learning_rate": 9.367563067587677e-05, "epoch": 0.16183650150618054, "percentage": 16.18, "elapsed_time": "11:55:07", "remaining_time": "2 days, 13:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1559, "total_steps": 9627, "loss": 1.708, "learning_rate": 9.366768541880958e-05, "epoch": 0.1619403760257609, "percentage": 16.19, "elapsed_time": "11:55:33", "remaining_time": "2 days, 13:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 9627, "loss": 1.8155, "learning_rate": 9.365973551147453e-05, "epoch": 0.16204425054534122, "percentage": 16.2, "elapsed_time": "11:56:00", "remaining_time": "2 days, 13:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1561, "total_steps": 9627, "loss": 1.7573, "learning_rate": 9.365178095471819e-05, "epoch": 0.16214812506492157, "percentage": 16.21, "elapsed_time": "11:56:26", "remaining_time": "2 days, 13:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1562, "total_steps": 9627, "loss": 1.898, "learning_rate": 9.364382174938768e-05, "epoch": 0.16225199958450193, "percentage": 16.23, "elapsed_time": "11:56:53", "remaining_time": "2 days, 13:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1563, "total_steps": 9627, "loss": 1.6292, "learning_rate": 9.363585789633057e-05, "epoch": 0.16235587410408228, "percentage": 16.24, "elapsed_time": "11:57:19", "remaining_time": "2 days, 13:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1564, "total_steps": 9627, "loss": 1.6484, "learning_rate": 9.3627889396395e-05, "epoch": 0.1624597486236626, "percentage": 16.25, "elapsed_time": "11:57:46", "remaining_time": "2 days, 13:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1565, "total_steps": 9627, "loss": 1.7915, "learning_rate": 9.36199162504295e-05, "epoch": 0.16256362314324296, "percentage": 16.26, "elapsed_time": "11:58:12", "remaining_time": "2 days, 13:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1566, "total_steps": 9627, "loss": 1.6923, "learning_rate": 9.361193845928318e-05, "epoch": 0.16266749766282332, "percentage": 16.27, "elapsed_time": "11:58:39", "remaining_time": "2 days, 13:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1567, "total_steps": 9627, "loss": 1.8842, "learning_rate": 9.360395602380559e-05, "epoch": 0.16277137218240365, "percentage": 16.28, "elapsed_time": "11:59:06", "remaining_time": "2 days, 13:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1568, "total_steps": 9627, "loss": 1.9783, "learning_rate": 9.359596894484682e-05, "epoch": 0.162875246701984, "percentage": 16.29, "elapsed_time": "11:59:32", "remaining_time": "2 days, 13:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1569, "total_steps": 9627, "loss": 1.8153, "learning_rate": 9.35879772232574e-05, "epoch": 0.16297912122156435, "percentage": 16.3, "elapsed_time": "11:59:59", "remaining_time": "2 days, 13:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 9627, "loss": 1.5263, "learning_rate": 9.357998085988842e-05, "epoch": 0.1630829957411447, "percentage": 16.31, "elapsed_time": "12:00:24", "remaining_time": "2 days, 13:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1571, "total_steps": 9627, "loss": 1.6806, "learning_rate": 9.35719798555914e-05, "epoch": 0.16318687026072504, "percentage": 16.32, "elapsed_time": "12:00:52", "remaining_time": "2 days, 13:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1572, "total_steps": 9627, "loss": 1.855, "learning_rate": 9.356397421121842e-05, "epoch": 0.1632907447803054, "percentage": 16.33, "elapsed_time": "12:01:18", "remaining_time": "2 days, 13:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1573, "total_steps": 9627, "loss": 1.8909, "learning_rate": 9.355596392762197e-05, "epoch": 0.16339461929988575, "percentage": 16.34, "elapsed_time": "12:01:44", "remaining_time": "2 days, 13:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1574, "total_steps": 9627, "loss": 1.874, "learning_rate": 9.354794900565515e-05, "epoch": 0.16349849381946607, "percentage": 16.35, "elapsed_time": "12:02:11", "remaining_time": "2 days, 13:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1575, "total_steps": 9627, "loss": 1.6768, "learning_rate": 9.353992944617142e-05, "epoch": 0.16360236833904643, "percentage": 16.36, "elapsed_time": "12:02:38", "remaining_time": "2 days, 13:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1576, "total_steps": 9627, "loss": 1.6279, "learning_rate": 9.353190525002484e-05, "epoch": 0.16370624285862678, "percentage": 16.37, "elapsed_time": "12:03:03", "remaining_time": "2 days, 13:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1577, "total_steps": 9627, "loss": 1.8541, "learning_rate": 9.35238764180699e-05, "epoch": 0.16381011737820714, "percentage": 16.38, "elapsed_time": "12:03:31", "remaining_time": "2 days, 13:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1578, "total_steps": 9627, "loss": 1.5282, "learning_rate": 9.351584295116165e-05, "epoch": 0.16391399189778746, "percentage": 16.39, "elapsed_time": "12:03:57", "remaining_time": "2 days, 13:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1579, "total_steps": 9627, "loss": 1.6896, "learning_rate": 9.350780485015553e-05, "epoch": 0.16401786641736782, "percentage": 16.4, "elapsed_time": "12:04:23", "remaining_time": "2 days, 13:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 9627, "loss": 1.57, "learning_rate": 9.349976211590758e-05, "epoch": 0.16412174093694817, "percentage": 16.41, "elapsed_time": "12:04:49", "remaining_time": "2 days, 13:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1581, "total_steps": 9627, "loss": 1.5819, "learning_rate": 9.349171474927427e-05, "epoch": 0.1642256154565285, "percentage": 16.42, "elapsed_time": "12:05:15", "remaining_time": "2 days, 13:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1582, "total_steps": 9627, "loss": 1.6357, "learning_rate": 9.34836627511126e-05, "epoch": 0.16432948997610886, "percentage": 16.43, "elapsed_time": "12:05:42", "remaining_time": "2 days, 13:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1583, "total_steps": 9627, "loss": 1.7312, "learning_rate": 9.347560612228003e-05, "epoch": 0.1644333644956892, "percentage": 16.44, "elapsed_time": "12:06:08", "remaining_time": "2 days, 13:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1584, "total_steps": 9627, "loss": 1.8537, "learning_rate": 9.346754486363452e-05, "epoch": 0.16453723901526957, "percentage": 16.45, "elapsed_time": "12:06:34", "remaining_time": "2 days, 13:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1585, "total_steps": 9627, "loss": 1.6428, "learning_rate": 9.345947897603455e-05, "epoch": 0.1646411135348499, "percentage": 16.46, "elapsed_time": "12:07:01", "remaining_time": "2 days, 13:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1586, "total_steps": 9627, "loss": 1.8029, "learning_rate": 9.345140846033906e-05, "epoch": 0.16474498805443025, "percentage": 16.47, "elapsed_time": "12:07:27", "remaining_time": "2 days, 13:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1587, "total_steps": 9627, "loss": 1.6589, "learning_rate": 9.344333331740751e-05, "epoch": 0.1648488625740106, "percentage": 16.48, "elapsed_time": "12:07:54", "remaining_time": "2 days, 13:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1588, "total_steps": 9627, "loss": 1.7891, "learning_rate": 9.343525354809984e-05, "epoch": 0.16495273709359093, "percentage": 16.5, "elapsed_time": "12:08:20", "remaining_time": "2 days, 13:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1589, "total_steps": 9627, "loss": 1.7708, "learning_rate": 9.342716915327647e-05, "epoch": 0.16505661161317128, "percentage": 16.51, "elapsed_time": "12:08:47", "remaining_time": "2 days, 13:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 9627, "loss": 1.7155, "learning_rate": 9.341908013379831e-05, "epoch": 0.16516048613275164, "percentage": 16.52, "elapsed_time": "12:09:13", "remaining_time": "2 days, 13:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1591, "total_steps": 9627, "loss": 1.8784, "learning_rate": 9.341098649052681e-05, "epoch": 0.165264360652332, "percentage": 16.53, "elapsed_time": "12:09:39", "remaining_time": "2 days, 13:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1592, "total_steps": 9627, "loss": 1.874, "learning_rate": 9.340288822432388e-05, "epoch": 0.16536823517191232, "percentage": 16.54, "elapsed_time": "12:10:06", "remaining_time": "2 days, 13:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1593, "total_steps": 9627, "loss": 1.5365, "learning_rate": 9.339478533605191e-05, "epoch": 0.16547210969149267, "percentage": 16.55, "elapsed_time": "12:10:32", "remaining_time": "2 days, 13:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1594, "total_steps": 9627, "loss": 1.7984, "learning_rate": 9.338667782657378e-05, "epoch": 0.16557598421107303, "percentage": 16.56, "elapsed_time": "12:10:58", "remaining_time": "2 days, 13:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1595, "total_steps": 9627, "loss": 1.6244, "learning_rate": 9.337856569675288e-05, "epoch": 0.16567985873065338, "percentage": 16.57, "elapsed_time": "12:11:25", "remaining_time": "2 days, 13:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1596, "total_steps": 9627, "loss": 1.8774, "learning_rate": 9.337044894745313e-05, "epoch": 0.1657837332502337, "percentage": 16.58, "elapsed_time": "12:11:51", "remaining_time": "2 days, 13:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1597, "total_steps": 9627, "loss": 1.7503, "learning_rate": 9.336232757953884e-05, "epoch": 0.16588760776981407, "percentage": 16.59, "elapsed_time": "12:12:18", "remaining_time": "2 days, 13:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1598, "total_steps": 9627, "loss": 1.8433, "learning_rate": 9.335420159387491e-05, "epoch": 0.16599148228939442, "percentage": 16.6, "elapsed_time": "12:12:44", "remaining_time": "2 days, 13:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1599, "total_steps": 9627, "loss": 1.8019, "learning_rate": 9.33460709913267e-05, "epoch": 0.16609535680897475, "percentage": 16.61, "elapsed_time": "12:13:11", "remaining_time": "2 days, 13:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 9627, "loss": 1.9248, "learning_rate": 9.333793577276004e-05, "epoch": 0.1661992313285551, "percentage": 16.62, "elapsed_time": "12:13:37", "remaining_time": "2 days, 13:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1601, "total_steps": 9627, "loss": 1.674, "learning_rate": 9.332979593904125e-05, "epoch": 0.16630310584813546, "percentage": 16.63, "elapsed_time": "12:14:03", "remaining_time": "2 days, 13:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1602, "total_steps": 9627, "loss": 1.9506, "learning_rate": 9.33216514910372e-05, "epoch": 0.1664069803677158, "percentage": 16.64, "elapsed_time": "12:14:30", "remaining_time": "2 days, 13:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1603, "total_steps": 9627, "loss": 1.716, "learning_rate": 9.331350242961518e-05, "epoch": 0.16651085488729614, "percentage": 16.65, "elapsed_time": "12:14:56", "remaining_time": "2 days, 13:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1604, "total_steps": 9627, "loss": 1.7274, "learning_rate": 9.3305348755643e-05, "epoch": 0.1666147294068765, "percentage": 16.66, "elapsed_time": "12:15:22", "remaining_time": "2 days, 13:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1605, "total_steps": 9627, "loss": 1.7231, "learning_rate": 9.329719046998898e-05, "epoch": 0.16671860392645685, "percentage": 16.67, "elapsed_time": "12:15:49", "remaining_time": "2 days, 13:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1606, "total_steps": 9627, "loss": 1.6772, "learning_rate": 9.328902757352191e-05, "epoch": 0.16682247844603718, "percentage": 16.68, "elapsed_time": "12:16:16", "remaining_time": "2 days, 13:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1607, "total_steps": 9627, "loss": 1.6853, "learning_rate": 9.328086006711108e-05, "epoch": 0.16692635296561753, "percentage": 16.69, "elapsed_time": "12:16:42", "remaining_time": "2 days, 13:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1608, "total_steps": 9627, "loss": 1.7584, "learning_rate": 9.327268795162622e-05, "epoch": 0.16703022748519789, "percentage": 16.7, "elapsed_time": "12:17:08", "remaining_time": "2 days, 13:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1609, "total_steps": 9627, "loss": 1.7157, "learning_rate": 9.326451122793766e-05, "epoch": 0.16713410200477824, "percentage": 16.71, "elapsed_time": "12:17:35", "remaining_time": "2 days, 13:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 9627, "loss": 1.7911, "learning_rate": 9.325632989691613e-05, "epoch": 0.16723797652435857, "percentage": 16.72, "elapsed_time": "12:18:02", "remaining_time": "2 days, 13:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1611, "total_steps": 9627, "loss": 1.7849, "learning_rate": 9.324814395943289e-05, "epoch": 0.16734185104393892, "percentage": 16.73, "elapsed_time": "12:18:29", "remaining_time": "2 days, 13:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1612, "total_steps": 9627, "loss": 1.9662, "learning_rate": 9.323995341635963e-05, "epoch": 0.16744572556351928, "percentage": 16.74, "elapsed_time": "12:18:54", "remaining_time": "2 days, 13:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1613, "total_steps": 9627, "loss": 1.8091, "learning_rate": 9.323175826856865e-05, "epoch": 0.1675496000830996, "percentage": 16.75, "elapsed_time": "12:19:21", "remaining_time": "2 days, 13:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1614, "total_steps": 9627, "loss": 1.716, "learning_rate": 9.322355851693263e-05, "epoch": 0.16765347460267996, "percentage": 16.77, "elapsed_time": "12:19:48", "remaining_time": "2 days, 13:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1615, "total_steps": 9627, "loss": 1.8553, "learning_rate": 9.321535416232476e-05, "epoch": 0.1677573491222603, "percentage": 16.78, "elapsed_time": "12:20:14", "remaining_time": "2 days, 13:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1616, "total_steps": 9627, "loss": 1.6873, "learning_rate": 9.32071452056188e-05, "epoch": 0.16786122364184067, "percentage": 16.79, "elapsed_time": "12:20:41", "remaining_time": "2 days, 13:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1617, "total_steps": 9627, "loss": 1.7064, "learning_rate": 9.319893164768888e-05, "epoch": 0.167965098161421, "percentage": 16.8, "elapsed_time": "12:21:07", "remaining_time": "2 days, 13:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1618, "total_steps": 9627, "loss": 1.6289, "learning_rate": 9.31907134894097e-05, "epoch": 0.16806897268100135, "percentage": 16.81, "elapsed_time": "12:21:34", "remaining_time": "2 days, 13:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1619, "total_steps": 9627, "loss": 1.7028, "learning_rate": 9.318249073165646e-05, "epoch": 0.1681728472005817, "percentage": 16.82, "elapsed_time": "12:22:01", "remaining_time": "2 days, 13:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 9627, "loss": 1.7427, "learning_rate": 9.317426337530477e-05, "epoch": 0.16827672172016203, "percentage": 16.83, "elapsed_time": "12:22:27", "remaining_time": "2 days, 13:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1621, "total_steps": 9627, "loss": 1.6961, "learning_rate": 9.316603142123082e-05, "epoch": 0.16838059623974239, "percentage": 16.84, "elapsed_time": "12:22:54", "remaining_time": "2 days, 13:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1622, "total_steps": 9627, "loss": 1.8285, "learning_rate": 9.315779487031122e-05, "epoch": 0.16848447075932274, "percentage": 16.85, "elapsed_time": "12:23:20", "remaining_time": "2 days, 13:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1623, "total_steps": 9627, "loss": 1.643, "learning_rate": 9.314955372342311e-05, "epoch": 0.1685883452789031, "percentage": 16.86, "elapsed_time": "12:23:47", "remaining_time": "2 days, 13:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1624, "total_steps": 9627, "loss": 1.8822, "learning_rate": 9.314130798144412e-05, "epoch": 0.16869221979848342, "percentage": 16.87, "elapsed_time": "12:24:13", "remaining_time": "2 days, 13:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1625, "total_steps": 9627, "loss": 1.9001, "learning_rate": 9.313305764525232e-05, "epoch": 0.16879609431806378, "percentage": 16.88, "elapsed_time": "12:24:40", "remaining_time": "2 days, 13:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1626, "total_steps": 9627, "loss": 1.8858, "learning_rate": 9.312480271572634e-05, "epoch": 0.16889996883764413, "percentage": 16.89, "elapsed_time": "12:25:05", "remaining_time": "2 days, 13:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1627, "total_steps": 9627, "loss": 1.8909, "learning_rate": 9.311654319374528e-05, "epoch": 0.16900384335722446, "percentage": 16.9, "elapsed_time": "12:25:33", "remaining_time": "2 days, 13:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1628, "total_steps": 9627, "loss": 1.8039, "learning_rate": 9.310827908018866e-05, "epoch": 0.16910771787680481, "percentage": 16.91, "elapsed_time": "12:25:59", "remaining_time": "2 days, 13:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1629, "total_steps": 9627, "loss": 1.6478, "learning_rate": 9.31000103759366e-05, "epoch": 0.16921159239638517, "percentage": 16.92, "elapsed_time": "12:26:25", "remaining_time": "2 days, 13:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 9627, "loss": 1.7259, "learning_rate": 9.309173708186963e-05, "epoch": 0.16931546691596552, "percentage": 16.93, "elapsed_time": "12:26:51", "remaining_time": "2 days, 13:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1631, "total_steps": 9627, "loss": 1.8386, "learning_rate": 9.308345919886877e-05, "epoch": 0.16941934143554585, "percentage": 16.94, "elapsed_time": "12:27:18", "remaining_time": "2 days, 13:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1632, "total_steps": 9627, "loss": 1.8391, "learning_rate": 9.307517672781557e-05, "epoch": 0.1695232159551262, "percentage": 16.95, "elapsed_time": "12:27:44", "remaining_time": "2 days, 13:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1633, "total_steps": 9627, "loss": 1.8277, "learning_rate": 9.306688966959205e-05, "epoch": 0.16962709047470656, "percentage": 16.96, "elapsed_time": "12:28:10", "remaining_time": "2 days, 13:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1634, "total_steps": 9627, "loss": 1.7996, "learning_rate": 9.305859802508073e-05, "epoch": 0.16973096499428691, "percentage": 16.97, "elapsed_time": "12:28:36", "remaining_time": "2 days, 13:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1635, "total_steps": 9627, "loss": 1.7441, "learning_rate": 9.305030179516458e-05, "epoch": 0.16983483951386724, "percentage": 16.98, "elapsed_time": "12:29:03", "remaining_time": "2 days, 13:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1636, "total_steps": 9627, "loss": 1.9145, "learning_rate": 9.304200098072709e-05, "epoch": 0.1699387140334476, "percentage": 16.99, "elapsed_time": "12:29:29", "remaining_time": "2 days, 13:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1637, "total_steps": 9627, "loss": 1.7381, "learning_rate": 9.303369558265224e-05, "epoch": 0.17004258855302795, "percentage": 17.0, "elapsed_time": "12:29:56", "remaining_time": "2 days, 13:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1638, "total_steps": 9627, "loss": 1.6391, "learning_rate": 9.30253856018245e-05, "epoch": 0.17014646307260828, "percentage": 17.01, "elapsed_time": "12:30:22", "remaining_time": "2 days, 12:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1639, "total_steps": 9627, "loss": 1.8337, "learning_rate": 9.301707103912878e-05, "epoch": 0.17025033759218863, "percentage": 17.03, "elapsed_time": "12:30:48", "remaining_time": "2 days, 12:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 9627, "loss": 1.9798, "learning_rate": 9.300875189545055e-05, "epoch": 0.170354212111769, "percentage": 17.04, "elapsed_time": "12:31:15", "remaining_time": "2 days, 12:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1641, "total_steps": 9627, "loss": 1.6744, "learning_rate": 9.300042817167574e-05, "epoch": 0.17045808663134934, "percentage": 17.05, "elapsed_time": "12:31:40", "remaining_time": "2 days, 12:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1642, "total_steps": 9627, "loss": 2.0351, "learning_rate": 9.299209986869073e-05, "epoch": 0.17056196115092967, "percentage": 17.06, "elapsed_time": "12:32:07", "remaining_time": "2 days, 12:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1643, "total_steps": 9627, "loss": 1.8298, "learning_rate": 9.298376698738242e-05, "epoch": 0.17066583567051002, "percentage": 17.07, "elapsed_time": "12:32:34", "remaining_time": "2 days, 12:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1644, "total_steps": 9627, "loss": 1.7124, "learning_rate": 9.297542952863824e-05, "epoch": 0.17076971019009038, "percentage": 17.08, "elapsed_time": "12:33:00", "remaining_time": "2 days, 12:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1645, "total_steps": 9627, "loss": 2.0271, "learning_rate": 9.296708749334603e-05, "epoch": 0.1708735847096707, "percentage": 17.09, "elapsed_time": "12:33:26", "remaining_time": "2 days, 12:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1646, "total_steps": 9627, "loss": 1.8808, "learning_rate": 9.295874088239416e-05, "epoch": 0.17097745922925106, "percentage": 17.1, "elapsed_time": "12:33:53", "remaining_time": "2 days, 12:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1647, "total_steps": 9627, "loss": 1.8879, "learning_rate": 9.295038969667145e-05, "epoch": 0.17108133374883142, "percentage": 17.11, "elapsed_time": "12:34:19", "remaining_time": "2 days, 12:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1648, "total_steps": 9627, "loss": 1.644, "learning_rate": 9.29420339370673e-05, "epoch": 0.17118520826841177, "percentage": 17.12, "elapsed_time": "12:34:45", "remaining_time": "2 days, 12:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1649, "total_steps": 9627, "loss": 1.907, "learning_rate": 9.293367360447148e-05, "epoch": 0.1712890827879921, "percentage": 17.13, "elapsed_time": "12:35:11", "remaining_time": "2 days, 12:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 9627, "loss": 1.6838, "learning_rate": 9.292530869977432e-05, "epoch": 0.17139295730757245, "percentage": 17.14, "elapsed_time": "12:35:38", "remaining_time": "2 days, 12:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1651, "total_steps": 9627, "loss": 1.8516, "learning_rate": 9.29169392238666e-05, "epoch": 0.1714968318271528, "percentage": 17.15, "elapsed_time": "12:36:05", "remaining_time": "2 days, 12:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1652, "total_steps": 9627, "loss": 1.8696, "learning_rate": 9.290856517763965e-05, "epoch": 0.17160070634673313, "percentage": 17.16, "elapsed_time": "12:36:30", "remaining_time": "2 days, 12:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1653, "total_steps": 9627, "loss": 1.7186, "learning_rate": 9.290018656198517e-05, "epoch": 0.1717045808663135, "percentage": 17.17, "elapsed_time": "12:36:57", "remaining_time": "2 days, 12:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1654, "total_steps": 9627, "loss": 1.6732, "learning_rate": 9.289180337779547e-05, "epoch": 0.17180845538589384, "percentage": 17.18, "elapsed_time": "12:37:24", "remaining_time": "2 days, 12:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1655, "total_steps": 9627, "loss": 1.6082, "learning_rate": 9.288341562596328e-05, "epoch": 0.1719123299054742, "percentage": 17.19, "elapsed_time": "12:37:50", "remaining_time": "2 days, 12:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1656, "total_steps": 9627, "loss": 1.7092, "learning_rate": 9.287502330738183e-05, "epoch": 0.17201620442505453, "percentage": 17.2, "elapsed_time": "12:38:16", "remaining_time": "2 days, 12:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1657, "total_steps": 9627, "loss": 1.6828, "learning_rate": 9.286662642294484e-05, "epoch": 0.17212007894463488, "percentage": 17.21, "elapsed_time": "12:38:43", "remaining_time": "2 days, 12:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1658, "total_steps": 9627, "loss": 1.7037, "learning_rate": 9.28582249735465e-05, "epoch": 0.17222395346421523, "percentage": 17.22, "elapsed_time": "12:39:10", "remaining_time": "2 days, 12:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1659, "total_steps": 9627, "loss": 1.7627, "learning_rate": 9.284981896008152e-05, "epoch": 0.17232782798379556, "percentage": 17.23, "elapsed_time": "12:39:35", "remaining_time": "2 days, 12:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 9627, "loss": 1.8424, "learning_rate": 9.284140838344505e-05, "epoch": 0.17243170250337592, "percentage": 17.24, "elapsed_time": "12:40:03", "remaining_time": "2 days, 12:47:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1661, "total_steps": 9627, "loss": 1.9412, "learning_rate": 9.283299324453276e-05, "epoch": 0.17253557702295627, "percentage": 17.25, "elapsed_time": "12:40:30", "remaining_time": "2 days, 12:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1662, "total_steps": 9627, "loss": 1.6443, "learning_rate": 9.28245735442408e-05, "epoch": 0.17263945154253663, "percentage": 17.26, "elapsed_time": "12:40:55", "remaining_time": "2 days, 12:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1663, "total_steps": 9627, "loss": 1.9303, "learning_rate": 9.281614928346582e-05, "epoch": 0.17274332606211695, "percentage": 17.27, "elapsed_time": "12:41:21", "remaining_time": "2 days, 12:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1664, "total_steps": 9627, "loss": 1.5823, "learning_rate": 9.280772046310491e-05, "epoch": 0.1728472005816973, "percentage": 17.28, "elapsed_time": "12:41:49", "remaining_time": "2 days, 12:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1665, "total_steps": 9627, "loss": 1.6381, "learning_rate": 9.279928708405568e-05, "epoch": 0.17295107510127766, "percentage": 17.3, "elapsed_time": "12:42:14", "remaining_time": "2 days, 12:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1666, "total_steps": 9627, "loss": 1.686, "learning_rate": 9.279084914721623e-05, "epoch": 0.17305494962085802, "percentage": 17.31, "elapsed_time": "12:42:41", "remaining_time": "2 days, 12:44:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1667, "total_steps": 9627, "loss": 1.8426, "learning_rate": 9.278240665348512e-05, "epoch": 0.17315882414043834, "percentage": 17.32, "elapsed_time": "12:43:08", "remaining_time": "2 days, 12:44:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1668, "total_steps": 9627, "loss": 2.0619, "learning_rate": 9.277395960376143e-05, "epoch": 0.1732626986600187, "percentage": 17.33, "elapsed_time": "12:43:34", "remaining_time": "2 days, 12:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1669, "total_steps": 9627, "loss": 1.7277, "learning_rate": 9.276550799894468e-05, "epoch": 0.17336657317959905, "percentage": 17.34, "elapsed_time": "12:44:00", "remaining_time": "2 days, 12:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 9627, "loss": 1.7649, "learning_rate": 9.275705183993491e-05, "epoch": 0.17347044769917938, "percentage": 17.35, "elapsed_time": "12:44:27", "remaining_time": "2 days, 12:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1671, "total_steps": 9627, "loss": 1.702, "learning_rate": 9.274859112763264e-05, "epoch": 0.17357432221875974, "percentage": 17.36, "elapsed_time": "12:44:53", "remaining_time": "2 days, 12:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1672, "total_steps": 9627, "loss": 1.7485, "learning_rate": 9.274012586293887e-05, "epoch": 0.1736781967383401, "percentage": 17.37, "elapsed_time": "12:45:20", "remaining_time": "2 days, 12:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1673, "total_steps": 9627, "loss": 1.7587, "learning_rate": 9.273165604675509e-05, "epoch": 0.17378207125792045, "percentage": 17.38, "elapsed_time": "12:45:45", "remaining_time": "2 days, 12:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1674, "total_steps": 9627, "loss": 1.7234, "learning_rate": 9.272318167998325e-05, "epoch": 0.17388594577750077, "percentage": 17.39, "elapsed_time": "12:46:12", "remaining_time": "2 days, 12:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1675, "total_steps": 9627, "loss": 1.8682, "learning_rate": 9.27147027635258e-05, "epoch": 0.17398982029708113, "percentage": 17.4, "elapsed_time": "12:46:38", "remaining_time": "2 days, 12:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1676, "total_steps": 9627, "loss": 1.9371, "learning_rate": 9.270621929828571e-05, "epoch": 0.17409369481666148, "percentage": 17.41, "elapsed_time": "12:47:05", "remaining_time": "2 days, 12:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1677, "total_steps": 9627, "loss": 1.8035, "learning_rate": 9.269773128516638e-05, "epoch": 0.1741975693362418, "percentage": 17.42, "elapsed_time": "12:47:31", "remaining_time": "2 days, 12:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1678, "total_steps": 9627, "loss": 1.7536, "learning_rate": 9.268923872507174e-05, "epoch": 0.17430144385582216, "percentage": 17.43, "elapsed_time": "12:47:58", "remaining_time": "2 days, 12:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1679, "total_steps": 9627, "loss": 1.8075, "learning_rate": 9.268074161890614e-05, "epoch": 0.17440531837540252, "percentage": 17.44, "elapsed_time": "12:48:24", "remaining_time": "2 days, 12:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 9627, "loss": 1.8028, "learning_rate": 9.267223996757451e-05, "epoch": 0.17450919289498287, "percentage": 17.45, "elapsed_time": "12:48:51", "remaining_time": "2 days, 12:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1681, "total_steps": 9627, "loss": 1.7143, "learning_rate": 9.266373377198216e-05, "epoch": 0.1746130674145632, "percentage": 17.46, "elapsed_time": "12:49:17", "remaining_time": "2 days, 12:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1682, "total_steps": 9627, "loss": 1.8556, "learning_rate": 9.265522303303494e-05, "epoch": 0.17471694193414355, "percentage": 17.47, "elapsed_time": "12:49:43", "remaining_time": "2 days, 12:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1683, "total_steps": 9627, "loss": 1.6931, "learning_rate": 9.264670775163922e-05, "epoch": 0.1748208164537239, "percentage": 17.48, "elapsed_time": "12:50:10", "remaining_time": "2 days, 12:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1684, "total_steps": 9627, "loss": 1.6403, "learning_rate": 9.263818792870176e-05, "epoch": 0.17492469097330424, "percentage": 17.49, "elapsed_time": "12:50:37", "remaining_time": "2 days, 12:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1685, "total_steps": 9627, "loss": 1.6206, "learning_rate": 9.262966356512987e-05, "epoch": 0.1750285654928846, "percentage": 17.5, "elapsed_time": "12:51:03", "remaining_time": "2 days, 12:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1686, "total_steps": 9627, "loss": 1.6314, "learning_rate": 9.262113466183136e-05, "epoch": 0.17513244001246495, "percentage": 17.51, "elapsed_time": "12:51:30", "remaining_time": "2 days, 12:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1687, "total_steps": 9627, "loss": 1.7696, "learning_rate": 9.261260121971445e-05, "epoch": 0.1752363145320453, "percentage": 17.52, "elapsed_time": "12:51:55", "remaining_time": "2 days, 12:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1688, "total_steps": 9627, "loss": 1.734, "learning_rate": 9.260406323968791e-05, "epoch": 0.17534018905162563, "percentage": 17.53, "elapsed_time": "12:52:22", "remaining_time": "2 days, 12:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1689, "total_steps": 9627, "loss": 1.6301, "learning_rate": 9.259552072266096e-05, "epoch": 0.17544406357120598, "percentage": 17.54, "elapsed_time": "12:52:47", "remaining_time": "2 days, 12:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 9627, "loss": 1.6708, "learning_rate": 9.258697366954329e-05, "epoch": 0.17554793809078634, "percentage": 17.55, "elapsed_time": "12:53:15", "remaining_time": "2 days, 12:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1691, "total_steps": 9627, "loss": 1.7327, "learning_rate": 9.257842208124514e-05, "epoch": 0.17565181261036666, "percentage": 17.57, "elapsed_time": "12:53:41", "remaining_time": "2 days, 12:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1692, "total_steps": 9627, "loss": 1.7489, "learning_rate": 9.256986595867715e-05, "epoch": 0.17575568712994702, "percentage": 17.58, "elapsed_time": "12:54:07", "remaining_time": "2 days, 12:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1693, "total_steps": 9627, "loss": 2.1299, "learning_rate": 9.256130530275048e-05, "epoch": 0.17585956164952737, "percentage": 17.59, "elapsed_time": "12:54:33", "remaining_time": "2 days, 12:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1694, "total_steps": 9627, "loss": 1.8252, "learning_rate": 9.255274011437683e-05, "epoch": 0.17596343616910773, "percentage": 17.6, "elapsed_time": "12:55:00", "remaining_time": "2 days, 12:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1695, "total_steps": 9627, "loss": 1.6666, "learning_rate": 9.254417039446824e-05, "epoch": 0.17606731068868806, "percentage": 17.61, "elapsed_time": "12:55:26", "remaining_time": "2 days, 12:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1696, "total_steps": 9627, "loss": 1.7213, "learning_rate": 9.253559614393739e-05, "epoch": 0.1761711852082684, "percentage": 17.62, "elapsed_time": "12:55:51", "remaining_time": "2 days, 12:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1697, "total_steps": 9627, "loss": 1.8218, "learning_rate": 9.252701736369732e-05, "epoch": 0.17627505972784877, "percentage": 17.63, "elapsed_time": "12:56:19", "remaining_time": "2 days, 12:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1698, "total_steps": 9627, "loss": 1.7478, "learning_rate": 9.251843405466162e-05, "epoch": 0.1763789342474291, "percentage": 17.64, "elapsed_time": "12:56:44", "remaining_time": "2 days, 12:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1699, "total_steps": 9627, "loss": 1.7541, "learning_rate": 9.250984621774437e-05, "epoch": 0.17648280876700945, "percentage": 17.65, "elapsed_time": "12:57:11", "remaining_time": "2 days, 12:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 9627, "loss": 1.6592, "learning_rate": 9.250125385386007e-05, "epoch": 0.1765866832865898, "percentage": 17.66, "elapsed_time": "12:57:37", "remaining_time": "2 days, 12:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1701, "total_steps": 9627, "loss": 1.784, "learning_rate": 9.249265696392377e-05, "epoch": 0.17669055780617016, "percentage": 17.67, "elapsed_time": "12:58:04", "remaining_time": "2 days, 12:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1702, "total_steps": 9627, "loss": 1.7904, "learning_rate": 9.248405554885095e-05, "epoch": 0.17679443232575048, "percentage": 17.68, "elapsed_time": "12:58:30", "remaining_time": "2 days, 12:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1703, "total_steps": 9627, "loss": 1.8846, "learning_rate": 9.24754496095576e-05, "epoch": 0.17689830684533084, "percentage": 17.69, "elapsed_time": "12:58:56", "remaining_time": "2 days, 12:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1704, "total_steps": 9627, "loss": 1.7425, "learning_rate": 9.246683914696019e-05, "epoch": 0.1770021813649112, "percentage": 17.7, "elapsed_time": "12:59:23", "remaining_time": "2 days, 12:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1705, "total_steps": 9627, "loss": 1.8047, "learning_rate": 9.245822416197567e-05, "epoch": 0.17710605588449155, "percentage": 17.71, "elapsed_time": "12:59:49", "remaining_time": "2 days, 12:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1706, "total_steps": 9627, "loss": 1.8033, "learning_rate": 9.244960465552148e-05, "epoch": 0.17720993040407187, "percentage": 17.72, "elapsed_time": "13:00:16", "remaining_time": "2 days, 12:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1707, "total_steps": 9627, "loss": 1.9075, "learning_rate": 9.244098062851549e-05, "epoch": 0.17731380492365223, "percentage": 17.73, "elapsed_time": "13:00:42", "remaining_time": "2 days, 12:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1708, "total_steps": 9627, "loss": 1.8054, "learning_rate": 9.243235208187612e-05, "epoch": 0.17741767944323258, "percentage": 17.74, "elapsed_time": "13:01:09", "remaining_time": "2 days, 12:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1709, "total_steps": 9627, "loss": 1.8205, "learning_rate": 9.242371901652223e-05, "epoch": 0.1775215539628129, "percentage": 17.75, "elapsed_time": "13:01:34", "remaining_time": "2 days, 12:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 9627, "loss": 2.1321, "learning_rate": 9.241508143337319e-05, "epoch": 0.17762542848239327, "percentage": 17.76, "elapsed_time": "13:02:00", "remaining_time": "2 days, 12:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1711, "total_steps": 9627, "loss": 1.6551, "learning_rate": 9.240643933334884e-05, "epoch": 0.17772930300197362, "percentage": 17.77, "elapsed_time": "13:02:27", "remaining_time": "2 days, 12:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1712, "total_steps": 9627, "loss": 1.8644, "learning_rate": 9.239779271736947e-05, "epoch": 0.17783317752155398, "percentage": 17.78, "elapsed_time": "13:02:53", "remaining_time": "2 days, 12:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1713, "total_steps": 9627, "loss": 1.6417, "learning_rate": 9.238914158635589e-05, "epoch": 0.1779370520411343, "percentage": 17.79, "elapsed_time": "13:03:21", "remaining_time": "2 days, 12:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1714, "total_steps": 9627, "loss": 1.7762, "learning_rate": 9.238048594122939e-05, "epoch": 0.17804092656071466, "percentage": 17.8, "elapsed_time": "13:03:46", "remaining_time": "2 days, 12:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1715, "total_steps": 9627, "loss": 1.7897, "learning_rate": 9.237182578291171e-05, "epoch": 0.178144801080295, "percentage": 17.81, "elapsed_time": "13:04:12", "remaining_time": "2 days, 12:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1716, "total_steps": 9627, "loss": 1.8132, "learning_rate": 9.23631611123251e-05, "epoch": 0.17824867559987534, "percentage": 17.82, "elapsed_time": "13:04:40", "remaining_time": "2 days, 12:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1717, "total_steps": 9627, "loss": 1.6795, "learning_rate": 9.235449193039227e-05, "epoch": 0.1783525501194557, "percentage": 17.84, "elapsed_time": "13:05:05", "remaining_time": "2 days, 12:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1718, "total_steps": 9627, "loss": 1.7109, "learning_rate": 9.234581823803645e-05, "epoch": 0.17845642463903605, "percentage": 17.85, "elapsed_time": "13:05:32", "remaining_time": "2 days, 12:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1719, "total_steps": 9627, "loss": 1.8293, "learning_rate": 9.233714003618127e-05, "epoch": 0.1785602991586164, "percentage": 17.86, "elapsed_time": "13:05:59", "remaining_time": "2 days, 12:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 9627, "loss": 1.6718, "learning_rate": 9.232845732575093e-05, "epoch": 0.17866417367819673, "percentage": 17.87, "elapsed_time": "13:06:24", "remaining_time": "2 days, 12:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1721, "total_steps": 9627, "loss": 1.8014, "learning_rate": 9.231977010767005e-05, "epoch": 0.17876804819777709, "percentage": 17.88, "elapsed_time": "13:06:51", "remaining_time": "2 days, 12:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1722, "total_steps": 9627, "loss": 1.6053, "learning_rate": 9.231107838286378e-05, "epoch": 0.17887192271735744, "percentage": 17.89, "elapsed_time": "13:07:17", "remaining_time": "2 days, 12:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1723, "total_steps": 9627, "loss": 1.9612, "learning_rate": 9.230238215225769e-05, "epoch": 0.17897579723693777, "percentage": 17.9, "elapsed_time": "13:07:44", "remaining_time": "2 days, 12:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1724, "total_steps": 9627, "loss": 1.6002, "learning_rate": 9.229368141677788e-05, "epoch": 0.17907967175651812, "percentage": 17.91, "elapsed_time": "13:08:10", "remaining_time": "2 days, 12:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1725, "total_steps": 9627, "loss": 1.7805, "learning_rate": 9.228497617735088e-05, "epoch": 0.17918354627609848, "percentage": 17.92, "elapsed_time": "13:08:37", "remaining_time": "2 days, 12:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1726, "total_steps": 9627, "loss": 1.8624, "learning_rate": 9.227626643490377e-05, "epoch": 0.17928742079567883, "percentage": 17.93, "elapsed_time": "13:09:03", "remaining_time": "2 days, 12:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1727, "total_steps": 9627, "loss": 1.7586, "learning_rate": 9.226755219036405e-05, "epoch": 0.17939129531525916, "percentage": 17.94, "elapsed_time": "13:09:29", "remaining_time": "2 days, 12:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1728, "total_steps": 9627, "loss": 1.6, "learning_rate": 9.225883344465972e-05, "epoch": 0.1794951698348395, "percentage": 17.95, "elapsed_time": "13:09:55", "remaining_time": "2 days, 12:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1729, "total_steps": 9627, "loss": 1.7917, "learning_rate": 9.225011019871927e-05, "epoch": 0.17959904435441987, "percentage": 17.96, "elapsed_time": "13:10:22", "remaining_time": "2 days, 12:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 9627, "loss": 1.7524, "learning_rate": 9.224138245347163e-05, "epoch": 0.1797029188740002, "percentage": 17.97, "elapsed_time": "13:10:48", "remaining_time": "2 days, 12:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1731, "total_steps": 9627, "loss": 1.7125, "learning_rate": 9.223265020984626e-05, "epoch": 0.17980679339358055, "percentage": 17.98, "elapsed_time": "13:11:15", "remaining_time": "2 days, 12:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1732, "total_steps": 9627, "loss": 1.6935, "learning_rate": 9.222391346877308e-05, "epoch": 0.1799106679131609, "percentage": 17.99, "elapsed_time": "13:11:41", "remaining_time": "2 days, 12:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1733, "total_steps": 9627, "loss": 1.7725, "learning_rate": 9.221517223118245e-05, "epoch": 0.18001454243274126, "percentage": 18.0, "elapsed_time": "13:12:07", "remaining_time": "2 days, 12:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1734, "total_steps": 9627, "loss": 1.8192, "learning_rate": 9.22064264980053e-05, "epoch": 0.18011841695232159, "percentage": 18.01, "elapsed_time": "13:12:33", "remaining_time": "2 days, 12:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1735, "total_steps": 9627, "loss": 2.0761, "learning_rate": 9.219767627017293e-05, "epoch": 0.18022229147190194, "percentage": 18.02, "elapsed_time": "13:13:00", "remaining_time": "2 days, 12:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1736, "total_steps": 9627, "loss": 1.978, "learning_rate": 9.218892154861721e-05, "epoch": 0.1803261659914823, "percentage": 18.03, "elapsed_time": "13:13:25", "remaining_time": "2 days, 12:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1737, "total_steps": 9627, "loss": 1.7811, "learning_rate": 9.218016233427042e-05, "epoch": 0.18043004051106262, "percentage": 18.04, "elapsed_time": "13:13:51", "remaining_time": "2 days, 12:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1738, "total_steps": 9627, "loss": 1.9864, "learning_rate": 9.217139862806534e-05, "epoch": 0.18053391503064298, "percentage": 18.05, "elapsed_time": "13:14:19", "remaining_time": "2 days, 12:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1739, "total_steps": 9627, "loss": 1.6712, "learning_rate": 9.21626304309353e-05, "epoch": 0.18063778955022333, "percentage": 18.06, "elapsed_time": "13:14:45", "remaining_time": "2 days, 12:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1740, "total_steps": 9627, "loss": 1.7967, "learning_rate": 9.215385774381395e-05, "epoch": 0.1807416640698037, "percentage": 18.07, "elapsed_time": "13:15:11", "remaining_time": "2 days, 12:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1741, "total_steps": 9627, "loss": 1.8833, "learning_rate": 9.21450805676356e-05, "epoch": 0.18084553858938401, "percentage": 18.08, "elapsed_time": "13:15:37", "remaining_time": "2 days, 12:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1742, "total_steps": 9627, "loss": 1.8027, "learning_rate": 9.213629890333489e-05, "epoch": 0.18094941310896437, "percentage": 18.09, "elapsed_time": "13:16:03", "remaining_time": "2 days, 12:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1743, "total_steps": 9627, "loss": 1.658, "learning_rate": 9.212751275184704e-05, "epoch": 0.18105328762854472, "percentage": 18.11, "elapsed_time": "13:16:30", "remaining_time": "2 days, 12:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1744, "total_steps": 9627, "loss": 1.6251, "learning_rate": 9.211872211410769e-05, "epoch": 0.18115716214812508, "percentage": 18.12, "elapsed_time": "13:16:56", "remaining_time": "2 days, 12:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1745, "total_steps": 9627, "loss": 1.5998, "learning_rate": 9.210992699105296e-05, "epoch": 0.1812610366677054, "percentage": 18.13, "elapsed_time": "13:17:23", "remaining_time": "2 days, 12:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1746, "total_steps": 9627, "loss": 1.8308, "learning_rate": 9.210112738361949e-05, "epoch": 0.18136491118728576, "percentage": 18.14, "elapsed_time": "13:17:49", "remaining_time": "2 days, 12:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1747, "total_steps": 9627, "loss": 1.7902, "learning_rate": 9.209232329274433e-05, "epoch": 0.18146878570686611, "percentage": 18.15, "elapsed_time": "13:18:15", "remaining_time": "2 days, 12:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1748, "total_steps": 9627, "loss": 1.9225, "learning_rate": 9.208351471936509e-05, "epoch": 0.18157266022644644, "percentage": 18.16, "elapsed_time": "13:18:42", "remaining_time": "2 days, 12:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1749, "total_steps": 9627, "loss": 1.7431, "learning_rate": 9.20747016644198e-05, "epoch": 0.1816765347460268, "percentage": 18.17, "elapsed_time": "13:19:08", "remaining_time": "2 days, 11:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 9627, "loss": 1.6417, "learning_rate": 9.206588412884698e-05, "epoch": 0.18178040926560715, "percentage": 18.18, "elapsed_time": "13:19:34", "remaining_time": "2 days, 11:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1751, "total_steps": 9627, "loss": 1.7612, "learning_rate": 9.205706211358563e-05, "epoch": 0.1818842837851875, "percentage": 18.19, "elapsed_time": "13:20:00", "remaining_time": "2 days, 11:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1752, "total_steps": 9627, "loss": 1.6711, "learning_rate": 9.204823561957521e-05, "epoch": 0.18198815830476783, "percentage": 18.2, "elapsed_time": "13:20:27", "remaining_time": "2 days, 11:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1753, "total_steps": 9627, "loss": 1.9513, "learning_rate": 9.203940464775568e-05, "epoch": 0.1820920328243482, "percentage": 18.21, "elapsed_time": "13:20:52", "remaining_time": "2 days, 11:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1754, "total_steps": 9627, "loss": 1.6691, "learning_rate": 9.203056919906748e-05, "epoch": 0.18219590734392854, "percentage": 18.22, "elapsed_time": "13:21:19", "remaining_time": "2 days, 11:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1755, "total_steps": 9627, "loss": 1.6556, "learning_rate": 9.202172927445152e-05, "epoch": 0.18229978186350887, "percentage": 18.23, "elapsed_time": "13:21:45", "remaining_time": "2 days, 11:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1756, "total_steps": 9627, "loss": 1.7761, "learning_rate": 9.201288487484916e-05, "epoch": 0.18240365638308922, "percentage": 18.24, "elapsed_time": "13:22:12", "remaining_time": "2 days, 11:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1757, "total_steps": 9627, "loss": 2.1197, "learning_rate": 9.200403600120229e-05, "epoch": 0.18250753090266958, "percentage": 18.25, "elapsed_time": "13:22:37", "remaining_time": "2 days, 11:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1758, "total_steps": 9627, "loss": 1.9191, "learning_rate": 9.199518265445321e-05, "epoch": 0.18261140542224993, "percentage": 18.26, "elapsed_time": "13:23:03", "remaining_time": "2 days, 11:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1759, "total_steps": 9627, "loss": 1.8001, "learning_rate": 9.198632483554478e-05, "epoch": 0.18271527994183026, "percentage": 18.27, "elapsed_time": "13:23:30", "remaining_time": "2 days, 11:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1760, "total_steps": 9627, "loss": 1.8518, "learning_rate": 9.197746254542025e-05, "epoch": 0.18281915446141062, "percentage": 18.28, "elapsed_time": "13:23:55", "remaining_time": "2 days, 11:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1761, "total_steps": 9627, "loss": 1.952, "learning_rate": 9.196859578502338e-05, "epoch": 0.18292302898099097, "percentage": 18.29, "elapsed_time": "13:24:22", "remaining_time": "2 days, 11:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1762, "total_steps": 9627, "loss": 1.8547, "learning_rate": 9.195972455529844e-05, "epoch": 0.1830269035005713, "percentage": 18.3, "elapsed_time": "13:24:49", "remaining_time": "2 days, 11:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1763, "total_steps": 9627, "loss": 1.9248, "learning_rate": 9.195084885719014e-05, "epoch": 0.18313077802015165, "percentage": 18.31, "elapsed_time": "13:25:15", "remaining_time": "2 days, 11:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1764, "total_steps": 9627, "loss": 1.8411, "learning_rate": 9.194196869164366e-05, "epoch": 0.183234652539732, "percentage": 18.32, "elapsed_time": "13:25:41", "remaining_time": "2 days, 11:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1765, "total_steps": 9627, "loss": 1.6903, "learning_rate": 9.193308405960466e-05, "epoch": 0.18333852705931236, "percentage": 18.33, "elapsed_time": "13:26:07", "remaining_time": "2 days, 11:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1766, "total_steps": 9627, "loss": 1.7171, "learning_rate": 9.192419496201932e-05, "epoch": 0.1834424015788927, "percentage": 18.34, "elapsed_time": "13:26:33", "remaining_time": "2 days, 11:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1767, "total_steps": 9627, "loss": 1.6295, "learning_rate": 9.191530139983423e-05, "epoch": 0.18354627609847304, "percentage": 18.35, "elapsed_time": "13:26:59", "remaining_time": "2 days, 11:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1768, "total_steps": 9627, "loss": 1.5843, "learning_rate": 9.190640337399647e-05, "epoch": 0.1836501506180534, "percentage": 18.37, "elapsed_time": "13:27:26", "remaining_time": "2 days, 11:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1769, "total_steps": 9627, "loss": 1.957, "learning_rate": 9.189750088545367e-05, "epoch": 0.18375402513763373, "percentage": 18.38, "elapsed_time": "13:27:51", "remaining_time": "2 days, 11:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1770, "total_steps": 9627, "loss": 1.9529, "learning_rate": 9.188859393515382e-05, "epoch": 0.18385789965721408, "percentage": 18.39, "elapsed_time": "13:28:17", "remaining_time": "2 days, 11:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1771, "total_steps": 9627, "loss": 1.7235, "learning_rate": 9.187968252404547e-05, "epoch": 0.18396177417679443, "percentage": 18.4, "elapsed_time": "13:28:44", "remaining_time": "2 days, 11:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1772, "total_steps": 9627, "loss": 2.1363, "learning_rate": 9.187076665307758e-05, "epoch": 0.1840656486963748, "percentage": 18.41, "elapsed_time": "13:29:09", "remaining_time": "2 days, 11:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1773, "total_steps": 9627, "loss": 1.7975, "learning_rate": 9.186184632319968e-05, "epoch": 0.18416952321595512, "percentage": 18.42, "elapsed_time": "13:29:36", "remaining_time": "2 days, 11:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1774, "total_steps": 9627, "loss": 1.8601, "learning_rate": 9.185292153536165e-05, "epoch": 0.18427339773553547, "percentage": 18.43, "elapsed_time": "13:30:02", "remaining_time": "2 days, 11:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1775, "total_steps": 9627, "loss": 1.8401, "learning_rate": 9.184399229051397e-05, "epoch": 0.18437727225511583, "percentage": 18.44, "elapsed_time": "13:30:28", "remaining_time": "2 days, 11:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1776, "total_steps": 9627, "loss": 1.7523, "learning_rate": 9.183505858960748e-05, "epoch": 0.18448114677469618, "percentage": 18.45, "elapsed_time": "13:30:55", "remaining_time": "2 days, 11:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1777, "total_steps": 9627, "loss": 1.7327, "learning_rate": 9.18261204335936e-05, "epoch": 0.1845850212942765, "percentage": 18.46, "elapsed_time": "13:31:20", "remaining_time": "2 days, 11:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1778, "total_steps": 9627, "loss": 1.9453, "learning_rate": 9.181717782342414e-05, "epoch": 0.18468889581385686, "percentage": 18.47, "elapsed_time": "13:31:46", "remaining_time": "2 days, 11:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1779, "total_steps": 9627, "loss": 1.5841, "learning_rate": 9.180823076005143e-05, "epoch": 0.18479277033343722, "percentage": 18.48, "elapsed_time": "13:32:13", "remaining_time": "2 days, 11:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1780, "total_steps": 9627, "loss": 1.8535, "learning_rate": 9.179927924442826e-05, "epoch": 0.18489664485301754, "percentage": 18.49, "elapsed_time": "13:32:38", "remaining_time": "2 days, 11:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1781, "total_steps": 9627, "loss": 2.1207, "learning_rate": 9.17903232775079e-05, "epoch": 0.1850005193725979, "percentage": 18.5, "elapsed_time": "13:33:05", "remaining_time": "2 days, 11:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1782, "total_steps": 9627, "loss": 1.9405, "learning_rate": 9.178136286024408e-05, "epoch": 0.18510439389217825, "percentage": 18.51, "elapsed_time": "13:33:30", "remaining_time": "2 days, 11:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1783, "total_steps": 9627, "loss": 1.8607, "learning_rate": 9.177239799359102e-05, "epoch": 0.1852082684117586, "percentage": 18.52, "elapsed_time": "13:33:56", "remaining_time": "2 days, 11:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1784, "total_steps": 9627, "loss": 1.9337, "learning_rate": 9.176342867850343e-05, "epoch": 0.18531214293133894, "percentage": 18.53, "elapsed_time": "13:34:23", "remaining_time": "2 days, 11:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1785, "total_steps": 9627, "loss": 1.8079, "learning_rate": 9.175445491593644e-05, "epoch": 0.1854160174509193, "percentage": 18.54, "elapsed_time": "13:34:49", "remaining_time": "2 days, 11:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1786, "total_steps": 9627, "loss": 1.5856, "learning_rate": 9.174547670684569e-05, "epoch": 0.18551989197049965, "percentage": 18.55, "elapsed_time": "13:35:14", "remaining_time": "2 days, 11:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1787, "total_steps": 9627, "loss": 1.6828, "learning_rate": 9.173649405218732e-05, "epoch": 0.18562376649007997, "percentage": 18.56, "elapsed_time": "13:35:41", "remaining_time": "2 days, 11:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1788, "total_steps": 9627, "loss": 1.5845, "learning_rate": 9.172750695291787e-05, "epoch": 0.18572764100966033, "percentage": 18.57, "elapsed_time": "13:36:07", "remaining_time": "2 days, 11:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1789, "total_steps": 9627, "loss": 1.7407, "learning_rate": 9.171851540999442e-05, "epoch": 0.18583151552924068, "percentage": 18.58, "elapsed_time": "13:36:32", "remaining_time": "2 days, 11:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1790, "total_steps": 9627, "loss": 1.8655, "learning_rate": 9.17095194243745e-05, "epoch": 0.18593539004882104, "percentage": 18.59, "elapsed_time": "13:37:00", "remaining_time": "2 days, 11:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1791, "total_steps": 9627, "loss": 1.7179, "learning_rate": 9.17005189970161e-05, "epoch": 0.18603926456840136, "percentage": 18.6, "elapsed_time": "13:37:25", "remaining_time": "2 days, 11:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1792, "total_steps": 9627, "loss": 1.6426, "learning_rate": 9.169151412887774e-05, "epoch": 0.18614313908798172, "percentage": 18.61, "elapsed_time": "13:37:52", "remaining_time": "2 days, 11:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1793, "total_steps": 9627, "loss": 1.7468, "learning_rate": 9.16825048209183e-05, "epoch": 0.18624701360756207, "percentage": 18.62, "elapsed_time": "13:38:18", "remaining_time": "2 days, 11:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1794, "total_steps": 9627, "loss": 1.5946, "learning_rate": 9.167349107409721e-05, "epoch": 0.1863508881271424, "percentage": 18.64, "elapsed_time": "13:38:44", "remaining_time": "2 days, 11:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1795, "total_steps": 9627, "loss": 1.6169, "learning_rate": 9.166447288937444e-05, "epoch": 0.18645476264672275, "percentage": 18.65, "elapsed_time": "13:39:10", "remaining_time": "2 days, 11:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1796, "total_steps": 9627, "loss": 1.7109, "learning_rate": 9.165545026771026e-05, "epoch": 0.1865586371663031, "percentage": 18.66, "elapsed_time": "13:39:36", "remaining_time": "2 days, 11:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1797, "total_steps": 9627, "loss": 1.7274, "learning_rate": 9.164642321006555e-05, "epoch": 0.18666251168588346, "percentage": 18.67, "elapsed_time": "13:40:02", "remaining_time": "2 days, 11:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1798, "total_steps": 9627, "loss": 1.8982, "learning_rate": 9.163739171740167e-05, "epoch": 0.1867663862054638, "percentage": 18.68, "elapsed_time": "13:40:29", "remaining_time": "2 days, 11:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1799, "total_steps": 9627, "loss": 1.8586, "learning_rate": 9.162835579068032e-05, "epoch": 0.18687026072504415, "percentage": 18.69, "elapsed_time": "13:40:53", "remaining_time": "2 days, 11:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 9627, "loss": 1.8012, "learning_rate": 9.161931543086379e-05, "epoch": 0.1869741352446245, "percentage": 18.7, "elapsed_time": "13:41:21", "remaining_time": "2 days, 11:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1801, "total_steps": 9627, "loss": 1.6804, "learning_rate": 9.161027063891481e-05, "epoch": 0.18707800976420483, "percentage": 18.71, "elapsed_time": "13:41:47", "remaining_time": "2 days, 11:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1802, "total_steps": 9627, "loss": 2.0161, "learning_rate": 9.160122141579659e-05, "epoch": 0.18718188428378518, "percentage": 18.72, "elapsed_time": "13:42:12", "remaining_time": "2 days, 11:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1803, "total_steps": 9627, "loss": 1.7743, "learning_rate": 9.159216776247279e-05, "epoch": 0.18728575880336554, "percentage": 18.73, "elapsed_time": "13:42:40", "remaining_time": "2 days, 11:29:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1804, "total_steps": 9627, "loss": 1.8117, "learning_rate": 9.158310967990755e-05, "epoch": 0.1873896333229459, "percentage": 18.74, "elapsed_time": "13:43:05", "remaining_time": "2 days, 11:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1805, "total_steps": 9627, "loss": 1.8559, "learning_rate": 9.15740471690655e-05, "epoch": 0.18749350784252622, "percentage": 18.75, "elapsed_time": "13:43:32", "remaining_time": "2 days, 11:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1806, "total_steps": 9627, "loss": 1.8888, "learning_rate": 9.156498023091172e-05, "epoch": 0.18759738236210657, "percentage": 18.76, "elapsed_time": "13:43:58", "remaining_time": "2 days, 11:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1807, "total_steps": 9627, "loss": 1.8934, "learning_rate": 9.155590886641174e-05, "epoch": 0.18770125688168693, "percentage": 18.77, "elapsed_time": "13:44:24", "remaining_time": "2 days, 11:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1808, "total_steps": 9627, "loss": 1.8035, "learning_rate": 9.154683307653162e-05, "epoch": 0.18780513140126726, "percentage": 18.78, "elapsed_time": "13:44:50", "remaining_time": "2 days, 11:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1809, "total_steps": 9627, "loss": 1.9612, "learning_rate": 9.153775286223787e-05, "epoch": 0.1879090059208476, "percentage": 18.79, "elapsed_time": "13:45:16", "remaining_time": "2 days, 11:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1810, "total_steps": 9627, "loss": 1.6764, "learning_rate": 9.152866822449743e-05, "epoch": 0.18801288044042797, "percentage": 18.8, "elapsed_time": "13:45:42", "remaining_time": "2 days, 11:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1811, "total_steps": 9627, "loss": 1.7292, "learning_rate": 9.151957916427778e-05, "epoch": 0.18811675496000832, "percentage": 18.81, "elapsed_time": "13:46:08", "remaining_time": "2 days, 11:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1812, "total_steps": 9627, "loss": 1.9939, "learning_rate": 9.151048568254682e-05, "epoch": 0.18822062947958865, "percentage": 18.82, "elapsed_time": "13:46:35", "remaining_time": "2 days, 11:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1813, "total_steps": 9627, "loss": 1.7508, "learning_rate": 9.15013877802729e-05, "epoch": 0.188324503999169, "percentage": 18.83, "elapsed_time": "13:47:00", "remaining_time": "2 days, 11:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1814, "total_steps": 9627, "loss": 1.766, "learning_rate": 9.149228545842492e-05, "epoch": 0.18842837851874936, "percentage": 18.84, "elapsed_time": "13:47:27", "remaining_time": "2 days, 11:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1815, "total_steps": 9627, "loss": 1.8, "learning_rate": 9.148317871797219e-05, "epoch": 0.1885322530383297, "percentage": 18.85, "elapsed_time": "13:47:53", "remaining_time": "2 days, 11:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1816, "total_steps": 9627, "loss": 1.8142, "learning_rate": 9.14740675598845e-05, "epoch": 0.18863612755791004, "percentage": 18.86, "elapsed_time": "13:48:18", "remaining_time": "2 days, 11:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1817, "total_steps": 9627, "loss": 1.9191, "learning_rate": 9.146495198513214e-05, "epoch": 0.1887400020774904, "percentage": 18.87, "elapsed_time": "13:48:46", "remaining_time": "2 days, 11:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1818, "total_steps": 9627, "loss": 1.8575, "learning_rate": 9.145583199468582e-05, "epoch": 0.18884387659707075, "percentage": 18.88, "elapsed_time": "13:49:11", "remaining_time": "2 days, 11:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1819, "total_steps": 9627, "loss": 1.799, "learning_rate": 9.144670758951677e-05, "epoch": 0.18894775111665107, "percentage": 18.89, "elapsed_time": "13:49:37", "remaining_time": "2 days, 11:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1820, "total_steps": 9627, "loss": 1.8317, "learning_rate": 9.143757877059665e-05, "epoch": 0.18905162563623143, "percentage": 18.91, "elapsed_time": "13:50:02", "remaining_time": "2 days, 11:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1821, "total_steps": 9627, "loss": 1.5719, "learning_rate": 9.142844553889762e-05, "epoch": 0.18915550015581178, "percentage": 18.92, "elapsed_time": "13:50:29", "remaining_time": "2 days, 11:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1822, "total_steps": 9627, "loss": 1.7996, "learning_rate": 9.141930789539229e-05, "epoch": 0.18925937467539214, "percentage": 18.93, "elapsed_time": "13:50:55", "remaining_time": "2 days, 11:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1823, "total_steps": 9627, "loss": 1.5699, "learning_rate": 9.141016584105376e-05, "epoch": 0.18936324919497247, "percentage": 18.94, "elapsed_time": "13:51:21", "remaining_time": "2 days, 11:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1824, "total_steps": 9627, "loss": 1.7303, "learning_rate": 9.140101937685558e-05, "epoch": 0.18946712371455282, "percentage": 18.95, "elapsed_time": "13:51:48", "remaining_time": "2 days, 11:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1825, "total_steps": 9627, "loss": 1.7005, "learning_rate": 9.139186850377177e-05, "epoch": 0.18957099823413318, "percentage": 18.96, "elapsed_time": "13:52:14", "remaining_time": "2 days, 11:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1826, "total_steps": 9627, "loss": 1.6708, "learning_rate": 9.138271322277685e-05, "epoch": 0.1896748727537135, "percentage": 18.97, "elapsed_time": "13:52:40", "remaining_time": "2 days, 11:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1827, "total_steps": 9627, "loss": 1.8142, "learning_rate": 9.137355353484573e-05, "epoch": 0.18977874727329386, "percentage": 18.98, "elapsed_time": "13:53:06", "remaining_time": "2 days, 11:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1828, "total_steps": 9627, "loss": 1.741, "learning_rate": 9.136438944095392e-05, "epoch": 0.1898826217928742, "percentage": 18.99, "elapsed_time": "13:53:33", "remaining_time": "2 days, 11:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1829, "total_steps": 9627, "loss": 1.7995, "learning_rate": 9.135522094207729e-05, "epoch": 0.18998649631245457, "percentage": 19.0, "elapsed_time": "13:53:59", "remaining_time": "2 days, 11:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1830, "total_steps": 9627, "loss": 1.5989, "learning_rate": 9.13460480391922e-05, "epoch": 0.1900903708320349, "percentage": 19.01, "elapsed_time": "13:54:24", "remaining_time": "2 days, 11:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1831, "total_steps": 9627, "loss": 1.8601, "learning_rate": 9.13368707332755e-05, "epoch": 0.19019424535161525, "percentage": 19.02, "elapsed_time": "13:54:52", "remaining_time": "2 days, 11:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1832, "total_steps": 9627, "loss": 1.86, "learning_rate": 9.13276890253045e-05, "epoch": 0.1902981198711956, "percentage": 19.03, "elapsed_time": "13:55:17", "remaining_time": "2 days, 11:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1833, "total_steps": 9627, "loss": 1.6658, "learning_rate": 9.131850291625702e-05, "epoch": 0.19040199439077593, "percentage": 19.04, "elapsed_time": "13:55:44", "remaining_time": "2 days, 11:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1834, "total_steps": 9627, "loss": 1.9726, "learning_rate": 9.130931240711126e-05, "epoch": 0.19050586891035629, "percentage": 19.05, "elapsed_time": "13:56:10", "remaining_time": "2 days, 11:13:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1835, "total_steps": 9627, "loss": 1.851, "learning_rate": 9.130011749884595e-05, "epoch": 0.19060974342993664, "percentage": 19.06, "elapsed_time": "13:56:35", "remaining_time": "2 days, 11:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1836, "total_steps": 9627, "loss": 1.8169, "learning_rate": 9.129091819244028e-05, "epoch": 0.190713617949517, "percentage": 19.07, "elapsed_time": "13:57:02", "remaining_time": "2 days, 11:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1837, "total_steps": 9627, "loss": 2.0705, "learning_rate": 9.12817144888739e-05, "epoch": 0.19081749246909732, "percentage": 19.08, "elapsed_time": "13:57:27", "remaining_time": "2 days, 11:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1838, "total_steps": 9627, "loss": 1.7838, "learning_rate": 9.127250638912695e-05, "epoch": 0.19092136698867768, "percentage": 19.09, "elapsed_time": "13:57:54", "remaining_time": "2 days, 11:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1839, "total_steps": 9627, "loss": 1.8239, "learning_rate": 9.126329389418e-05, "epoch": 0.19102524150825803, "percentage": 19.1, "elapsed_time": "13:58:20", "remaining_time": "2 days, 11:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1840, "total_steps": 9627, "loss": 1.6151, "learning_rate": 9.125407700501412e-05, "epoch": 0.19112911602783836, "percentage": 19.11, "elapsed_time": "13:58:46", "remaining_time": "2 days, 11:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1841, "total_steps": 9627, "loss": 1.9243, "learning_rate": 9.124485572261082e-05, "epoch": 0.1912329905474187, "percentage": 19.12, "elapsed_time": "13:59:11", "remaining_time": "2 days, 11:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1842, "total_steps": 9627, "loss": 1.9735, "learning_rate": 9.123563004795213e-05, "epoch": 0.19133686506699907, "percentage": 19.13, "elapsed_time": "13:59:38", "remaining_time": "2 days, 11:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1843, "total_steps": 9627, "loss": 1.8774, "learning_rate": 9.122639998202047e-05, "epoch": 0.19144073958657942, "percentage": 19.14, "elapsed_time": "14:00:04", "remaining_time": "2 days, 11:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1844, "total_steps": 9627, "loss": 1.8337, "learning_rate": 9.12171655257988e-05, "epoch": 0.19154461410615975, "percentage": 19.15, "elapsed_time": "14:00:29", "remaining_time": "2 days, 11:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1845, "total_steps": 9627, "loss": 1.8081, "learning_rate": 9.120792668027049e-05, "epoch": 0.1916484886257401, "percentage": 19.16, "elapsed_time": "14:00:57", "remaining_time": "2 days, 11:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1846, "total_steps": 9627, "loss": 1.8096, "learning_rate": 9.119868344641944e-05, "epoch": 0.19175236314532046, "percentage": 19.18, "elapsed_time": "14:01:22", "remaining_time": "2 days, 11:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1847, "total_steps": 9627, "loss": 1.826, "learning_rate": 9.118943582522996e-05, "epoch": 0.19185623766490079, "percentage": 19.19, "elapsed_time": "14:01:48", "remaining_time": "2 days, 11:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1848, "total_steps": 9627, "loss": 1.6942, "learning_rate": 9.118018381768687e-05, "epoch": 0.19196011218448114, "percentage": 19.2, "elapsed_time": "14:02:15", "remaining_time": "2 days, 11:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1849, "total_steps": 9627, "loss": 1.8741, "learning_rate": 9.11709274247754e-05, "epoch": 0.1920639867040615, "percentage": 19.21, "elapsed_time": "14:02:40", "remaining_time": "2 days, 11:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 9627, "loss": 1.7608, "learning_rate": 9.116166664748131e-05, "epoch": 0.19216786122364185, "percentage": 19.22, "elapsed_time": "14:03:06", "remaining_time": "2 days, 11:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1851, "total_steps": 9627, "loss": 1.715, "learning_rate": 9.11524014867908e-05, "epoch": 0.19227173574322218, "percentage": 19.23, "elapsed_time": "14:03:33", "remaining_time": "2 days, 11:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1852, "total_steps": 9627, "loss": 1.5889, "learning_rate": 9.114313194369053e-05, "epoch": 0.19237561026280253, "percentage": 19.24, "elapsed_time": "14:03:58", "remaining_time": "2 days, 11:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1853, "total_steps": 9627, "loss": 1.6605, "learning_rate": 9.113385801916765e-05, "epoch": 0.1924794847823829, "percentage": 19.25, "elapsed_time": "14:04:25", "remaining_time": "2 days, 11:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1854, "total_steps": 9627, "loss": 1.8351, "learning_rate": 9.112457971420973e-05, "epoch": 0.19258335930196324, "percentage": 19.26, "elapsed_time": "14:04:51", "remaining_time": "2 days, 11:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1855, "total_steps": 9627, "loss": 1.8845, "learning_rate": 9.111529702980486e-05, "epoch": 0.19268723382154357, "percentage": 19.27, "elapsed_time": "14:05:17", "remaining_time": "2 days, 11:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1856, "total_steps": 9627, "loss": 1.8629, "learning_rate": 9.110600996694157e-05, "epoch": 0.19279110834112392, "percentage": 19.28, "elapsed_time": "14:05:43", "remaining_time": "2 days, 11:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1857, "total_steps": 9627, "loss": 1.718, "learning_rate": 9.109671852660885e-05, "epoch": 0.19289498286070428, "percentage": 19.29, "elapsed_time": "14:06:09", "remaining_time": "2 days, 11:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1858, "total_steps": 9627, "loss": 1.6209, "learning_rate": 9.108742270979618e-05, "epoch": 0.1929988573802846, "percentage": 19.3, "elapsed_time": "14:06:35", "remaining_time": "2 days, 10:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1859, "total_steps": 9627, "loss": 1.936, "learning_rate": 9.107812251749349e-05, "epoch": 0.19310273189986496, "percentage": 19.31, "elapsed_time": "14:07:01", "remaining_time": "2 days, 10:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1860, "total_steps": 9627, "loss": 1.8329, "learning_rate": 9.106881795069116e-05, "epoch": 0.19320660641944531, "percentage": 19.32, "elapsed_time": "14:07:27", "remaining_time": "2 days, 10:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1861, "total_steps": 9627, "loss": 1.8072, "learning_rate": 9.105950901038008e-05, "epoch": 0.19331048093902567, "percentage": 19.33, "elapsed_time": "14:07:53", "remaining_time": "2 days, 10:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1862, "total_steps": 9627, "loss": 1.8516, "learning_rate": 9.105019569755157e-05, "epoch": 0.193414355458606, "percentage": 19.34, "elapsed_time": "14:08:19", "remaining_time": "2 days, 10:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1863, "total_steps": 9627, "loss": 1.7609, "learning_rate": 9.104087801319741e-05, "epoch": 0.19351822997818635, "percentage": 19.35, "elapsed_time": "14:08:46", "remaining_time": "2 days, 10:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1864, "total_steps": 9627, "loss": 1.9742, "learning_rate": 9.103155595830988e-05, "epoch": 0.1936221044977667, "percentage": 19.36, "elapsed_time": "14:09:11", "remaining_time": "2 days, 10:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1865, "total_steps": 9627, "loss": 1.71, "learning_rate": 9.10222295338817e-05, "epoch": 0.19372597901734703, "percentage": 19.37, "elapsed_time": "14:09:38", "remaining_time": "2 days, 10:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1866, "total_steps": 9627, "loss": 1.6526, "learning_rate": 9.101289874090605e-05, "epoch": 0.1938298535369274, "percentage": 19.38, "elapsed_time": "14:10:04", "remaining_time": "2 days, 10:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1867, "total_steps": 9627, "loss": 1.787, "learning_rate": 9.10035635803766e-05, "epoch": 0.19393372805650774, "percentage": 19.39, "elapsed_time": "14:10:29", "remaining_time": "2 days, 10:55:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1868, "total_steps": 9627, "loss": 1.6645, "learning_rate": 9.099422405328748e-05, "epoch": 0.1940376025760881, "percentage": 19.4, "elapsed_time": "14:10:56", "remaining_time": "2 days, 10:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1869, "total_steps": 9627, "loss": 1.8264, "learning_rate": 9.098488016063325e-05, "epoch": 0.19414147709566842, "percentage": 19.41, "elapsed_time": "14:11:22", "remaining_time": "2 days, 10:53:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1870, "total_steps": 9627, "loss": 2.0092, "learning_rate": 9.097553190340899e-05, "epoch": 0.19424535161524878, "percentage": 19.42, "elapsed_time": "14:11:49", "remaining_time": "2 days, 10:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1871, "total_steps": 9627, "loss": 1.7522, "learning_rate": 9.09661792826102e-05, "epoch": 0.19434922613482913, "percentage": 19.43, "elapsed_time": "14:12:14", "remaining_time": "2 days, 10:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1872, "total_steps": 9627, "loss": 1.7053, "learning_rate": 9.095682229923287e-05, "epoch": 0.19445310065440946, "percentage": 19.45, "elapsed_time": "14:12:42", "remaining_time": "2 days, 10:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1873, "total_steps": 9627, "loss": 1.7458, "learning_rate": 9.094746095427342e-05, "epoch": 0.19455697517398982, "percentage": 19.46, "elapsed_time": "14:13:07", "remaining_time": "2 days, 10:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1874, "total_steps": 9627, "loss": 1.7563, "learning_rate": 9.09380952487288e-05, "epoch": 0.19466084969357017, "percentage": 19.47, "elapsed_time": "14:13:33", "remaining_time": "2 days, 10:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1875, "total_steps": 9627, "loss": 1.9391, "learning_rate": 9.092872518359637e-05, "epoch": 0.19476472421315053, "percentage": 19.48, "elapsed_time": "14:14:00", "remaining_time": "2 days, 10:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1876, "total_steps": 9627, "loss": 1.7193, "learning_rate": 9.091935075987395e-05, "epoch": 0.19486859873273085, "percentage": 19.49, "elapsed_time": "14:14:26", "remaining_time": "2 days, 10:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1877, "total_steps": 9627, "loss": 1.7996, "learning_rate": 9.090997197855986e-05, "epoch": 0.1949724732523112, "percentage": 19.5, "elapsed_time": "14:14:53", "remaining_time": "2 days, 10:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1878, "total_steps": 9627, "loss": 1.5394, "learning_rate": 9.090058884065287e-05, "epoch": 0.19507634777189156, "percentage": 19.51, "elapsed_time": "14:15:18", "remaining_time": "2 days, 10:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1879, "total_steps": 9627, "loss": 1.8134, "learning_rate": 9.089120134715222e-05, "epoch": 0.1951802222914719, "percentage": 19.52, "elapsed_time": "14:15:45", "remaining_time": "2 days, 10:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1880, "total_steps": 9627, "loss": 1.7417, "learning_rate": 9.088180949905756e-05, "epoch": 0.19528409681105224, "percentage": 19.53, "elapsed_time": "14:16:11", "remaining_time": "2 days, 10:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1881, "total_steps": 9627, "loss": 1.7162, "learning_rate": 9.087241329736909e-05, "epoch": 0.1953879713306326, "percentage": 19.54, "elapsed_time": "14:16:37", "remaining_time": "2 days, 10:47:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1882, "total_steps": 9627, "loss": 1.6961, "learning_rate": 9.086301274308742e-05, "epoch": 0.19549184585021295, "percentage": 19.55, "elapsed_time": "14:17:03", "remaining_time": "2 days, 10:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1883, "total_steps": 9627, "loss": 1.6883, "learning_rate": 9.085360783721363e-05, "epoch": 0.19559572036979328, "percentage": 19.56, "elapsed_time": "14:17:30", "remaining_time": "2 days, 10:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1884, "total_steps": 9627, "loss": 1.756, "learning_rate": 9.084419858074928e-05, "epoch": 0.19569959488937363, "percentage": 19.57, "elapsed_time": "14:17:55", "remaining_time": "2 days, 10:45:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1885, "total_steps": 9627, "loss": 1.5695, "learning_rate": 9.08347849746964e-05, "epoch": 0.195803469408954, "percentage": 19.58, "elapsed_time": "14:18:21", "remaining_time": "2 days, 10:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1886, "total_steps": 9627, "loss": 1.7402, "learning_rate": 9.082536702005741e-05, "epoch": 0.19590734392853434, "percentage": 19.59, "elapsed_time": "14:18:48", "remaining_time": "2 days, 10:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1887, "total_steps": 9627, "loss": 1.6901, "learning_rate": 9.08159447178353e-05, "epoch": 0.19601121844811467, "percentage": 19.6, "elapsed_time": "14:19:14", "remaining_time": "2 days, 10:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1888, "total_steps": 9627, "loss": 1.6679, "learning_rate": 9.080651806903346e-05, "epoch": 0.19611509296769503, "percentage": 19.61, "elapsed_time": "14:19:40", "remaining_time": "2 days, 10:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1889, "total_steps": 9627, "loss": 1.6656, "learning_rate": 9.079708707465575e-05, "epoch": 0.19621896748727538, "percentage": 19.62, "elapsed_time": "14:20:06", "remaining_time": "2 days, 10:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1890, "total_steps": 9627, "loss": 1.6932, "learning_rate": 9.078765173570648e-05, "epoch": 0.1963228420068557, "percentage": 19.63, "elapsed_time": "14:20:32", "remaining_time": "2 days, 10:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1891, "total_steps": 9627, "loss": 1.8927, "learning_rate": 9.077821205319045e-05, "epoch": 0.19642671652643606, "percentage": 19.64, "elapsed_time": "14:20:59", "remaining_time": "2 days, 10:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1892, "total_steps": 9627, "loss": 1.7309, "learning_rate": 9.076876802811293e-05, "epoch": 0.19653059104601642, "percentage": 19.65, "elapsed_time": "14:21:25", "remaining_time": "2 days, 10:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1893, "total_steps": 9627, "loss": 1.8704, "learning_rate": 9.075931966147964e-05, "epoch": 0.19663446556559677, "percentage": 19.66, "elapsed_time": "14:21:51", "remaining_time": "2 days, 10:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1894, "total_steps": 9627, "loss": 1.7995, "learning_rate": 9.074986695429673e-05, "epoch": 0.1967383400851771, "percentage": 19.67, "elapsed_time": "14:22:17", "remaining_time": "2 days, 10:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1895, "total_steps": 9627, "loss": 1.7893, "learning_rate": 9.074040990757085e-05, "epoch": 0.19684221460475745, "percentage": 19.68, "elapsed_time": "14:22:43", "remaining_time": "2 days, 10:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1896, "total_steps": 9627, "loss": 1.8473, "learning_rate": 9.07309485223091e-05, "epoch": 0.1969460891243378, "percentage": 19.69, "elapsed_time": "14:23:09", "remaining_time": "2 days, 10:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1897, "total_steps": 9627, "loss": 1.6973, "learning_rate": 9.072148279951905e-05, "epoch": 0.19704996364391814, "percentage": 19.7, "elapsed_time": "14:23:36", "remaining_time": "2 days, 10:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1898, "total_steps": 9627, "loss": 1.5333, "learning_rate": 9.07120127402087e-05, "epoch": 0.1971538381634985, "percentage": 19.72, "elapsed_time": "14:24:02", "remaining_time": "2 days, 10:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1899, "total_steps": 9627, "loss": 1.7896, "learning_rate": 9.070253834538658e-05, "epoch": 0.19725771268307885, "percentage": 19.73, "elapsed_time": "14:24:28", "remaining_time": "2 days, 10:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 9627, "loss": 1.5792, "learning_rate": 9.069305961606162e-05, "epoch": 0.1973615872026592, "percentage": 19.74, "elapsed_time": "14:24:54", "remaining_time": "2 days, 10:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1901, "total_steps": 9627, "loss": 1.9998, "learning_rate": 9.068357655324322e-05, "epoch": 0.19746546172223953, "percentage": 19.75, "elapsed_time": "14:25:20", "remaining_time": "2 days, 10:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1902, "total_steps": 9627, "loss": 1.6883, "learning_rate": 9.067408915794126e-05, "epoch": 0.19756933624181988, "percentage": 19.76, "elapsed_time": "14:25:46", "remaining_time": "2 days, 10:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1903, "total_steps": 9627, "loss": 1.7639, "learning_rate": 9.066459743116609e-05, "epoch": 0.19767321076140024, "percentage": 19.77, "elapsed_time": "14:26:12", "remaining_time": "2 days, 10:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1904, "total_steps": 9627, "loss": 1.8451, "learning_rate": 9.065510137392848e-05, "epoch": 0.19777708528098056, "percentage": 19.78, "elapsed_time": "14:26:39", "remaining_time": "2 days, 10:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1905, "total_steps": 9627, "loss": 1.7716, "learning_rate": 9.06456009872397e-05, "epoch": 0.19788095980056092, "percentage": 19.79, "elapsed_time": "14:27:05", "remaining_time": "2 days, 10:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1906, "total_steps": 9627, "loss": 1.7665, "learning_rate": 9.063609627211145e-05, "epoch": 0.19798483432014127, "percentage": 19.8, "elapsed_time": "14:27:31", "remaining_time": "2 days, 10:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1907, "total_steps": 9627, "loss": 1.7998, "learning_rate": 9.062658722955593e-05, "epoch": 0.19808870883972163, "percentage": 19.81, "elapsed_time": "14:27:57", "remaining_time": "2 days, 10:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1908, "total_steps": 9627, "loss": 1.7033, "learning_rate": 9.061707386058577e-05, "epoch": 0.19819258335930195, "percentage": 19.82, "elapsed_time": "14:28:23", "remaining_time": "2 days, 10:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1909, "total_steps": 9627, "loss": 1.8304, "learning_rate": 9.060755616621406e-05, "epoch": 0.1982964578788823, "percentage": 19.83, "elapsed_time": "14:28:50", "remaining_time": "2 days, 10:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1910, "total_steps": 9627, "loss": 1.6814, "learning_rate": 9.059803414745438e-05, "epoch": 0.19840033239846266, "percentage": 19.84, "elapsed_time": "14:29:16", "remaining_time": "2 days, 10:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1911, "total_steps": 9627, "loss": 1.8224, "learning_rate": 9.058850780532074e-05, "epoch": 0.198504206918043, "percentage": 19.85, "elapsed_time": "14:29:43", "remaining_time": "2 days, 10:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1912, "total_steps": 9627, "loss": 1.6889, "learning_rate": 9.057897714082761e-05, "epoch": 0.19860808143762335, "percentage": 19.86, "elapsed_time": "14:30:08", "remaining_time": "2 days, 10:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1913, "total_steps": 9627, "loss": 1.5652, "learning_rate": 9.056944215498994e-05, "epoch": 0.1987119559572037, "percentage": 19.87, "elapsed_time": "14:30:35", "remaining_time": "2 days, 10:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1914, "total_steps": 9627, "loss": 1.7888, "learning_rate": 9.055990284882317e-05, "epoch": 0.19881583047678406, "percentage": 19.88, "elapsed_time": "14:31:01", "remaining_time": "2 days, 10:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1915, "total_steps": 9627, "loss": 1.8526, "learning_rate": 9.05503592233431e-05, "epoch": 0.19891970499636438, "percentage": 19.89, "elapsed_time": "14:31:26", "remaining_time": "2 days, 10:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1916, "total_steps": 9627, "loss": 1.7178, "learning_rate": 9.054081127956607e-05, "epoch": 0.19902357951594474, "percentage": 19.9, "elapsed_time": "14:31:53", "remaining_time": "2 days, 10:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1917, "total_steps": 9627, "loss": 1.7645, "learning_rate": 9.053125901850888e-05, "epoch": 0.1991274540355251, "percentage": 19.91, "elapsed_time": "14:32:20", "remaining_time": "2 days, 10:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1918, "total_steps": 9627, "loss": 1.9984, "learning_rate": 9.052170244118876e-05, "epoch": 0.19923132855510542, "percentage": 19.92, "elapsed_time": "14:32:46", "remaining_time": "2 days, 10:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1919, "total_steps": 9627, "loss": 1.7952, "learning_rate": 9.05121415486234e-05, "epoch": 0.19933520307468577, "percentage": 19.93, "elapsed_time": "14:33:12", "remaining_time": "2 days, 10:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1920, "total_steps": 9627, "loss": 1.5986, "learning_rate": 9.050257634183099e-05, "epoch": 0.19943907759426613, "percentage": 19.94, "elapsed_time": "14:33:38", "remaining_time": "2 days, 10:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1921, "total_steps": 9627, "loss": 1.5109, "learning_rate": 9.049300682183012e-05, "epoch": 0.19954295211384648, "percentage": 19.95, "elapsed_time": "14:34:05", "remaining_time": "2 days, 10:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1922, "total_steps": 9627, "loss": 1.8023, "learning_rate": 9.048343298963988e-05, "epoch": 0.1996468266334268, "percentage": 19.96, "elapsed_time": "14:34:30", "remaining_time": "2 days, 10:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1923, "total_steps": 9627, "loss": 1.8454, "learning_rate": 9.047385484627982e-05, "epoch": 0.19975070115300717, "percentage": 19.98, "elapsed_time": "14:34:56", "remaining_time": "2 days, 10:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1924, "total_steps": 9627, "loss": 1.7483, "learning_rate": 9.046427239276991e-05, "epoch": 0.19985457567258752, "percentage": 19.99, "elapsed_time": "14:35:23", "remaining_time": "2 days, 10:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1925, "total_steps": 9627, "loss": 1.6541, "learning_rate": 9.045468563013064e-05, "epoch": 0.19995845019216787, "percentage": 20.0, "elapsed_time": "14:35:50", "remaining_time": "2 days, 10:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1926, "total_steps": 9627, "loss": 1.7776, "learning_rate": 9.04450945593829e-05, "epoch": 0.2000623247117482, "percentage": 20.01, "elapsed_time": "14:36:16", "remaining_time": "2 days, 10:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1927, "total_steps": 9627, "loss": 1.7373, "learning_rate": 9.043549918154808e-05, "epoch": 0.20016619923132856, "percentage": 20.02, "elapsed_time": "14:36:41", "remaining_time": "2 days, 10:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1928, "total_steps": 9627, "loss": 1.7154, "learning_rate": 9.0425899497648e-05, "epoch": 0.2002700737509089, "percentage": 20.03, "elapsed_time": "14:37:08", "remaining_time": "2 days, 10:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1929, "total_steps": 9627, "loss": 1.8059, "learning_rate": 9.041629550870496e-05, "epoch": 0.20037394827048924, "percentage": 20.04, "elapsed_time": "14:37:35", "remaining_time": "2 days, 10:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1930, "total_steps": 9627, "loss": 1.7075, "learning_rate": 9.040668721574171e-05, "epoch": 0.2004778227900696, "percentage": 20.05, "elapsed_time": "14:38:01", "remaining_time": "2 days, 10:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1931, "total_steps": 9627, "loss": 1.5313, "learning_rate": 9.039707461978146e-05, "epoch": 0.20058169730964995, "percentage": 20.06, "elapsed_time": "14:38:27", "remaining_time": "2 days, 10:21:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1932, "total_steps": 9627, "loss": 1.792, "learning_rate": 9.038745772184786e-05, "epoch": 0.2006855718292303, "percentage": 20.07, "elapsed_time": "14:38:53", "remaining_time": "2 days, 10:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1933, "total_steps": 9627, "loss": 1.7264, "learning_rate": 9.037783652296505e-05, "epoch": 0.20078944634881063, "percentage": 20.08, "elapsed_time": "14:39:19", "remaining_time": "2 days, 10:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1934, "total_steps": 9627, "loss": 1.6462, "learning_rate": 9.036821102415762e-05, "epoch": 0.20089332086839098, "percentage": 20.09, "elapsed_time": "14:39:45", "remaining_time": "2 days, 10:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1935, "total_steps": 9627, "loss": 1.8057, "learning_rate": 9.03585812264506e-05, "epoch": 0.20099719538797134, "percentage": 20.1, "elapsed_time": "14:40:12", "remaining_time": "2 days, 10:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1936, "total_steps": 9627, "loss": 1.6832, "learning_rate": 9.034894713086947e-05, "epoch": 0.20110106990755167, "percentage": 20.11, "elapsed_time": "14:40:38", "remaining_time": "2 days, 10:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1937, "total_steps": 9627, "loss": 1.8803, "learning_rate": 9.033930873844023e-05, "epoch": 0.20120494442713202, "percentage": 20.12, "elapsed_time": "14:41:04", "remaining_time": "2 days, 10:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1938, "total_steps": 9627, "loss": 1.8326, "learning_rate": 9.032966605018924e-05, "epoch": 0.20130881894671238, "percentage": 20.13, "elapsed_time": "14:41:30", "remaining_time": "2 days, 10:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1939, "total_steps": 9627, "loss": 1.8654, "learning_rate": 9.032001906714343e-05, "epoch": 0.20141269346629273, "percentage": 20.14, "elapsed_time": "14:41:56", "remaining_time": "2 days, 10:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1940, "total_steps": 9627, "loss": 1.8325, "learning_rate": 9.031036779033006e-05, "epoch": 0.20151656798587306, "percentage": 20.15, "elapsed_time": "14:42:23", "remaining_time": "2 days, 10:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1941, "total_steps": 9627, "loss": 1.5501, "learning_rate": 9.030071222077698e-05, "epoch": 0.2016204425054534, "percentage": 20.16, "elapsed_time": "14:42:48", "remaining_time": "2 days, 10:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1942, "total_steps": 9627, "loss": 1.5961, "learning_rate": 9.02910523595124e-05, "epoch": 0.20172431702503377, "percentage": 20.17, "elapsed_time": "14:43:14", "remaining_time": "2 days, 10:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1943, "total_steps": 9627, "loss": 1.7352, "learning_rate": 9.028138820756504e-05, "epoch": 0.2018281915446141, "percentage": 20.18, "elapsed_time": "14:43:41", "remaining_time": "2 days, 10:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1944, "total_steps": 9627, "loss": 1.7462, "learning_rate": 9.027171976596402e-05, "epoch": 0.20193206606419445, "percentage": 20.19, "elapsed_time": "14:44:07", "remaining_time": "2 days, 10:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1945, "total_steps": 9627, "loss": 1.7317, "learning_rate": 9.026204703573899e-05, "epoch": 0.2020359405837748, "percentage": 20.2, "elapsed_time": "14:44:33", "remaining_time": "2 days, 10:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1946, "total_steps": 9627, "loss": 1.7494, "learning_rate": 9.025237001791999e-05, "epoch": 0.20213981510335516, "percentage": 20.21, "elapsed_time": "14:44:59", "remaining_time": "2 days, 10:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1947, "total_steps": 9627, "loss": 1.6797, "learning_rate": 9.024268871353758e-05, "epoch": 0.20224368962293549, "percentage": 20.22, "elapsed_time": "14:45:25", "remaining_time": "2 days, 10:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1948, "total_steps": 9627, "loss": 1.7813, "learning_rate": 9.023300312362273e-05, "epoch": 0.20234756414251584, "percentage": 20.23, "elapsed_time": "14:45:51", "remaining_time": "2 days, 10:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1949, "total_steps": 9627, "loss": 1.8702, "learning_rate": 9.022331324920687e-05, "epoch": 0.2024514386620962, "percentage": 20.25, "elapsed_time": "14:46:18", "remaining_time": "2 days, 10:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 9627, "loss": 1.7838, "learning_rate": 9.02136190913219e-05, "epoch": 0.20255531318167652, "percentage": 20.26, "elapsed_time": "14:46:43", "remaining_time": "2 days, 10:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1951, "total_steps": 9627, "loss": 1.814, "learning_rate": 9.020392065100018e-05, "epoch": 0.20265918770125688, "percentage": 20.27, "elapsed_time": "14:47:10", "remaining_time": "2 days, 10:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1952, "total_steps": 9627, "loss": 1.7414, "learning_rate": 9.019421792927452e-05, "epoch": 0.20276306222083723, "percentage": 20.28, "elapsed_time": "14:47:36", "remaining_time": "2 days, 10:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1953, "total_steps": 9627, "loss": 1.6376, "learning_rate": 9.018451092717816e-05, "epoch": 0.20286693674041759, "percentage": 20.29, "elapsed_time": "14:48:02", "remaining_time": "2 days, 10:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1954, "total_steps": 9627, "loss": 1.6618, "learning_rate": 9.017479964574485e-05, "epoch": 0.2029708112599979, "percentage": 20.3, "elapsed_time": "14:48:29", "remaining_time": "2 days, 10:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1955, "total_steps": 9627, "loss": 1.6952, "learning_rate": 9.016508408600875e-05, "epoch": 0.20307468577957827, "percentage": 20.31, "elapsed_time": "14:48:54", "remaining_time": "2 days, 10:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1956, "total_steps": 9627, "loss": 1.6792, "learning_rate": 9.015536424900449e-05, "epoch": 0.20317856029915862, "percentage": 20.32, "elapsed_time": "14:49:21", "remaining_time": "2 days, 10:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1957, "total_steps": 9627, "loss": 1.7578, "learning_rate": 9.014564013576716e-05, "epoch": 0.20328243481873895, "percentage": 20.33, "elapsed_time": "14:49:46", "remaining_time": "2 days, 10:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1958, "total_steps": 9627, "loss": 1.8505, "learning_rate": 9.013591174733231e-05, "epoch": 0.2033863093383193, "percentage": 20.34, "elapsed_time": "14:50:13", "remaining_time": "2 days, 10:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1959, "total_steps": 9627, "loss": 1.9007, "learning_rate": 9.012617908473593e-05, "epoch": 0.20349018385789966, "percentage": 20.35, "elapsed_time": "14:50:40", "remaining_time": "2 days, 10:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1960, "total_steps": 9627, "loss": 1.7955, "learning_rate": 9.011644214901447e-05, "epoch": 0.20359405837748001, "percentage": 20.36, "elapsed_time": "14:51:05", "remaining_time": "2 days, 10:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1961, "total_steps": 9627, "loss": 1.8637, "learning_rate": 9.010670094120485e-05, "epoch": 0.20369793289706034, "percentage": 20.37, "elapsed_time": "14:51:32", "remaining_time": "2 days, 10:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1962, "total_steps": 9627, "loss": 1.7001, "learning_rate": 9.009695546234443e-05, "epoch": 0.2038018074166407, "percentage": 20.38, "elapsed_time": "14:51:58", "remaining_time": "2 days, 10:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1963, "total_steps": 9627, "loss": 1.6479, "learning_rate": 9.0087205713471e-05, "epoch": 0.20390568193622105, "percentage": 20.39, "elapsed_time": "14:52:23", "remaining_time": "2 days, 10:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1964, "total_steps": 9627, "loss": 1.7622, "learning_rate": 9.007745169562285e-05, "epoch": 0.2040095564558014, "percentage": 20.4, "elapsed_time": "14:52:49", "remaining_time": "2 days, 10:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1965, "total_steps": 9627, "loss": 1.9061, "learning_rate": 9.006769340983873e-05, "epoch": 0.20411343097538173, "percentage": 20.41, "elapsed_time": "14:53:16", "remaining_time": "2 days, 10:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1966, "total_steps": 9627, "loss": 1.823, "learning_rate": 9.00579308571578e-05, "epoch": 0.2042173054949621, "percentage": 20.42, "elapsed_time": "14:53:41", "remaining_time": "2 days, 10:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1967, "total_steps": 9627, "loss": 1.9272, "learning_rate": 9.004816403861969e-05, "epoch": 0.20432118001454244, "percentage": 20.43, "elapsed_time": "14:54:08", "remaining_time": "2 days, 10:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1968, "total_steps": 9627, "loss": 1.7746, "learning_rate": 9.00383929552645e-05, "epoch": 0.20442505453412277, "percentage": 20.44, "elapsed_time": "14:54:34", "remaining_time": "2 days, 10:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1969, "total_steps": 9627, "loss": 1.7197, "learning_rate": 9.002861760813278e-05, "epoch": 0.20452892905370312, "percentage": 20.45, "elapsed_time": "14:55:00", "remaining_time": "2 days, 10:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1970, "total_steps": 9627, "loss": 1.7175, "learning_rate": 9.001883799826551e-05, "epoch": 0.20463280357328348, "percentage": 20.46, "elapsed_time": "14:55:26", "remaining_time": "2 days, 10:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1971, "total_steps": 9627, "loss": 1.7624, "learning_rate": 9.000905412670415e-05, "epoch": 0.20473667809286383, "percentage": 20.47, "elapsed_time": "14:55:53", "remaining_time": "2 days, 9:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1972, "total_steps": 9627, "loss": 1.7201, "learning_rate": 8.999926599449062e-05, "epoch": 0.20484055261244416, "percentage": 20.48, "elapsed_time": "14:56:19", "remaining_time": "2 days, 9:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1973, "total_steps": 9627, "loss": 1.8462, "learning_rate": 8.998947360266726e-05, "epoch": 0.20494442713202451, "percentage": 20.49, "elapsed_time": "14:56:45", "remaining_time": "2 days, 9:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1974, "total_steps": 9627, "loss": 1.7983, "learning_rate": 8.99796769522769e-05, "epoch": 0.20504830165160487, "percentage": 20.5, "elapsed_time": "14:57:11", "remaining_time": "2 days, 9:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1975, "total_steps": 9627, "loss": 2.0234, "learning_rate": 8.996987604436279e-05, "epoch": 0.2051521761711852, "percentage": 20.52, "elapsed_time": "14:57:37", "remaining_time": "2 days, 9:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1976, "total_steps": 9627, "loss": 1.7771, "learning_rate": 8.996007087996866e-05, "epoch": 0.20525605069076555, "percentage": 20.53, "elapsed_time": "14:58:03", "remaining_time": "2 days, 9:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1977, "total_steps": 9627, "loss": 1.6017, "learning_rate": 8.995026146013867e-05, "epoch": 0.2053599252103459, "percentage": 20.54, "elapsed_time": "14:58:29", "remaining_time": "2 days, 9:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1978, "total_steps": 9627, "loss": 1.7722, "learning_rate": 8.994044778591749e-05, "epoch": 0.20546379972992626, "percentage": 20.55, "elapsed_time": "14:58:55", "remaining_time": "2 days, 9:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1979, "total_steps": 9627, "loss": 1.4704, "learning_rate": 8.993062985835013e-05, "epoch": 0.2055676742495066, "percentage": 20.56, "elapsed_time": "14:59:22", "remaining_time": "2 days, 9:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1980, "total_steps": 9627, "loss": 1.6708, "learning_rate": 8.99208076784822e-05, "epoch": 0.20567154876908694, "percentage": 20.57, "elapsed_time": "14:59:47", "remaining_time": "2 days, 9:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1981, "total_steps": 9627, "loss": 1.7259, "learning_rate": 8.991098124735961e-05, "epoch": 0.2057754232886673, "percentage": 20.58, "elapsed_time": "15:00:14", "remaining_time": "2 days, 9:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1982, "total_steps": 9627, "loss": 1.8153, "learning_rate": 8.990115056602885e-05, "epoch": 0.20587929780824762, "percentage": 20.59, "elapsed_time": "15:00:40", "remaining_time": "2 days, 9:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1983, "total_steps": 9627, "loss": 1.7063, "learning_rate": 8.989131563553679e-05, "epoch": 0.20598317232782798, "percentage": 20.6, "elapsed_time": "15:01:06", "remaining_time": "2 days, 9:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1984, "total_steps": 9627, "loss": 1.8642, "learning_rate": 8.98814764569308e-05, "epoch": 0.20608704684740833, "percentage": 20.61, "elapsed_time": "15:01:33", "remaining_time": "2 days, 9:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1985, "total_steps": 9627, "loss": 1.6623, "learning_rate": 8.987163303125863e-05, "epoch": 0.2061909213669887, "percentage": 20.62, "elapsed_time": "15:01:59", "remaining_time": "2 days, 9:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1986, "total_steps": 9627, "loss": 1.7477, "learning_rate": 8.986178535956856e-05, "epoch": 0.20629479588656902, "percentage": 20.63, "elapsed_time": "15:02:25", "remaining_time": "2 days, 9:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1987, "total_steps": 9627, "loss": 1.901, "learning_rate": 8.985193344290929e-05, "epoch": 0.20639867040614937, "percentage": 20.64, "elapsed_time": "15:02:51", "remaining_time": "2 days, 9:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1988, "total_steps": 9627, "loss": 1.7853, "learning_rate": 8.984207728232995e-05, "epoch": 0.20650254492572973, "percentage": 20.65, "elapsed_time": "15:03:18", "remaining_time": "2 days, 9:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1989, "total_steps": 9627, "loss": 1.8616, "learning_rate": 8.983221687888017e-05, "epoch": 0.20660641944531005, "percentage": 20.66, "elapsed_time": "15:03:44", "remaining_time": "2 days, 9:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1990, "total_steps": 9627, "loss": 1.7691, "learning_rate": 8.982235223360999e-05, "epoch": 0.2067102939648904, "percentage": 20.67, "elapsed_time": "15:04:11", "remaining_time": "2 days, 9:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1991, "total_steps": 9627, "loss": 1.8013, "learning_rate": 8.981248334756994e-05, "epoch": 0.20681416848447076, "percentage": 20.68, "elapsed_time": "15:04:36", "remaining_time": "2 days, 9:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1992, "total_steps": 9627, "loss": 1.624, "learning_rate": 8.980261022181095e-05, "epoch": 0.20691804300405112, "percentage": 20.69, "elapsed_time": "15:05:03", "remaining_time": "2 days, 9:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1993, "total_steps": 9627, "loss": 1.6776, "learning_rate": 8.979273285738445e-05, "epoch": 0.20702191752363144, "percentage": 20.7, "elapsed_time": "15:05:28", "remaining_time": "2 days, 9:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1994, "total_steps": 9627, "loss": 1.5715, "learning_rate": 8.978285125534229e-05, "epoch": 0.2071257920432118, "percentage": 20.71, "elapsed_time": "15:05:55", "remaining_time": "2 days, 9:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1995, "total_steps": 9627, "loss": 1.781, "learning_rate": 8.977296541673678e-05, "epoch": 0.20722966656279215, "percentage": 20.72, "elapsed_time": "15:06:21", "remaining_time": "2 days, 9:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1996, "total_steps": 9627, "loss": 1.8291, "learning_rate": 8.976307534262072e-05, "epoch": 0.2073335410823725, "percentage": 20.73, "elapsed_time": "15:06:47", "remaining_time": "2 days, 9:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1997, "total_steps": 9627, "loss": 1.9573, "learning_rate": 8.975318103404728e-05, "epoch": 0.20743741560195283, "percentage": 20.74, "elapsed_time": "15:07:14", "remaining_time": "2 days, 9:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1998, "total_steps": 9627, "loss": 1.7654, "learning_rate": 8.974328249207015e-05, "epoch": 0.2075412901215332, "percentage": 20.75, "elapsed_time": "15:07:40", "remaining_time": "2 days, 9:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1999, "total_steps": 9627, "loss": 1.7762, "learning_rate": 8.973337971774344e-05, "epoch": 0.20764516464111354, "percentage": 20.76, "elapsed_time": "15:08:06", "remaining_time": "2 days, 9:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 9627, "loss": 1.7563, "learning_rate": 8.972347271212173e-05, "epoch": 0.20774903916069387, "percentage": 20.77, "elapsed_time": "15:08:32", "remaining_time": "2 days, 9:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2001, "total_steps": 9627, "loss": 1.6374, "learning_rate": 8.971356147626004e-05, "epoch": 0.20785291368027423, "percentage": 20.79, "elapsed_time": "15:08:59", "remaining_time": "2 days, 9:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2002, "total_steps": 9627, "loss": 1.7564, "learning_rate": 8.970364601121382e-05, "epoch": 0.20795678819985458, "percentage": 20.8, "elapsed_time": "15:09:25", "remaining_time": "2 days, 9:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2003, "total_steps": 9627, "loss": 1.7618, "learning_rate": 8.9693726318039e-05, "epoch": 0.20806066271943494, "percentage": 20.81, "elapsed_time": "15:09:51", "remaining_time": "2 days, 9:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2004, "total_steps": 9627, "loss": 1.6911, "learning_rate": 8.968380239779194e-05, "epoch": 0.20816453723901526, "percentage": 20.82, "elapsed_time": "15:10:18", "remaining_time": "2 days, 9:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2005, "total_steps": 9627, "loss": 1.7087, "learning_rate": 8.96738742515295e-05, "epoch": 0.20826841175859562, "percentage": 20.83, "elapsed_time": "15:10:44", "remaining_time": "2 days, 9:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2006, "total_steps": 9627, "loss": 1.698, "learning_rate": 8.96639418803089e-05, "epoch": 0.20837228627817597, "percentage": 20.84, "elapsed_time": "15:11:09", "remaining_time": "2 days, 9:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2007, "total_steps": 9627, "loss": 1.7733, "learning_rate": 8.965400528518787e-05, "epoch": 0.2084761607977563, "percentage": 20.85, "elapsed_time": "15:11:36", "remaining_time": "2 days, 9:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2008, "total_steps": 9627, "loss": 1.7092, "learning_rate": 8.964406446722459e-05, "epoch": 0.20858003531733665, "percentage": 20.86, "elapsed_time": "15:12:02", "remaining_time": "2 days, 9:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2009, "total_steps": 9627, "loss": 1.6285, "learning_rate": 8.96341194274777e-05, "epoch": 0.208683909836917, "percentage": 20.87, "elapsed_time": "15:12:27", "remaining_time": "2 days, 9:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2010, "total_steps": 9627, "loss": 1.7449, "learning_rate": 8.962417016700624e-05, "epoch": 0.20878778435649736, "percentage": 20.88, "elapsed_time": "15:12:53", "remaining_time": "2 days, 9:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2011, "total_steps": 9627, "loss": 1.7459, "learning_rate": 8.961421668686974e-05, "epoch": 0.2088916588760777, "percentage": 20.89, "elapsed_time": "15:13:20", "remaining_time": "2 days, 9:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2012, "total_steps": 9627, "loss": 1.7329, "learning_rate": 8.960425898812816e-05, "epoch": 0.20899553339565805, "percentage": 20.9, "elapsed_time": "15:13:45", "remaining_time": "2 days, 9:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2013, "total_steps": 9627, "loss": 1.7992, "learning_rate": 8.959429707184192e-05, "epoch": 0.2090994079152384, "percentage": 20.91, "elapsed_time": "15:14:12", "remaining_time": "2 days, 9:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2014, "total_steps": 9627, "loss": 2.0488, "learning_rate": 8.95843309390719e-05, "epoch": 0.20920328243481873, "percentage": 20.92, "elapsed_time": "15:14:38", "remaining_time": "2 days, 9:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2015, "total_steps": 9627, "loss": 1.796, "learning_rate": 8.95743605908794e-05, "epoch": 0.20930715695439908, "percentage": 20.93, "elapsed_time": "15:15:04", "remaining_time": "2 days, 9:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2016, "total_steps": 9627, "loss": 1.8641, "learning_rate": 8.956438602832619e-05, "epoch": 0.20941103147397944, "percentage": 20.94, "elapsed_time": "15:15:30", "remaining_time": "2 days, 9:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2017, "total_steps": 9627, "loss": 1.7898, "learning_rate": 8.955440725247448e-05, "epoch": 0.2095149059935598, "percentage": 20.95, "elapsed_time": "15:15:56", "remaining_time": "2 days, 9:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2018, "total_steps": 9627, "loss": 1.738, "learning_rate": 8.954442426438694e-05, "epoch": 0.20961878051314012, "percentage": 20.96, "elapsed_time": "15:16:23", "remaining_time": "2 days, 9:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2019, "total_steps": 9627, "loss": 1.8819, "learning_rate": 8.953443706512667e-05, "epoch": 0.20972265503272047, "percentage": 20.97, "elapsed_time": "15:16:48", "remaining_time": "2 days, 9:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2020, "total_steps": 9627, "loss": 1.7886, "learning_rate": 8.952444565575723e-05, "epoch": 0.20982652955230083, "percentage": 20.98, "elapsed_time": "15:17:14", "remaining_time": "2 days, 9:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2021, "total_steps": 9627, "loss": 1.7872, "learning_rate": 8.951445003734263e-05, "epoch": 0.20993040407188115, "percentage": 20.99, "elapsed_time": "15:17:41", "remaining_time": "2 days, 9:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2022, "total_steps": 9627, "loss": 1.6917, "learning_rate": 8.950445021094733e-05, "epoch": 0.2100342785914615, "percentage": 21.0, "elapsed_time": "15:18:07", "remaining_time": "2 days, 9:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2023, "total_steps": 9627, "loss": 1.7487, "learning_rate": 8.949444617763623e-05, "epoch": 0.21013815311104186, "percentage": 21.01, "elapsed_time": "15:18:32", "remaining_time": "2 days, 9:32:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2024, "total_steps": 9627, "loss": 1.8752, "learning_rate": 8.948443793847467e-05, "epoch": 0.21024202763062222, "percentage": 21.02, "elapsed_time": "15:19:00", "remaining_time": "2 days, 9:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2025, "total_steps": 9627, "loss": 1.7619, "learning_rate": 8.947442549452846e-05, "epoch": 0.21034590215020255, "percentage": 21.03, "elapsed_time": "15:19:26", "remaining_time": "2 days, 9:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2026, "total_steps": 9627, "loss": 1.5852, "learning_rate": 8.946440884686387e-05, "epoch": 0.2104497766697829, "percentage": 21.04, "elapsed_time": "15:19:51", "remaining_time": "2 days, 9:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2027, "total_steps": 9627, "loss": 1.8503, "learning_rate": 8.945438799654756e-05, "epoch": 0.21055365118936326, "percentage": 21.06, "elapsed_time": "15:20:17", "remaining_time": "2 days, 9:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2028, "total_steps": 9627, "loss": 1.6764, "learning_rate": 8.944436294464669e-05, "epoch": 0.21065752570894358, "percentage": 21.07, "elapsed_time": "15:20:44", "remaining_time": "2 days, 9:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2029, "total_steps": 9627, "loss": 1.6127, "learning_rate": 8.943433369222882e-05, "epoch": 0.21076140022852394, "percentage": 21.08, "elapsed_time": "15:21:09", "remaining_time": "2 days, 9:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2030, "total_steps": 9627, "loss": 1.7161, "learning_rate": 8.942430024036203e-05, "epoch": 0.2108652747481043, "percentage": 21.09, "elapsed_time": "15:21:36", "remaining_time": "2 days, 9:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2031, "total_steps": 9627, "loss": 1.8648, "learning_rate": 8.941426259011478e-05, "epoch": 0.21096914926768465, "percentage": 21.1, "elapsed_time": "15:22:02", "remaining_time": "2 days, 9:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2032, "total_steps": 9627, "loss": 1.7433, "learning_rate": 8.940422074255602e-05, "epoch": 0.21107302378726497, "percentage": 21.11, "elapsed_time": "15:22:29", "remaining_time": "2 days, 9:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2033, "total_steps": 9627, "loss": 1.778, "learning_rate": 8.93941746987551e-05, "epoch": 0.21117689830684533, "percentage": 21.12, "elapsed_time": "15:22:54", "remaining_time": "2 days, 9:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2034, "total_steps": 9627, "loss": 1.7633, "learning_rate": 8.938412445978186e-05, "epoch": 0.21128077282642568, "percentage": 21.13, "elapsed_time": "15:23:20", "remaining_time": "2 days, 9:26:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2035, "total_steps": 9627, "loss": 1.6726, "learning_rate": 8.937407002670659e-05, "epoch": 0.21138464734600604, "percentage": 21.14, "elapsed_time": "15:23:46", "remaining_time": "2 days, 9:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2036, "total_steps": 9627, "loss": 1.7913, "learning_rate": 8.936401140059998e-05, "epoch": 0.21148852186558637, "percentage": 21.15, "elapsed_time": "15:24:13", "remaining_time": "2 days, 9:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2037, "total_steps": 9627, "loss": 1.7161, "learning_rate": 8.935394858253321e-05, "epoch": 0.21159239638516672, "percentage": 21.16, "elapsed_time": "15:24:38", "remaining_time": "2 days, 9:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2038, "total_steps": 9627, "loss": 1.9097, "learning_rate": 8.934388157357788e-05, "epoch": 0.21169627090474707, "percentage": 21.17, "elapsed_time": "15:25:05", "remaining_time": "2 days, 9:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2039, "total_steps": 9627, "loss": 1.9521, "learning_rate": 8.933381037480606e-05, "epoch": 0.2118001454243274, "percentage": 21.18, "elapsed_time": "15:25:30", "remaining_time": "2 days, 9:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2040, "total_steps": 9627, "loss": 1.7008, "learning_rate": 8.932373498729025e-05, "epoch": 0.21190401994390776, "percentage": 21.19, "elapsed_time": "15:25:56", "remaining_time": "2 days, 9:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2041, "total_steps": 9627, "loss": 1.8255, "learning_rate": 8.931365541210342e-05, "epoch": 0.2120078944634881, "percentage": 21.2, "elapsed_time": "15:26:21", "remaining_time": "2 days, 9:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2042, "total_steps": 9627, "loss": 1.9377, "learning_rate": 8.930357165031893e-05, "epoch": 0.21211176898306847, "percentage": 21.21, "elapsed_time": "15:26:48", "remaining_time": "2 days, 9:22:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2043, "total_steps": 9627, "loss": 1.8809, "learning_rate": 8.929348370301063e-05, "epoch": 0.2122156435026488, "percentage": 21.22, "elapsed_time": "15:27:14", "remaining_time": "2 days, 9:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2044, "total_steps": 9627, "loss": 1.7093, "learning_rate": 8.928339157125283e-05, "epoch": 0.21231951802222915, "percentage": 21.23, "elapsed_time": "15:27:39", "remaining_time": "2 days, 9:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2045, "total_steps": 9627, "loss": 1.7248, "learning_rate": 8.927329525612025e-05, "epoch": 0.2124233925418095, "percentage": 21.24, "elapsed_time": "15:28:06", "remaining_time": "2 days, 9:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2046, "total_steps": 9627, "loss": 1.6424, "learning_rate": 8.926319475868807e-05, "epoch": 0.21252726706138983, "percentage": 21.25, "elapsed_time": "15:28:31", "remaining_time": "2 days, 9:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2047, "total_steps": 9627, "loss": 1.6919, "learning_rate": 8.925309008003192e-05, "epoch": 0.21263114158097018, "percentage": 21.26, "elapsed_time": "15:28:58", "remaining_time": "2 days, 9:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2048, "total_steps": 9627, "loss": 1.8568, "learning_rate": 8.924298122122783e-05, "epoch": 0.21273501610055054, "percentage": 21.27, "elapsed_time": "15:29:23", "remaining_time": "2 days, 9:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2049, "total_steps": 9627, "loss": 1.8214, "learning_rate": 8.923286818335237e-05, "epoch": 0.2128388906201309, "percentage": 21.28, "elapsed_time": "15:29:50", "remaining_time": "2 days, 9:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 9627, "loss": 2.1206, "learning_rate": 8.922275096748247e-05, "epoch": 0.21294276513971122, "percentage": 21.29, "elapsed_time": "15:30:15", "remaining_time": "2 days, 9:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2051, "total_steps": 9627, "loss": 1.8579, "learning_rate": 8.921262957469554e-05, "epoch": 0.21304663965929158, "percentage": 21.3, "elapsed_time": "15:30:42", "remaining_time": "2 days, 9:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2052, "total_steps": 9627, "loss": 1.7962, "learning_rate": 8.920250400606944e-05, "epoch": 0.21315051417887193, "percentage": 21.32, "elapsed_time": "15:31:07", "remaining_time": "2 days, 9:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2053, "total_steps": 9627, "loss": 1.6304, "learning_rate": 8.919237426268246e-05, "epoch": 0.21325438869845226, "percentage": 21.33, "elapsed_time": "15:31:33", "remaining_time": "2 days, 9:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2054, "total_steps": 9627, "loss": 1.9758, "learning_rate": 8.918224034561333e-05, "epoch": 0.2133582632180326, "percentage": 21.34, "elapsed_time": "15:31:59", "remaining_time": "2 days, 9:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2055, "total_steps": 9627, "loss": 1.7476, "learning_rate": 8.917210225594122e-05, "epoch": 0.21346213773761297, "percentage": 21.35, "elapsed_time": "15:32:26", "remaining_time": "2 days, 9:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2056, "total_steps": 9627, "loss": 1.7741, "learning_rate": 8.916195999474579e-05, "epoch": 0.21356601225719332, "percentage": 21.36, "elapsed_time": "15:32:51", "remaining_time": "2 days, 9:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2057, "total_steps": 9627, "loss": 1.7451, "learning_rate": 8.915181356310709e-05, "epoch": 0.21366988677677365, "percentage": 21.37, "elapsed_time": "15:33:18", "remaining_time": "2 days, 9:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2058, "total_steps": 9627, "loss": 1.9665, "learning_rate": 8.914166296210564e-05, "epoch": 0.213773761296354, "percentage": 21.38, "elapsed_time": "15:33:43", "remaining_time": "2 days, 9:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2059, "total_steps": 9627, "loss": 1.6796, "learning_rate": 8.913150819282242e-05, "epoch": 0.21387763581593436, "percentage": 21.39, "elapsed_time": "15:34:10", "remaining_time": "2 days, 9:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2060, "total_steps": 9627, "loss": 1.7107, "learning_rate": 8.912134925633878e-05, "epoch": 0.21398151033551469, "percentage": 21.4, "elapsed_time": "15:34:35", "remaining_time": "2 days, 9:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2061, "total_steps": 9627, "loss": 1.6896, "learning_rate": 8.911118615373661e-05, "epoch": 0.21408538485509504, "percentage": 21.41, "elapsed_time": "15:35:02", "remaining_time": "2 days, 9:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2062, "total_steps": 9627, "loss": 1.8049, "learning_rate": 8.910101888609821e-05, "epoch": 0.2141892593746754, "percentage": 21.42, "elapsed_time": "15:35:28", "remaining_time": "2 days, 9:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2063, "total_steps": 9627, "loss": 1.7652, "learning_rate": 8.909084745450628e-05, "epoch": 0.21429313389425575, "percentage": 21.43, "elapsed_time": "15:35:54", "remaining_time": "2 days, 9:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2064, "total_steps": 9627, "loss": 1.701, "learning_rate": 8.908067186004405e-05, "epoch": 0.21439700841383608, "percentage": 21.44, "elapsed_time": "15:36:20", "remaining_time": "2 days, 9:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2065, "total_steps": 9627, "loss": 1.781, "learning_rate": 8.907049210379508e-05, "epoch": 0.21450088293341643, "percentage": 21.45, "elapsed_time": "15:36:45", "remaining_time": "2 days, 9:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2066, "total_steps": 9627, "loss": 1.6878, "learning_rate": 8.906030818684348e-05, "epoch": 0.21460475745299679, "percentage": 21.46, "elapsed_time": "15:37:12", "remaining_time": "2 days, 9:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2067, "total_steps": 9627, "loss": 1.6964, "learning_rate": 8.905012011027372e-05, "epoch": 0.2147086319725771, "percentage": 21.47, "elapsed_time": "15:37:37", "remaining_time": "2 days, 9:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2068, "total_steps": 9627, "loss": 1.2466, "learning_rate": 8.903992787517078e-05, "epoch": 0.21481250649215747, "percentage": 21.48, "elapsed_time": "15:38:04", "remaining_time": "2 days, 9:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2069, "total_steps": 9627, "loss": 1.7607, "learning_rate": 8.902973148262004e-05, "epoch": 0.21491638101173782, "percentage": 21.49, "elapsed_time": "15:38:29", "remaining_time": "2 days, 9:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2070, "total_steps": 9627, "loss": 1.8514, "learning_rate": 8.901953093370734e-05, "epoch": 0.21502025553131818, "percentage": 21.5, "elapsed_time": "15:38:55", "remaining_time": "2 days, 9:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2071, "total_steps": 9627, "loss": 1.5947, "learning_rate": 8.900932622951897e-05, "epoch": 0.2151241300508985, "percentage": 21.51, "elapsed_time": "15:39:21", "remaining_time": "2 days, 9:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2072, "total_steps": 9627, "loss": 1.7449, "learning_rate": 8.899911737114163e-05, "epoch": 0.21522800457047886, "percentage": 21.52, "elapsed_time": "15:39:47", "remaining_time": "2 days, 9:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2073, "total_steps": 9627, "loss": 1.7266, "learning_rate": 8.898890435966251e-05, "epoch": 0.21533187909005921, "percentage": 21.53, "elapsed_time": "15:40:14", "remaining_time": "2 days, 9:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2074, "total_steps": 9627, "loss": 1.8562, "learning_rate": 8.897868719616919e-05, "epoch": 0.21543575360963957, "percentage": 21.54, "elapsed_time": "15:40:39", "remaining_time": "2 days, 9:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2075, "total_steps": 9627, "loss": 1.8528, "learning_rate": 8.896846588174973e-05, "epoch": 0.2155396281292199, "percentage": 21.55, "elapsed_time": "15:41:05", "remaining_time": "2 days, 9:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2076, "total_steps": 9627, "loss": 1.6268, "learning_rate": 8.89582404174926e-05, "epoch": 0.21564350264880025, "percentage": 21.56, "elapsed_time": "15:41:31", "remaining_time": "2 days, 9:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2077, "total_steps": 9627, "loss": 1.7256, "learning_rate": 8.89480108044868e-05, "epoch": 0.2157473771683806, "percentage": 21.57, "elapsed_time": "15:41:57", "remaining_time": "2 days, 9:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2078, "total_steps": 9627, "loss": 1.7654, "learning_rate": 8.893777704382163e-05, "epoch": 0.21585125168796093, "percentage": 21.59, "elapsed_time": "15:42:23", "remaining_time": "2 days, 9:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2079, "total_steps": 9627, "loss": 1.5765, "learning_rate": 8.892753913658691e-05, "epoch": 0.2159551262075413, "percentage": 21.6, "elapsed_time": "15:42:49", "remaining_time": "2 days, 9:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2080, "total_steps": 9627, "loss": 1.7399, "learning_rate": 8.891729708387294e-05, "epoch": 0.21605900072712164, "percentage": 21.61, "elapsed_time": "15:43:14", "remaining_time": "2 days, 9:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2081, "total_steps": 9627, "loss": 1.8868, "learning_rate": 8.890705088677039e-05, "epoch": 0.216162875246702, "percentage": 21.62, "elapsed_time": "15:43:41", "remaining_time": "2 days, 9:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2082, "total_steps": 9627, "loss": 1.907, "learning_rate": 8.889680054637042e-05, "epoch": 0.21626674976628232, "percentage": 21.63, "elapsed_time": "15:44:07", "remaining_time": "2 days, 9:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2083, "total_steps": 9627, "loss": 1.9046, "learning_rate": 8.888654606376459e-05, "epoch": 0.21637062428586268, "percentage": 21.64, "elapsed_time": "15:44:32", "remaining_time": "2 days, 9:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2084, "total_steps": 9627, "loss": 1.7253, "learning_rate": 8.887628744004493e-05, "epoch": 0.21647449880544303, "percentage": 21.65, "elapsed_time": "15:44:59", "remaining_time": "2 days, 9:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2085, "total_steps": 9627, "loss": 1.7522, "learning_rate": 8.88660246763039e-05, "epoch": 0.21657837332502336, "percentage": 21.66, "elapsed_time": "15:45:24", "remaining_time": "2 days, 8:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2086, "total_steps": 9627, "loss": 1.7231, "learning_rate": 8.885575777363442e-05, "epoch": 0.21668224784460371, "percentage": 21.67, "elapsed_time": "15:45:51", "remaining_time": "2 days, 8:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2087, "total_steps": 9627, "loss": 1.6142, "learning_rate": 8.884548673312981e-05, "epoch": 0.21678612236418407, "percentage": 21.68, "elapsed_time": "15:46:16", "remaining_time": "2 days, 8:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2088, "total_steps": 9627, "loss": 1.8635, "learning_rate": 8.883521155588388e-05, "epoch": 0.21688999688376442, "percentage": 21.69, "elapsed_time": "15:46:43", "remaining_time": "2 days, 8:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2089, "total_steps": 9627, "loss": 1.6453, "learning_rate": 8.882493224299084e-05, "epoch": 0.21699387140334475, "percentage": 21.7, "elapsed_time": "15:47:08", "remaining_time": "2 days, 8:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2090, "total_steps": 9627, "loss": 1.821, "learning_rate": 8.881464879554536e-05, "epoch": 0.2170977459229251, "percentage": 21.71, "elapsed_time": "15:47:35", "remaining_time": "2 days, 8:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2091, "total_steps": 9627, "loss": 1.8536, "learning_rate": 8.880436121464255e-05, "epoch": 0.21720162044250546, "percentage": 21.72, "elapsed_time": "15:48:00", "remaining_time": "2 days, 8:56:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2092, "total_steps": 9627, "loss": 1.7896, "learning_rate": 8.879406950137796e-05, "epoch": 0.2173054949620858, "percentage": 21.73, "elapsed_time": "15:48:26", "remaining_time": "2 days, 8:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2093, "total_steps": 9627, "loss": 1.7763, "learning_rate": 8.878377365684758e-05, "epoch": 0.21740936948166614, "percentage": 21.74, "elapsed_time": "15:48:52", "remaining_time": "2 days, 8:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2094, "total_steps": 9627, "loss": 1.7594, "learning_rate": 8.877347368214783e-05, "epoch": 0.2175132440012465, "percentage": 21.75, "elapsed_time": "15:49:18", "remaining_time": "2 days, 8:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2095, "total_steps": 9627, "loss": 1.9007, "learning_rate": 8.876316957837556e-05, "epoch": 0.21761711852082685, "percentage": 21.76, "elapsed_time": "15:49:44", "remaining_time": "2 days, 8:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2096, "total_steps": 9627, "loss": 1.6164, "learning_rate": 8.87528613466281e-05, "epoch": 0.21772099304040718, "percentage": 21.77, "elapsed_time": "15:50:10", "remaining_time": "2 days, 8:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2097, "total_steps": 9627, "loss": 1.626, "learning_rate": 8.874254898800321e-05, "epoch": 0.21782486755998753, "percentage": 21.78, "elapsed_time": "15:50:36", "remaining_time": "2 days, 8:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2098, "total_steps": 9627, "loss": 1.8004, "learning_rate": 8.873223250359903e-05, "epoch": 0.2179287420795679, "percentage": 21.79, "elapsed_time": "15:51:02", "remaining_time": "2 days, 8:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2099, "total_steps": 9627, "loss": 1.7169, "learning_rate": 8.872191189451422e-05, "epoch": 0.21803261659914822, "percentage": 21.8, "elapsed_time": "15:51:28", "remaining_time": "2 days, 8:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 9627, "loss": 1.6472, "learning_rate": 8.871158716184784e-05, "epoch": 0.21813649111872857, "percentage": 21.81, "elapsed_time": "15:51:54", "remaining_time": "2 days, 8:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2101, "total_steps": 9627, "loss": 1.6177, "learning_rate": 8.87012583066994e-05, "epoch": 0.21824036563830893, "percentage": 21.82, "elapsed_time": "15:52:20", "remaining_time": "2 days, 8:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2102, "total_steps": 9627, "loss": 1.6924, "learning_rate": 8.869092533016882e-05, "epoch": 0.21834424015788928, "percentage": 21.83, "elapsed_time": "15:52:46", "remaining_time": "2 days, 8:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2103, "total_steps": 9627, "loss": 1.8299, "learning_rate": 8.86805882333565e-05, "epoch": 0.2184481146774696, "percentage": 21.84, "elapsed_time": "15:53:12", "remaining_time": "2 days, 8:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2104, "total_steps": 9627, "loss": 1.8411, "learning_rate": 8.867024701736325e-05, "epoch": 0.21855198919704996, "percentage": 21.86, "elapsed_time": "15:53:37", "remaining_time": "2 days, 8:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2105, "total_steps": 9627, "loss": 1.6618, "learning_rate": 8.865990168329031e-05, "epoch": 0.21865586371663032, "percentage": 21.87, "elapsed_time": "15:54:04", "remaining_time": "2 days, 8:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2106, "total_steps": 9627, "loss": 1.8495, "learning_rate": 8.864955223223943e-05, "epoch": 0.21875973823621067, "percentage": 21.88, "elapsed_time": "15:54:29", "remaining_time": "2 days, 8:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2107, "total_steps": 9627, "loss": 1.7565, "learning_rate": 8.863919866531269e-05, "epoch": 0.218863612755791, "percentage": 21.89, "elapsed_time": "15:54:56", "remaining_time": "2 days, 8:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2108, "total_steps": 9627, "loss": 1.7943, "learning_rate": 8.862884098361271e-05, "epoch": 0.21896748727537135, "percentage": 21.9, "elapsed_time": "15:55:22", "remaining_time": "2 days, 8:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2109, "total_steps": 9627, "loss": 1.5722, "learning_rate": 8.861847918824248e-05, "epoch": 0.2190713617949517, "percentage": 21.91, "elapsed_time": "15:55:48", "remaining_time": "2 days, 8:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2110, "total_steps": 9627, "loss": 1.8011, "learning_rate": 8.860811328030545e-05, "epoch": 0.21917523631453203, "percentage": 21.92, "elapsed_time": "15:56:14", "remaining_time": "2 days, 8:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2111, "total_steps": 9627, "loss": 1.7692, "learning_rate": 8.85977432609055e-05, "epoch": 0.2192791108341124, "percentage": 21.93, "elapsed_time": "15:56:40", "remaining_time": "2 days, 8:46:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2112, "total_steps": 9627, "loss": 1.6858, "learning_rate": 8.858736913114698e-05, "epoch": 0.21938298535369274, "percentage": 21.94, "elapsed_time": "15:57:05", "remaining_time": "2 days, 8:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2113, "total_steps": 9627, "loss": 1.5681, "learning_rate": 8.857699089213462e-05, "epoch": 0.2194868598732731, "percentage": 21.95, "elapsed_time": "15:57:32", "remaining_time": "2 days, 8:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2114, "total_steps": 9627, "loss": 1.7354, "learning_rate": 8.856660854497367e-05, "epoch": 0.21959073439285343, "percentage": 21.96, "elapsed_time": "15:57:58", "remaining_time": "2 days, 8:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2115, "total_steps": 9627, "loss": 1.6739, "learning_rate": 8.855622209076972e-05, "epoch": 0.21969460891243378, "percentage": 21.97, "elapsed_time": "15:58:24", "remaining_time": "2 days, 8:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2116, "total_steps": 9627, "loss": 2.0526, "learning_rate": 8.854583153062887e-05, "epoch": 0.21979848343201414, "percentage": 21.98, "elapsed_time": "15:58:50", "remaining_time": "2 days, 8:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2117, "total_steps": 9627, "loss": 1.8204, "learning_rate": 8.853543686565765e-05, "epoch": 0.21990235795159446, "percentage": 21.99, "elapsed_time": "15:59:15", "remaining_time": "2 days, 8:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2118, "total_steps": 9627, "loss": 1.7236, "learning_rate": 8.852503809696297e-05, "epoch": 0.22000623247117482, "percentage": 22.0, "elapsed_time": "15:59:42", "remaining_time": "2 days, 8:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2119, "total_steps": 9627, "loss": 1.7896, "learning_rate": 8.851463522565226e-05, "epoch": 0.22011010699075517, "percentage": 22.01, "elapsed_time": "16:00:07", "remaining_time": "2 days, 8:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2120, "total_steps": 9627, "loss": 1.8652, "learning_rate": 8.85042282528333e-05, "epoch": 0.22021398151033553, "percentage": 22.02, "elapsed_time": "16:00:34", "remaining_time": "2 days, 8:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2121, "total_steps": 9627, "loss": 1.8323, "learning_rate": 8.84938171796144e-05, "epoch": 0.22031785602991585, "percentage": 22.03, "elapsed_time": "16:00:59", "remaining_time": "2 days, 8:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2122, "total_steps": 9627, "loss": 1.6752, "learning_rate": 8.848340200710421e-05, "epoch": 0.2204217305494962, "percentage": 22.04, "elapsed_time": "16:01:25", "remaining_time": "2 days, 8:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2123, "total_steps": 9627, "loss": 1.8893, "learning_rate": 8.847298273641192e-05, "epoch": 0.22052560506907656, "percentage": 22.05, "elapsed_time": "16:01:52", "remaining_time": "2 days, 8:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2124, "total_steps": 9627, "loss": 1.6729, "learning_rate": 8.846255936864703e-05, "epoch": 0.2206294795886569, "percentage": 22.06, "elapsed_time": "16:02:16", "remaining_time": "2 days, 8:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2125, "total_steps": 9627, "loss": 1.6048, "learning_rate": 8.845213190491962e-05, "epoch": 0.22073335410823725, "percentage": 22.07, "elapsed_time": "16:02:43", "remaining_time": "2 days, 8:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2126, "total_steps": 9627, "loss": 1.9401, "learning_rate": 8.844170034634007e-05, "epoch": 0.2208372286278176, "percentage": 22.08, "elapsed_time": "16:03:09", "remaining_time": "2 days, 8:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2127, "total_steps": 9627, "loss": 1.9608, "learning_rate": 8.843126469401931e-05, "epoch": 0.22094110314739795, "percentage": 22.09, "elapsed_time": "16:03:35", "remaining_time": "2 days, 8:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2128, "total_steps": 9627, "loss": 1.7066, "learning_rate": 8.842082494906863e-05, "epoch": 0.22104497766697828, "percentage": 22.1, "elapsed_time": "16:04:01", "remaining_time": "2 days, 8:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2129, "total_steps": 9627, "loss": 1.8553, "learning_rate": 8.841038111259979e-05, "epoch": 0.22114885218655864, "percentage": 22.11, "elapsed_time": "16:04:27", "remaining_time": "2 days, 8:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2130, "total_steps": 9627, "loss": 1.6992, "learning_rate": 8.839993318572497e-05, "epoch": 0.221252726706139, "percentage": 22.13, "elapsed_time": "16:04:53", "remaining_time": "2 days, 8:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2131, "total_steps": 9627, "loss": 1.9582, "learning_rate": 8.83894811695568e-05, "epoch": 0.22135660122571932, "percentage": 22.14, "elapsed_time": "16:05:19", "remaining_time": "2 days, 8:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2132, "total_steps": 9627, "loss": 1.7399, "learning_rate": 8.837902506520835e-05, "epoch": 0.22146047574529967, "percentage": 22.15, "elapsed_time": "16:05:45", "remaining_time": "2 days, 8:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2133, "total_steps": 9627, "loss": 1.6818, "learning_rate": 8.836856487379306e-05, "epoch": 0.22156435026488003, "percentage": 22.16, "elapsed_time": "16:06:10", "remaining_time": "2 days, 8:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2134, "total_steps": 9627, "loss": 1.6495, "learning_rate": 8.835810059642493e-05, "epoch": 0.22166822478446038, "percentage": 22.17, "elapsed_time": "16:06:36", "remaining_time": "2 days, 8:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2135, "total_steps": 9627, "loss": 1.7112, "learning_rate": 8.834763223421828e-05, "epoch": 0.2217720993040407, "percentage": 22.18, "elapsed_time": "16:07:03", "remaining_time": "2 days, 8:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2136, "total_steps": 9627, "loss": 1.713, "learning_rate": 8.833715978828793e-05, "epoch": 0.22187597382362106, "percentage": 22.19, "elapsed_time": "16:07:28", "remaining_time": "2 days, 8:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2137, "total_steps": 9627, "loss": 1.6994, "learning_rate": 8.83266832597491e-05, "epoch": 0.22197984834320142, "percentage": 22.2, "elapsed_time": "16:07:54", "remaining_time": "2 days, 8:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2138, "total_steps": 9627, "loss": 1.6051, "learning_rate": 8.831620264971745e-05, "epoch": 0.22208372286278175, "percentage": 22.21, "elapsed_time": "16:08:19", "remaining_time": "2 days, 8:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2139, "total_steps": 9627, "loss": 1.678, "learning_rate": 8.830571795930911e-05, "epoch": 0.2221875973823621, "percentage": 22.22, "elapsed_time": "16:08:45", "remaining_time": "2 days, 8:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2140, "total_steps": 9627, "loss": 1.6881, "learning_rate": 8.829522918964058e-05, "epoch": 0.22229147190194246, "percentage": 22.23, "elapsed_time": "16:09:12", "remaining_time": "2 days, 8:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2141, "total_steps": 9627, "loss": 1.8456, "learning_rate": 8.828473634182888e-05, "epoch": 0.2223953464215228, "percentage": 22.24, "elapsed_time": "16:09:37", "remaining_time": "2 days, 8:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2142, "total_steps": 9627, "loss": 1.8562, "learning_rate": 8.827423941699137e-05, "epoch": 0.22249922094110314, "percentage": 22.25, "elapsed_time": "16:10:03", "remaining_time": "2 days, 8:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2143, "total_steps": 9627, "loss": 1.7444, "learning_rate": 8.826373841624593e-05, "epoch": 0.2226030954606835, "percentage": 22.26, "elapsed_time": "16:10:29", "remaining_time": "2 days, 8:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2144, "total_steps": 9627, "loss": 1.7901, "learning_rate": 8.825323334071083e-05, "epoch": 0.22270696998026385, "percentage": 22.27, "elapsed_time": "16:10:56", "remaining_time": "2 days, 8:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2145, "total_steps": 9627, "loss": 1.7461, "learning_rate": 8.824272419150475e-05, "epoch": 0.2228108444998442, "percentage": 22.28, "elapsed_time": "16:11:21", "remaining_time": "2 days, 8:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2146, "total_steps": 9627, "loss": 1.782, "learning_rate": 8.823221096974684e-05, "epoch": 0.22291471901942453, "percentage": 22.29, "elapsed_time": "16:11:47", "remaining_time": "2 days, 8:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2147, "total_steps": 9627, "loss": 1.803, "learning_rate": 8.822169367655669e-05, "epoch": 0.22301859353900488, "percentage": 22.3, "elapsed_time": "16:12:13", "remaining_time": "2 days, 8:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2148, "total_steps": 9627, "loss": 1.8741, "learning_rate": 8.821117231305431e-05, "epoch": 0.22312246805858524, "percentage": 22.31, "elapsed_time": "16:12:39", "remaining_time": "2 days, 8:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2149, "total_steps": 9627, "loss": 1.7279, "learning_rate": 8.820064688036014e-05, "epoch": 0.22322634257816557, "percentage": 22.32, "elapsed_time": "16:13:04", "remaining_time": "2 days, 8:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 9627, "loss": 1.8127, "learning_rate": 8.819011737959504e-05, "epoch": 0.22333021709774592, "percentage": 22.33, "elapsed_time": "16:13:29", "remaining_time": "2 days, 8:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2151, "total_steps": 9627, "loss": 1.7985, "learning_rate": 8.817958381188033e-05, "epoch": 0.22343409161732627, "percentage": 22.34, "elapsed_time": "16:13:56", "remaining_time": "2 days, 8:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2152, "total_steps": 9627, "loss": 1.7096, "learning_rate": 8.816904617833778e-05, "epoch": 0.22353796613690663, "percentage": 22.35, "elapsed_time": "16:14:22", "remaining_time": "2 days, 8:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2153, "total_steps": 9627, "loss": 1.7936, "learning_rate": 8.815850448008953e-05, "epoch": 0.22364184065648696, "percentage": 22.36, "elapsed_time": "16:14:47", "remaining_time": "2 days, 8:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2154, "total_steps": 9627, "loss": 1.7445, "learning_rate": 8.81479587182582e-05, "epoch": 0.2237457151760673, "percentage": 22.37, "elapsed_time": "16:15:13", "remaining_time": "2 days, 8:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2155, "total_steps": 9627, "loss": 1.8105, "learning_rate": 8.813740889396682e-05, "epoch": 0.22384958969564767, "percentage": 22.38, "elapsed_time": "16:15:39", "remaining_time": "2 days, 8:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2156, "total_steps": 9627, "loss": 1.7913, "learning_rate": 8.81268550083389e-05, "epoch": 0.223953464215228, "percentage": 22.4, "elapsed_time": "16:16:04", "remaining_time": "2 days, 8:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2157, "total_steps": 9627, "loss": 1.805, "learning_rate": 8.81162970624983e-05, "epoch": 0.22405733873480835, "percentage": 22.41, "elapsed_time": "16:16:31", "remaining_time": "2 days, 8:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2158, "total_steps": 9627, "loss": 1.6997, "learning_rate": 8.81057350575694e-05, "epoch": 0.2241612132543887, "percentage": 22.42, "elapsed_time": "16:16:56", "remaining_time": "2 days, 8:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2159, "total_steps": 9627, "loss": 1.5612, "learning_rate": 8.809516899467694e-05, "epoch": 0.22426508777396906, "percentage": 22.43, "elapsed_time": "16:17:22", "remaining_time": "2 days, 8:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2160, "total_steps": 9627, "loss": 1.6928, "learning_rate": 8.808459887494615e-05, "epoch": 0.22436896229354938, "percentage": 22.44, "elapsed_time": "16:17:47", "remaining_time": "2 days, 8:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2161, "total_steps": 9627, "loss": 1.7605, "learning_rate": 8.807402469950263e-05, "epoch": 0.22447283681312974, "percentage": 22.45, "elapsed_time": "16:18:14", "remaining_time": "2 days, 8:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2162, "total_steps": 9627, "loss": 1.7773, "learning_rate": 8.806344646947249e-05, "epoch": 0.2245767113327101, "percentage": 22.46, "elapsed_time": "16:18:39", "remaining_time": "2 days, 8:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2163, "total_steps": 9627, "loss": 1.8473, "learning_rate": 8.80528641859822e-05, "epoch": 0.22468058585229042, "percentage": 22.47, "elapsed_time": "16:19:04", "remaining_time": "2 days, 8:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2164, "total_steps": 9627, "loss": 1.686, "learning_rate": 8.804227785015869e-05, "epoch": 0.22478446037187078, "percentage": 22.48, "elapsed_time": "16:19:31", "remaining_time": "2 days, 8:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2165, "total_steps": 9627, "loss": 1.7894, "learning_rate": 8.803168746312934e-05, "epoch": 0.22488833489145113, "percentage": 22.49, "elapsed_time": "16:19:56", "remaining_time": "2 days, 8:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2166, "total_steps": 9627, "loss": 1.8895, "learning_rate": 8.802109302602193e-05, "epoch": 0.22499220941103149, "percentage": 22.5, "elapsed_time": "16:20:21", "remaining_time": "2 days, 8:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2167, "total_steps": 9627, "loss": 2.0375, "learning_rate": 8.801049453996468e-05, "epoch": 0.2250960839306118, "percentage": 22.51, "elapsed_time": "16:20:49", "remaining_time": "2 days, 8:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2168, "total_steps": 9627, "loss": 1.6489, "learning_rate": 8.799989200608627e-05, "epoch": 0.22519995845019217, "percentage": 22.52, "elapsed_time": "16:21:14", "remaining_time": "2 days, 8:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2169, "total_steps": 9627, "loss": 1.8188, "learning_rate": 8.798928542551576e-05, "epoch": 0.22530383296977252, "percentage": 22.53, "elapsed_time": "16:21:40", "remaining_time": "2 days, 8:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2170, "total_steps": 9627, "loss": 1.9716, "learning_rate": 8.797867479938269e-05, "epoch": 0.22540770748935285, "percentage": 22.54, "elapsed_time": "16:22:05", "remaining_time": "2 days, 8:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2171, "total_steps": 9627, "loss": 1.857, "learning_rate": 8.796806012881699e-05, "epoch": 0.2255115820089332, "percentage": 22.55, "elapsed_time": "16:22:32", "remaining_time": "2 days, 8:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2172, "total_steps": 9627, "loss": 1.6663, "learning_rate": 8.795744141494905e-05, "epoch": 0.22561545652851356, "percentage": 22.56, "elapsed_time": "16:22:57", "remaining_time": "2 days, 8:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2173, "total_steps": 9627, "loss": 1.7631, "learning_rate": 8.794681865890968e-05, "epoch": 0.2257193310480939, "percentage": 22.57, "elapsed_time": "16:23:23", "remaining_time": "2 days, 8:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2174, "total_steps": 9627, "loss": 1.8269, "learning_rate": 8.793619186183011e-05, "epoch": 0.22582320556767424, "percentage": 22.58, "elapsed_time": "16:23:49", "remaining_time": "2 days, 8:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2175, "total_steps": 9627, "loss": 1.6963, "learning_rate": 8.792556102484204e-05, "epoch": 0.2259270800872546, "percentage": 22.59, "elapsed_time": "16:24:14", "remaining_time": "2 days, 8:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2176, "total_steps": 9627, "loss": 1.6336, "learning_rate": 8.791492614907754e-05, "epoch": 0.22603095460683495, "percentage": 22.6, "elapsed_time": "16:24:41", "remaining_time": "2 days, 8:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2177, "total_steps": 9627, "loss": 1.8569, "learning_rate": 8.790428723566915e-05, "epoch": 0.22613482912641528, "percentage": 22.61, "elapsed_time": "16:25:06", "remaining_time": "2 days, 8:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2178, "total_steps": 9627, "loss": 1.7161, "learning_rate": 8.789364428574984e-05, "epoch": 0.22623870364599563, "percentage": 22.62, "elapsed_time": "16:25:31", "remaining_time": "2 days, 8:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2179, "total_steps": 9627, "loss": 1.8211, "learning_rate": 8.788299730045299e-05, "epoch": 0.22634257816557599, "percentage": 22.63, "elapsed_time": "16:25:57", "remaining_time": "2 days, 8:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2180, "total_steps": 9627, "loss": 1.7704, "learning_rate": 8.787234628091243e-05, "epoch": 0.22644645268515634, "percentage": 22.64, "elapsed_time": "16:26:24", "remaining_time": "2 days, 8:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2181, "total_steps": 9627, "loss": 1.7376, "learning_rate": 8.786169122826242e-05, "epoch": 0.22655032720473667, "percentage": 22.66, "elapsed_time": "16:26:50", "remaining_time": "2 days, 8:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2182, "total_steps": 9627, "loss": 1.6503, "learning_rate": 8.785103214363761e-05, "epoch": 0.22665420172431702, "percentage": 22.67, "elapsed_time": "16:27:16", "remaining_time": "2 days, 8:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2183, "total_steps": 9627, "loss": 1.7421, "learning_rate": 8.784036902817312e-05, "epoch": 0.22675807624389738, "percentage": 22.68, "elapsed_time": "16:27:41", "remaining_time": "2 days, 8:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2184, "total_steps": 9627, "loss": 1.7828, "learning_rate": 8.78297018830045e-05, "epoch": 0.22686195076347773, "percentage": 22.69, "elapsed_time": "16:28:07", "remaining_time": "2 days, 8:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2185, "total_steps": 9627, "loss": 1.7687, "learning_rate": 8.781903070926774e-05, "epoch": 0.22696582528305806, "percentage": 22.7, "elapsed_time": "16:28:33", "remaining_time": "2 days, 8:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2186, "total_steps": 9627, "loss": 1.7469, "learning_rate": 8.780835550809918e-05, "epoch": 0.22706969980263841, "percentage": 22.71, "elapsed_time": "16:28:59", "remaining_time": "2 days, 8:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2187, "total_steps": 9627, "loss": 1.5268, "learning_rate": 8.779767628063567e-05, "epoch": 0.22717357432221877, "percentage": 22.72, "elapsed_time": "16:29:25", "remaining_time": "2 days, 8:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2188, "total_steps": 9627, "loss": 1.5966, "learning_rate": 8.77869930280145e-05, "epoch": 0.2272774488417991, "percentage": 22.73, "elapsed_time": "16:29:50", "remaining_time": "2 days, 8:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2189, "total_steps": 9627, "loss": 1.7469, "learning_rate": 8.77763057513733e-05, "epoch": 0.22738132336137945, "percentage": 22.74, "elapsed_time": "16:30:16", "remaining_time": "2 days, 8:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2190, "total_steps": 9627, "loss": 1.6986, "learning_rate": 8.77656144518502e-05, "epoch": 0.2274851978809598, "percentage": 22.75, "elapsed_time": "16:30:42", "remaining_time": "2 days, 8:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2191, "total_steps": 9627, "loss": 1.7425, "learning_rate": 8.775491913058376e-05, "epoch": 0.22758907240054016, "percentage": 22.76, "elapsed_time": "16:31:09", "remaining_time": "2 days, 8:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2192, "total_steps": 9627, "loss": 1.7665, "learning_rate": 8.774421978871292e-05, "epoch": 0.2276929469201205, "percentage": 22.77, "elapsed_time": "16:31:34", "remaining_time": "2 days, 8:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2193, "total_steps": 9627, "loss": 1.6914, "learning_rate": 8.773351642737708e-05, "epoch": 0.22779682143970084, "percentage": 22.78, "elapsed_time": "16:31:59", "remaining_time": "2 days, 8:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2194, "total_steps": 9627, "loss": 1.8031, "learning_rate": 8.772280904771608e-05, "epoch": 0.2279006959592812, "percentage": 22.79, "elapsed_time": "16:32:26", "remaining_time": "2 days, 8:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2195, "total_steps": 9627, "loss": 1.7248, "learning_rate": 8.771209765087018e-05, "epoch": 0.22800457047886152, "percentage": 22.8, "elapsed_time": "16:32:51", "remaining_time": "2 days, 8:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2196, "total_steps": 9627, "loss": 1.7994, "learning_rate": 8.770138223798003e-05, "epoch": 0.22810844499844188, "percentage": 22.81, "elapsed_time": "16:33:16", "remaining_time": "2 days, 8:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2197, "total_steps": 9627, "loss": 1.8668, "learning_rate": 8.769066281018676e-05, "epoch": 0.22821231951802223, "percentage": 22.82, "elapsed_time": "16:33:43", "remaining_time": "2 days, 8:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2198, "total_steps": 9627, "loss": 1.7928, "learning_rate": 8.76799393686319e-05, "epoch": 0.2283161940376026, "percentage": 22.83, "elapsed_time": "16:34:08", "remaining_time": "2 days, 8:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2199, "total_steps": 9627, "loss": 1.6981, "learning_rate": 8.766921191445742e-05, "epoch": 0.22842006855718291, "percentage": 22.84, "elapsed_time": "16:34:35", "remaining_time": "2 days, 7:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 9627, "loss": 1.634, "learning_rate": 8.765848044880569e-05, "epoch": 0.22852394307676327, "percentage": 22.85, "elapsed_time": "16:35:01", "remaining_time": "2 days, 7:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2201, "total_steps": 9627, "loss": 1.7564, "learning_rate": 8.764774497281954e-05, "epoch": 0.22862781759634362, "percentage": 22.86, "elapsed_time": "16:35:26", "remaining_time": "2 days, 7:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2202, "total_steps": 9627, "loss": 1.8504, "learning_rate": 8.763700548764223e-05, "epoch": 0.22873169211592395, "percentage": 22.87, "elapsed_time": "16:35:51", "remaining_time": "2 days, 7:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2203, "total_steps": 9627, "loss": 1.5756, "learning_rate": 8.76262619944174e-05, "epoch": 0.2288355666355043, "percentage": 22.88, "elapsed_time": "16:36:17", "remaining_time": "2 days, 7:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2204, "total_steps": 9627, "loss": 1.9804, "learning_rate": 8.761551449428918e-05, "epoch": 0.22893944115508466, "percentage": 22.89, "elapsed_time": "16:36:44", "remaining_time": "2 days, 7:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2205, "total_steps": 9627, "loss": 1.81, "learning_rate": 8.760476298840206e-05, "epoch": 0.22904331567466502, "percentage": 22.9, "elapsed_time": "16:37:08", "remaining_time": "2 days, 7:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2206, "total_steps": 9627, "loss": 1.8159, "learning_rate": 8.7594007477901e-05, "epoch": 0.22914719019424534, "percentage": 22.91, "elapsed_time": "16:37:36", "remaining_time": "2 days, 7:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2207, "total_steps": 9627, "loss": 1.8237, "learning_rate": 8.758324796393142e-05, "epoch": 0.2292510647138257, "percentage": 22.93, "elapsed_time": "16:38:01", "remaining_time": "2 days, 7:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2208, "total_steps": 9627, "loss": 1.6837, "learning_rate": 8.757248444763908e-05, "epoch": 0.22935493923340605, "percentage": 22.94, "elapsed_time": "16:38:27", "remaining_time": "2 days, 7:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2209, "total_steps": 9627, "loss": 1.6408, "learning_rate": 8.756171693017022e-05, "epoch": 0.22945881375298638, "percentage": 22.95, "elapsed_time": "16:38:53", "remaining_time": "2 days, 7:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2210, "total_steps": 9627, "loss": 1.8816, "learning_rate": 8.755094541267149e-05, "epoch": 0.22956268827256673, "percentage": 22.96, "elapsed_time": "16:39:18", "remaining_time": "2 days, 7:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2211, "total_steps": 9627, "loss": 1.9372, "learning_rate": 8.754016989629e-05, "epoch": 0.2296665627921471, "percentage": 22.97, "elapsed_time": "16:39:44", "remaining_time": "2 days, 7:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2212, "total_steps": 9627, "loss": 1.7356, "learning_rate": 8.752939038217322e-05, "epoch": 0.22977043731172744, "percentage": 22.98, "elapsed_time": "16:40:09", "remaining_time": "2 days, 7:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2213, "total_steps": 9627, "loss": 1.7804, "learning_rate": 8.751860687146912e-05, "epoch": 0.22987431183130777, "percentage": 22.99, "elapsed_time": "16:40:36", "remaining_time": "2 days, 7:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2214, "total_steps": 9627, "loss": 1.825, "learning_rate": 8.750781936532604e-05, "epoch": 0.22997818635088813, "percentage": 23.0, "elapsed_time": "16:41:01", "remaining_time": "2 days, 7:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2215, "total_steps": 9627, "loss": 1.7208, "learning_rate": 8.749702786489277e-05, "epoch": 0.23008206087046848, "percentage": 23.01, "elapsed_time": "16:41:26", "remaining_time": "2 days, 7:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2216, "total_steps": 9627, "loss": 1.8447, "learning_rate": 8.748623237131853e-05, "epoch": 0.23018593539004883, "percentage": 23.02, "elapsed_time": "16:41:53", "remaining_time": "2 days, 7:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2217, "total_steps": 9627, "loss": 1.6169, "learning_rate": 8.747543288575293e-05, "epoch": 0.23028980990962916, "percentage": 23.03, "elapsed_time": "16:42:18", "remaining_time": "2 days, 7:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2218, "total_steps": 9627, "loss": 1.6316, "learning_rate": 8.746462940934605e-05, "epoch": 0.23039368442920952, "percentage": 23.04, "elapsed_time": "16:42:44", "remaining_time": "2 days, 7:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2219, "total_steps": 9627, "loss": 1.7359, "learning_rate": 8.745382194324839e-05, "epoch": 0.23049755894878987, "percentage": 23.05, "elapsed_time": "16:43:10", "remaining_time": "2 days, 7:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2220, "total_steps": 9627, "loss": 1.7425, "learning_rate": 8.744301048861083e-05, "epoch": 0.2306014334683702, "percentage": 23.06, "elapsed_time": "16:43:36", "remaining_time": "2 days, 7:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2221, "total_steps": 9627, "loss": 1.8832, "learning_rate": 8.743219504658472e-05, "epoch": 0.23070530798795055, "percentage": 23.07, "elapsed_time": "16:44:02", "remaining_time": "2 days, 7:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2222, "total_steps": 9627, "loss": 1.8591, "learning_rate": 8.742137561832182e-05, "epoch": 0.2308091825075309, "percentage": 23.08, "elapsed_time": "16:44:27", "remaining_time": "2 days, 7:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2223, "total_steps": 9627, "loss": 1.9393, "learning_rate": 8.741055220497431e-05, "epoch": 0.23091305702711126, "percentage": 23.09, "elapsed_time": "16:44:53", "remaining_time": "2 days, 7:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2224, "total_steps": 9627, "loss": 1.8439, "learning_rate": 8.739972480769481e-05, "epoch": 0.2310169315466916, "percentage": 23.1, "elapsed_time": "16:45:19", "remaining_time": "2 days, 7:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2225, "total_steps": 9627, "loss": 1.7198, "learning_rate": 8.738889342763635e-05, "epoch": 0.23112080606627194, "percentage": 23.11, "elapsed_time": "16:45:45", "remaining_time": "2 days, 7:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2226, "total_steps": 9627, "loss": 1.6465, "learning_rate": 8.737805806595239e-05, "epoch": 0.2312246805858523, "percentage": 23.12, "elapsed_time": "16:46:10", "remaining_time": "2 days, 7:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2227, "total_steps": 9627, "loss": 1.7859, "learning_rate": 8.73672187237968e-05, "epoch": 0.23132855510543263, "percentage": 23.13, "elapsed_time": "16:46:37", "remaining_time": "2 days, 7:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2228, "total_steps": 9627, "loss": 1.7008, "learning_rate": 8.735637540232389e-05, "epoch": 0.23143242962501298, "percentage": 23.14, "elapsed_time": "16:47:02", "remaining_time": "2 days, 7:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2229, "total_steps": 9627, "loss": 1.6847, "learning_rate": 8.734552810268838e-05, "epoch": 0.23153630414459334, "percentage": 23.15, "elapsed_time": "16:47:28", "remaining_time": "2 days, 7:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2230, "total_steps": 9627, "loss": 1.7455, "learning_rate": 8.733467682604545e-05, "epoch": 0.2316401786641737, "percentage": 23.16, "elapsed_time": "16:47:53", "remaining_time": "2 days, 7:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2231, "total_steps": 9627, "loss": 1.6726, "learning_rate": 8.732382157355066e-05, "epoch": 0.23174405318375402, "percentage": 23.17, "elapsed_time": "16:48:20", "remaining_time": "2 days, 7:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2232, "total_steps": 9627, "loss": 1.9202, "learning_rate": 8.731296234636e-05, "epoch": 0.23184792770333437, "percentage": 23.18, "elapsed_time": "16:48:45", "remaining_time": "2 days, 7:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2233, "total_steps": 9627, "loss": 1.9388, "learning_rate": 8.73020991456299e-05, "epoch": 0.23195180222291473, "percentage": 23.2, "elapsed_time": "16:49:11", "remaining_time": "2 days, 7:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2234, "total_steps": 9627, "loss": 1.6893, "learning_rate": 8.72912319725172e-05, "epoch": 0.23205567674249505, "percentage": 23.21, "elapsed_time": "16:49:36", "remaining_time": "2 days, 7:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2235, "total_steps": 9627, "loss": 1.812, "learning_rate": 8.72803608281792e-05, "epoch": 0.2321595512620754, "percentage": 23.22, "elapsed_time": "16:50:03", "remaining_time": "2 days, 7:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2236, "total_steps": 9627, "loss": 1.8426, "learning_rate": 8.726948571377356e-05, "epoch": 0.23226342578165576, "percentage": 23.23, "elapsed_time": "16:50:28", "remaining_time": "2 days, 7:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2237, "total_steps": 9627, "loss": 1.6714, "learning_rate": 8.72586066304584e-05, "epoch": 0.23236730030123612, "percentage": 23.24, "elapsed_time": "16:50:54", "remaining_time": "2 days, 7:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2238, "total_steps": 9627, "loss": 1.7595, "learning_rate": 8.724772357939229e-05, "epoch": 0.23247117482081645, "percentage": 23.25, "elapsed_time": "16:51:19", "remaining_time": "2 days, 7:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2239, "total_steps": 9627, "loss": 1.6493, "learning_rate": 8.723683656173413e-05, "epoch": 0.2325750493403968, "percentage": 23.26, "elapsed_time": "16:51:45", "remaining_time": "2 days, 7:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2240, "total_steps": 9627, "loss": 1.7885, "learning_rate": 8.722594557864335e-05, "epoch": 0.23267892385997715, "percentage": 23.27, "elapsed_time": "16:52:11", "remaining_time": "2 days, 7:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2241, "total_steps": 9627, "loss": 1.6947, "learning_rate": 8.721505063127972e-05, "epoch": 0.23278279837955748, "percentage": 23.28, "elapsed_time": "16:52:36", "remaining_time": "2 days, 7:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2242, "total_steps": 9627, "loss": 1.8158, "learning_rate": 8.72041517208035e-05, "epoch": 0.23288667289913784, "percentage": 23.29, "elapsed_time": "16:53:03", "remaining_time": "2 days, 7:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2243, "total_steps": 9627, "loss": 1.7928, "learning_rate": 8.719324884837531e-05, "epoch": 0.2329905474187182, "percentage": 23.3, "elapsed_time": "16:53:28", "remaining_time": "2 days, 7:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2244, "total_steps": 9627, "loss": 1.7782, "learning_rate": 8.718234201515627e-05, "epoch": 0.23309442193829855, "percentage": 23.31, "elapsed_time": "16:53:54", "remaining_time": "2 days, 7:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2245, "total_steps": 9627, "loss": 1.6527, "learning_rate": 8.717143122230782e-05, "epoch": 0.23319829645787887, "percentage": 23.32, "elapsed_time": "16:54:20", "remaining_time": "2 days, 7:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2246, "total_steps": 9627, "loss": 1.8666, "learning_rate": 8.71605164709919e-05, "epoch": 0.23330217097745923, "percentage": 23.33, "elapsed_time": "16:54:44", "remaining_time": "2 days, 7:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2247, "total_steps": 9627, "loss": 1.7043, "learning_rate": 8.714959776237083e-05, "epoch": 0.23340604549703958, "percentage": 23.34, "elapsed_time": "16:55:11", "remaining_time": "2 days, 7:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2248, "total_steps": 9627, "loss": 2.007, "learning_rate": 8.713867509760738e-05, "epoch": 0.2335099200166199, "percentage": 23.35, "elapsed_time": "16:55:37", "remaining_time": "2 days, 7:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2249, "total_steps": 9627, "loss": 1.7151, "learning_rate": 8.712774847786471e-05, "epoch": 0.23361379453620026, "percentage": 23.36, "elapsed_time": "16:56:02", "remaining_time": "2 days, 7:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 9627, "loss": 1.8144, "learning_rate": 8.711681790430645e-05, "epoch": 0.23371766905578062, "percentage": 23.37, "elapsed_time": "16:56:28", "remaining_time": "2 days, 7:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2251, "total_steps": 9627, "loss": 1.9487, "learning_rate": 8.710588337809662e-05, "epoch": 0.23382154357536097, "percentage": 23.38, "elapsed_time": "16:56:53", "remaining_time": "2 days, 7:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2252, "total_steps": 9627, "loss": 1.6245, "learning_rate": 8.709494490039963e-05, "epoch": 0.2339254180949413, "percentage": 23.39, "elapsed_time": "16:57:19", "remaining_time": "2 days, 7:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2253, "total_steps": 9627, "loss": 1.8078, "learning_rate": 8.708400247238035e-05, "epoch": 0.23402929261452166, "percentage": 23.4, "elapsed_time": "16:57:44", "remaining_time": "2 days, 7:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2254, "total_steps": 9627, "loss": 1.7107, "learning_rate": 8.707305609520408e-05, "epoch": 0.234133167134102, "percentage": 23.41, "elapsed_time": "16:58:10", "remaining_time": "2 days, 7:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2255, "total_steps": 9627, "loss": 1.6238, "learning_rate": 8.706210577003653e-05, "epoch": 0.23423704165368237, "percentage": 23.42, "elapsed_time": "16:58:36", "remaining_time": "2 days, 7:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2256, "total_steps": 9627, "loss": 1.7069, "learning_rate": 8.705115149804381e-05, "epoch": 0.2343409161732627, "percentage": 23.43, "elapsed_time": "16:59:02", "remaining_time": "2 days, 7:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2257, "total_steps": 9627, "loss": 1.6198, "learning_rate": 8.704019328039244e-05, "epoch": 0.23444479069284305, "percentage": 23.44, "elapsed_time": "16:59:28", "remaining_time": "2 days, 7:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2258, "total_steps": 9627, "loss": 1.8176, "learning_rate": 8.702923111824943e-05, "epoch": 0.2345486652124234, "percentage": 23.45, "elapsed_time": "16:59:53", "remaining_time": "2 days, 7:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2259, "total_steps": 9627, "loss": 1.7607, "learning_rate": 8.701826501278216e-05, "epoch": 0.23465253973200373, "percentage": 23.47, "elapsed_time": "17:00:19", "remaining_time": "2 days, 7:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2260, "total_steps": 9627, "loss": 1.765, "learning_rate": 8.70072949651584e-05, "epoch": 0.23475641425158408, "percentage": 23.48, "elapsed_time": "17:00:45", "remaining_time": "2 days, 7:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2261, "total_steps": 9627, "loss": 1.6595, "learning_rate": 8.69963209765464e-05, "epoch": 0.23486028877116444, "percentage": 23.49, "elapsed_time": "17:01:11", "remaining_time": "2 days, 7:26:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2262, "total_steps": 9627, "loss": 1.4557, "learning_rate": 8.698534304811478e-05, "epoch": 0.2349641632907448, "percentage": 23.5, "elapsed_time": "17:01:36", "remaining_time": "2 days, 7:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2263, "total_steps": 9627, "loss": 1.8497, "learning_rate": 8.697436118103264e-05, "epoch": 0.23506803781032512, "percentage": 23.51, "elapsed_time": "17:02:03", "remaining_time": "2 days, 7:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2264, "total_steps": 9627, "loss": 1.7943, "learning_rate": 8.696337537646944e-05, "epoch": 0.23517191232990547, "percentage": 23.52, "elapsed_time": "17:02:29", "remaining_time": "2 days, 7:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2265, "total_steps": 9627, "loss": 1.9579, "learning_rate": 8.695238563559509e-05, "epoch": 0.23527578684948583, "percentage": 23.53, "elapsed_time": "17:02:53", "remaining_time": "2 days, 7:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2266, "total_steps": 9627, "loss": 1.7782, "learning_rate": 8.694139195957991e-05, "epoch": 0.23537966136906616, "percentage": 23.54, "elapsed_time": "17:03:20", "remaining_time": "2 days, 7:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2267, "total_steps": 9627, "loss": 1.7276, "learning_rate": 8.693039434959464e-05, "epoch": 0.2354835358886465, "percentage": 23.55, "elapsed_time": "17:03:46", "remaining_time": "2 days, 7:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2268, "total_steps": 9627, "loss": 1.818, "learning_rate": 8.691939280681045e-05, "epoch": 0.23558741040822687, "percentage": 23.56, "elapsed_time": "17:04:11", "remaining_time": "2 days, 7:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2269, "total_steps": 9627, "loss": 1.7603, "learning_rate": 8.69083873323989e-05, "epoch": 0.23569128492780722, "percentage": 23.57, "elapsed_time": "17:04:38", "remaining_time": "2 days, 7:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2270, "total_steps": 9627, "loss": 1.6039, "learning_rate": 8.689737792753198e-05, "epoch": 0.23579515944738755, "percentage": 23.58, "elapsed_time": "17:05:03", "remaining_time": "2 days, 7:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2271, "total_steps": 9627, "loss": 1.8416, "learning_rate": 8.688636459338215e-05, "epoch": 0.2358990339669679, "percentage": 23.59, "elapsed_time": "17:05:30", "remaining_time": "2 days, 7:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2272, "total_steps": 9627, "loss": 1.6987, "learning_rate": 8.68753473311222e-05, "epoch": 0.23600290848654826, "percentage": 23.6, "elapsed_time": "17:05:55", "remaining_time": "2 days, 7:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2273, "total_steps": 9627, "loss": 1.9472, "learning_rate": 8.686432614192538e-05, "epoch": 0.23610678300612858, "percentage": 23.61, "elapsed_time": "17:06:20", "remaining_time": "2 days, 7:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2274, "total_steps": 9627, "loss": 1.8414, "learning_rate": 8.68533010269654e-05, "epoch": 0.23621065752570894, "percentage": 23.62, "elapsed_time": "17:06:45", "remaining_time": "2 days, 7:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2275, "total_steps": 9627, "loss": 1.5978, "learning_rate": 8.684227198741633e-05, "epoch": 0.2363145320452893, "percentage": 23.63, "elapsed_time": "17:07:11", "remaining_time": "2 days, 7:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2276, "total_steps": 9627, "loss": 1.7981, "learning_rate": 8.683123902445267e-05, "epoch": 0.23641840656486965, "percentage": 23.64, "elapsed_time": "17:07:38", "remaining_time": "2 days, 7:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2277, "total_steps": 9627, "loss": 1.7098, "learning_rate": 8.682020213924935e-05, "epoch": 0.23652228108444998, "percentage": 23.65, "elapsed_time": "17:08:03", "remaining_time": "2 days, 7:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2278, "total_steps": 9627, "loss": 1.661, "learning_rate": 8.680916133298171e-05, "epoch": 0.23662615560403033, "percentage": 23.66, "elapsed_time": "17:08:29", "remaining_time": "2 days, 7:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2279, "total_steps": 9627, "loss": 1.5888, "learning_rate": 8.67981166068255e-05, "epoch": 0.23673003012361069, "percentage": 23.67, "elapsed_time": "17:08:54", "remaining_time": "2 days, 7:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2280, "total_steps": 9627, "loss": 1.7733, "learning_rate": 8.678706796195692e-05, "epoch": 0.236833904643191, "percentage": 23.68, "elapsed_time": "17:09:20", "remaining_time": "2 days, 7:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2281, "total_steps": 9627, "loss": 1.8096, "learning_rate": 8.677601539955256e-05, "epoch": 0.23693777916277137, "percentage": 23.69, "elapsed_time": "17:09:46", "remaining_time": "2 days, 7:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2282, "total_steps": 9627, "loss": 1.6919, "learning_rate": 8.676495892078941e-05, "epoch": 0.23704165368235172, "percentage": 23.7, "elapsed_time": "17:10:12", "remaining_time": "2 days, 7:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2283, "total_steps": 9627, "loss": 1.9165, "learning_rate": 8.675389852684492e-05, "epoch": 0.23714552820193208, "percentage": 23.71, "elapsed_time": "17:10:37", "remaining_time": "2 days, 7:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2284, "total_steps": 9627, "loss": 1.6767, "learning_rate": 8.674283421889691e-05, "epoch": 0.2372494027215124, "percentage": 23.72, "elapsed_time": "17:11:03", "remaining_time": "2 days, 7:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2285, "total_steps": 9627, "loss": 1.7891, "learning_rate": 8.673176599812368e-05, "epoch": 0.23735327724109276, "percentage": 23.74, "elapsed_time": "17:11:29", "remaining_time": "2 days, 7:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2286, "total_steps": 9627, "loss": 1.9999, "learning_rate": 8.672069386570389e-05, "epoch": 0.2374571517606731, "percentage": 23.75, "elapsed_time": "17:11:54", "remaining_time": "2 days, 7:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2287, "total_steps": 9627, "loss": 1.8249, "learning_rate": 8.670961782281664e-05, "epoch": 0.23756102628025344, "percentage": 23.76, "elapsed_time": "17:12:20", "remaining_time": "2 days, 7:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2288, "total_steps": 9627, "loss": 1.8532, "learning_rate": 8.669853787064142e-05, "epoch": 0.2376649007998338, "percentage": 23.77, "elapsed_time": "17:12:46", "remaining_time": "2 days, 7:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2289, "total_steps": 9627, "loss": 1.7474, "learning_rate": 8.668745401035818e-05, "epoch": 0.23776877531941415, "percentage": 23.78, "elapsed_time": "17:13:11", "remaining_time": "2 days, 7:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2290, "total_steps": 9627, "loss": 1.8941, "learning_rate": 8.667636624314725e-05, "epoch": 0.2378726498389945, "percentage": 23.79, "elapsed_time": "17:13:37", "remaining_time": "2 days, 7:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2291, "total_steps": 9627, "loss": 1.985, "learning_rate": 8.666527457018943e-05, "epoch": 0.23797652435857483, "percentage": 23.8, "elapsed_time": "17:14:04", "remaining_time": "2 days, 7:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2292, "total_steps": 9627, "loss": 1.6889, "learning_rate": 8.665417899266586e-05, "epoch": 0.23808039887815519, "percentage": 23.81, "elapsed_time": "17:14:28", "remaining_time": "2 days, 7:10:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2293, "total_steps": 9627, "loss": 1.5088, "learning_rate": 8.664307951175814e-05, "epoch": 0.23818427339773554, "percentage": 23.82, "elapsed_time": "17:14:54", "remaining_time": "2 days, 7:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2294, "total_steps": 9627, "loss": 1.7288, "learning_rate": 8.663197612864827e-05, "epoch": 0.2382881479173159, "percentage": 23.83, "elapsed_time": "17:15:20", "remaining_time": "2 days, 7:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2295, "total_steps": 9627, "loss": 1.8472, "learning_rate": 8.662086884451869e-05, "epoch": 0.23839202243689622, "percentage": 23.84, "elapsed_time": "17:15:46", "remaining_time": "2 days, 7:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2296, "total_steps": 9627, "loss": 1.8897, "learning_rate": 8.660975766055224e-05, "epoch": 0.23849589695647658, "percentage": 23.85, "elapsed_time": "17:16:11", "remaining_time": "2 days, 7:08:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2297, "total_steps": 9627, "loss": 1.9391, "learning_rate": 8.659864257793215e-05, "epoch": 0.23859977147605693, "percentage": 23.86, "elapsed_time": "17:16:37", "remaining_time": "2 days, 7:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2298, "total_steps": 9627, "loss": 1.7464, "learning_rate": 8.65875235978421e-05, "epoch": 0.23870364599563726, "percentage": 23.87, "elapsed_time": "17:17:02", "remaining_time": "2 days, 7:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2299, "total_steps": 9627, "loss": 1.7393, "learning_rate": 8.65764007214662e-05, "epoch": 0.23880752051521761, "percentage": 23.88, "elapsed_time": "17:17:29", "remaining_time": "2 days, 7:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 9627, "loss": 1.6336, "learning_rate": 8.656527394998892e-05, "epoch": 0.23891139503479797, "percentage": 23.89, "elapsed_time": "17:17:55", "remaining_time": "2 days, 7:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2301, "total_steps": 9627, "loss": 1.8982, "learning_rate": 8.655414328459519e-05, "epoch": 0.23901526955437832, "percentage": 23.9, "elapsed_time": "17:18:19", "remaining_time": "2 days, 7:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2302, "total_steps": 9627, "loss": 1.6851, "learning_rate": 8.654300872647033e-05, "epoch": 0.23911914407395865, "percentage": 23.91, "elapsed_time": "17:18:46", "remaining_time": "2 days, 7:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2303, "total_steps": 9627, "loss": 1.8767, "learning_rate": 8.65318702768001e-05, "epoch": 0.239223018593539, "percentage": 23.92, "elapsed_time": "17:19:11", "remaining_time": "2 days, 7:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2304, "total_steps": 9627, "loss": 1.725, "learning_rate": 8.652072793677061e-05, "epoch": 0.23932689311311936, "percentage": 23.93, "elapsed_time": "17:19:36", "remaining_time": "2 days, 7:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2305, "total_steps": 9627, "loss": 1.9115, "learning_rate": 8.650958170756852e-05, "epoch": 0.2394307676326997, "percentage": 23.94, "elapsed_time": "17:20:02", "remaining_time": "2 days, 7:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2306, "total_steps": 9627, "loss": 1.698, "learning_rate": 8.649843159038071e-05, "epoch": 0.23953464215228004, "percentage": 23.95, "elapsed_time": "17:20:28", "remaining_time": "2 days, 7:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2307, "total_steps": 9627, "loss": 1.8998, "learning_rate": 8.648727758639467e-05, "epoch": 0.2396385166718604, "percentage": 23.96, "elapsed_time": "17:20:54", "remaining_time": "2 days, 7:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2308, "total_steps": 9627, "loss": 1.7095, "learning_rate": 8.647611969679816e-05, "epoch": 0.23974239119144075, "percentage": 23.97, "elapsed_time": "17:21:19", "remaining_time": "2 days, 7:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2309, "total_steps": 9627, "loss": 1.9387, "learning_rate": 8.646495792277943e-05, "epoch": 0.23984626571102108, "percentage": 23.98, "elapsed_time": "17:21:44", "remaining_time": "2 days, 7:01:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2310, "total_steps": 9627, "loss": 1.8302, "learning_rate": 8.645379226552712e-05, "epoch": 0.23995014023060143, "percentage": 24.0, "elapsed_time": "17:22:11", "remaining_time": "2 days, 7:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2311, "total_steps": 9627, "loss": 1.6717, "learning_rate": 8.644262272623029e-05, "epoch": 0.2400540147501818, "percentage": 24.01, "elapsed_time": "17:22:37", "remaining_time": "2 days, 7:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2312, "total_steps": 9627, "loss": 1.6446, "learning_rate": 8.64314493060784e-05, "epoch": 0.24015788926976211, "percentage": 24.02, "elapsed_time": "17:23:03", "remaining_time": "2 days, 7:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2313, "total_steps": 9627, "loss": 1.7145, "learning_rate": 8.642027200626135e-05, "epoch": 0.24026176378934247, "percentage": 24.03, "elapsed_time": "17:23:28", "remaining_time": "2 days, 6:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2314, "total_steps": 9627, "loss": 1.7144, "learning_rate": 8.640909082796939e-05, "epoch": 0.24036563830892282, "percentage": 24.04, "elapsed_time": "17:23:54", "remaining_time": "2 days, 6:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2315, "total_steps": 9627, "loss": 1.8516, "learning_rate": 8.639790577239328e-05, "epoch": 0.24046951282850318, "percentage": 24.05, "elapsed_time": "17:24:19", "remaining_time": "2 days, 6:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2316, "total_steps": 9627, "loss": 1.6144, "learning_rate": 8.638671684072412e-05, "epoch": 0.2405733873480835, "percentage": 24.06, "elapsed_time": "17:24:45", "remaining_time": "2 days, 6:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2317, "total_steps": 9627, "loss": 1.7601, "learning_rate": 8.637552403415343e-05, "epoch": 0.24067726186766386, "percentage": 24.07, "elapsed_time": "17:25:11", "remaining_time": "2 days, 6:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2318, "total_steps": 9627, "loss": 1.798, "learning_rate": 8.636432735387319e-05, "epoch": 0.24078113638724422, "percentage": 24.08, "elapsed_time": "17:25:36", "remaining_time": "2 days, 6:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2319, "total_steps": 9627, "loss": 1.551, "learning_rate": 8.635312680107572e-05, "epoch": 0.24088501090682454, "percentage": 24.09, "elapsed_time": "17:26:03", "remaining_time": "2 days, 6:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2320, "total_steps": 9627, "loss": 1.6926, "learning_rate": 8.634192237695382e-05, "epoch": 0.2409888854264049, "percentage": 24.1, "elapsed_time": "17:26:28", "remaining_time": "2 days, 6:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2321, "total_steps": 9627, "loss": 1.604, "learning_rate": 8.633071408270065e-05, "epoch": 0.24109275994598525, "percentage": 24.11, "elapsed_time": "17:26:53", "remaining_time": "2 days, 6:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2322, "total_steps": 9627, "loss": 2.0036, "learning_rate": 8.631950191950983e-05, "epoch": 0.2411966344655656, "percentage": 24.12, "elapsed_time": "17:27:19", "remaining_time": "2 days, 6:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2323, "total_steps": 9627, "loss": 1.7145, "learning_rate": 8.630828588857537e-05, "epoch": 0.24130050898514593, "percentage": 24.13, "elapsed_time": "17:27:44", "remaining_time": "2 days, 6:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2324, "total_steps": 9627, "loss": 1.7844, "learning_rate": 8.629706599109169e-05, "epoch": 0.2414043835047263, "percentage": 24.14, "elapsed_time": "17:28:11", "remaining_time": "2 days, 6:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2325, "total_steps": 9627, "loss": 1.586, "learning_rate": 8.628584222825357e-05, "epoch": 0.24150825802430664, "percentage": 24.15, "elapsed_time": "17:28:36", "remaining_time": "2 days, 6:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2326, "total_steps": 9627, "loss": 1.6915, "learning_rate": 8.627461460125632e-05, "epoch": 0.241612132543887, "percentage": 24.16, "elapsed_time": "17:29:02", "remaining_time": "2 days, 6:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2327, "total_steps": 9627, "loss": 1.7567, "learning_rate": 8.626338311129557e-05, "epoch": 0.24171600706346733, "percentage": 24.17, "elapsed_time": "17:29:28", "remaining_time": "2 days, 6:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2328, "total_steps": 9627, "loss": 1.6969, "learning_rate": 8.625214775956737e-05, "epoch": 0.24181988158304768, "percentage": 24.18, "elapsed_time": "17:29:53", "remaining_time": "2 days, 6:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2329, "total_steps": 9627, "loss": 1.6198, "learning_rate": 8.624090854726822e-05, "epoch": 0.24192375610262803, "percentage": 24.19, "elapsed_time": "17:30:19", "remaining_time": "2 days, 6:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2330, "total_steps": 9627, "loss": 1.7932, "learning_rate": 8.622966547559499e-05, "epoch": 0.24202763062220836, "percentage": 24.2, "elapsed_time": "17:30:45", "remaining_time": "2 days, 6:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2331, "total_steps": 9627, "loss": 1.8561, "learning_rate": 8.621841854574501e-05, "epoch": 0.24213150514178872, "percentage": 24.21, "elapsed_time": "17:31:11", "remaining_time": "2 days, 6:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2332, "total_steps": 9627, "loss": 1.5224, "learning_rate": 8.620716775891595e-05, "epoch": 0.24223537966136907, "percentage": 24.22, "elapsed_time": "17:31:37", "remaining_time": "2 days, 6:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2333, "total_steps": 9627, "loss": 1.8392, "learning_rate": 8.619591311630595e-05, "epoch": 0.24233925418094943, "percentage": 24.23, "elapsed_time": "17:32:02", "remaining_time": "2 days, 6:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2334, "total_steps": 9627, "loss": 1.7624, "learning_rate": 8.618465461911355e-05, "epoch": 0.24244312870052975, "percentage": 24.24, "elapsed_time": "17:32:28", "remaining_time": "2 days, 6:48:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2335, "total_steps": 9627, "loss": 1.6901, "learning_rate": 8.617339226853768e-05, "epoch": 0.2425470032201101, "percentage": 24.25, "elapsed_time": "17:32:53", "remaining_time": "2 days, 6:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2336, "total_steps": 9627, "loss": 1.8461, "learning_rate": 8.61621260657777e-05, "epoch": 0.24265087773969046, "percentage": 24.27, "elapsed_time": "17:33:20", "remaining_time": "2 days, 6:47:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2337, "total_steps": 9627, "loss": 1.6562, "learning_rate": 8.615085601203337e-05, "epoch": 0.2427547522592708, "percentage": 24.28, "elapsed_time": "17:33:45", "remaining_time": "2 days, 6:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2338, "total_steps": 9627, "loss": 1.7862, "learning_rate": 8.613958210850485e-05, "epoch": 0.24285862677885114, "percentage": 24.29, "elapsed_time": "17:34:10", "remaining_time": "2 days, 6:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2339, "total_steps": 9627, "loss": 1.9233, "learning_rate": 8.612830435639275e-05, "epoch": 0.2429625012984315, "percentage": 24.3, "elapsed_time": "17:34:36", "remaining_time": "2 days, 6:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2340, "total_steps": 9627, "loss": 1.8637, "learning_rate": 8.611702275689805e-05, "epoch": 0.24306637581801185, "percentage": 24.31, "elapsed_time": "17:35:02", "remaining_time": "2 days, 6:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2341, "total_steps": 9627, "loss": 1.7277, "learning_rate": 8.610573731122214e-05, "epoch": 0.24317025033759218, "percentage": 24.32, "elapsed_time": "17:35:28", "remaining_time": "2 days, 6:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2342, "total_steps": 9627, "loss": 1.7141, "learning_rate": 8.609444802056686e-05, "epoch": 0.24327412485717254, "percentage": 24.33, "elapsed_time": "17:35:54", "remaining_time": "2 days, 6:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2343, "total_steps": 9627, "loss": 1.7315, "learning_rate": 8.608315488613439e-05, "epoch": 0.2433779993767529, "percentage": 24.34, "elapsed_time": "17:36:19", "remaining_time": "2 days, 6:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2344, "total_steps": 9627, "loss": 1.712, "learning_rate": 8.607185790912739e-05, "epoch": 0.24348187389633322, "percentage": 24.35, "elapsed_time": "17:36:45", "remaining_time": "2 days, 6:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2345, "total_steps": 9627, "loss": 1.7046, "learning_rate": 8.60605570907489e-05, "epoch": 0.24358574841591357, "percentage": 24.36, "elapsed_time": "17:37:11", "remaining_time": "2 days, 6:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2346, "total_steps": 9627, "loss": 1.8009, "learning_rate": 8.604925243220235e-05, "epoch": 0.24368962293549393, "percentage": 24.37, "elapsed_time": "17:37:36", "remaining_time": "2 days, 6:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2347, "total_steps": 9627, "loss": 1.8602, "learning_rate": 8.603794393469162e-05, "epoch": 0.24379349745507428, "percentage": 24.38, "elapsed_time": "17:38:02", "remaining_time": "2 days, 6:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2348, "total_steps": 9627, "loss": 1.8524, "learning_rate": 8.602663159942098e-05, "epoch": 0.2438973719746546, "percentage": 24.39, "elapsed_time": "17:38:27", "remaining_time": "2 days, 6:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2349, "total_steps": 9627, "loss": 1.722, "learning_rate": 8.601531542759506e-05, "epoch": 0.24400124649423496, "percentage": 24.4, "elapsed_time": "17:38:54", "remaining_time": "2 days, 6:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 9627, "loss": 1.7846, "learning_rate": 8.600399542041901e-05, "epoch": 0.24410512101381532, "percentage": 24.41, "elapsed_time": "17:39:18", "remaining_time": "2 days, 6:40:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2351, "total_steps": 9627, "loss": 1.7255, "learning_rate": 8.599267157909827e-05, "epoch": 0.24420899553339565, "percentage": 24.42, "elapsed_time": "17:39:45", "remaining_time": "2 days, 6:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2352, "total_steps": 9627, "loss": 1.8129, "learning_rate": 8.598134390483879e-05, "epoch": 0.244312870052976, "percentage": 24.43, "elapsed_time": "17:40:10", "remaining_time": "2 days, 6:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2353, "total_steps": 9627, "loss": 2.0753, "learning_rate": 8.59700123988468e-05, "epoch": 0.24441674457255635, "percentage": 24.44, "elapsed_time": "17:40:35", "remaining_time": "2 days, 6:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2354, "total_steps": 9627, "loss": 1.8298, "learning_rate": 8.595867706232911e-05, "epoch": 0.2445206190921367, "percentage": 24.45, "elapsed_time": "17:41:01", "remaining_time": "2 days, 6:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2355, "total_steps": 9627, "loss": 1.7315, "learning_rate": 8.594733789649279e-05, "epoch": 0.24462449361171704, "percentage": 24.46, "elapsed_time": "17:41:27", "remaining_time": "2 days, 6:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2356, "total_steps": 9627, "loss": 1.6989, "learning_rate": 8.593599490254538e-05, "epoch": 0.2447283681312974, "percentage": 24.47, "elapsed_time": "17:41:52", "remaining_time": "2 days, 6:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2357, "total_steps": 9627, "loss": 1.7326, "learning_rate": 8.592464808169482e-05, "epoch": 0.24483224265087775, "percentage": 24.48, "elapsed_time": "17:42:19", "remaining_time": "2 days, 6:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2358, "total_steps": 9627, "loss": 1.774, "learning_rate": 8.591329743514947e-05, "epoch": 0.24493611717045807, "percentage": 24.49, "elapsed_time": "17:42:44", "remaining_time": "2 days, 6:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2359, "total_steps": 9627, "loss": 2.0193, "learning_rate": 8.590194296411806e-05, "epoch": 0.24503999169003843, "percentage": 24.5, "elapsed_time": "17:43:10", "remaining_time": "2 days, 6:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2360, "total_steps": 9627, "loss": 1.6699, "learning_rate": 8.589058466980979e-05, "epoch": 0.24514386620961878, "percentage": 24.51, "elapsed_time": "17:43:35", "remaining_time": "2 days, 6:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2361, "total_steps": 9627, "loss": 1.6759, "learning_rate": 8.587922255343421e-05, "epoch": 0.24524774072919914, "percentage": 24.52, "elapsed_time": "17:44:01", "remaining_time": "2 days, 6:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2362, "total_steps": 9627, "loss": 1.4792, "learning_rate": 8.58678566162013e-05, "epoch": 0.24535161524877946, "percentage": 24.54, "elapsed_time": "17:44:26", "remaining_time": "2 days, 6:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2363, "total_steps": 9627, "loss": 1.7362, "learning_rate": 8.585648685932141e-05, "epoch": 0.24545548976835982, "percentage": 24.55, "elapsed_time": "17:44:53", "remaining_time": "2 days, 6:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2364, "total_steps": 9627, "loss": 1.8942, "learning_rate": 8.58451132840054e-05, "epoch": 0.24555936428794017, "percentage": 24.56, "elapsed_time": "17:45:19", "remaining_time": "2 days, 6:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2365, "total_steps": 9627, "loss": 1.8449, "learning_rate": 8.58337358914644e-05, "epoch": 0.24566323880752053, "percentage": 24.57, "elapsed_time": "17:45:44", "remaining_time": "2 days, 6:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2366, "total_steps": 9627, "loss": 1.88, "learning_rate": 8.582235468291007e-05, "epoch": 0.24576711332710086, "percentage": 24.58, "elapsed_time": "17:46:09", "remaining_time": "2 days, 6:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2367, "total_steps": 9627, "loss": 1.8228, "learning_rate": 8.581096965955436e-05, "epoch": 0.2458709878466812, "percentage": 24.59, "elapsed_time": "17:46:35", "remaining_time": "2 days, 6:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2368, "total_steps": 9627, "loss": 1.7457, "learning_rate": 8.579958082260973e-05, "epoch": 0.24597486236626157, "percentage": 24.6, "elapsed_time": "17:47:00", "remaining_time": "2 days, 6:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2369, "total_steps": 9627, "loss": 1.8158, "learning_rate": 8.5788188173289e-05, "epoch": 0.2460787368858419, "percentage": 24.61, "elapsed_time": "17:47:25", "remaining_time": "2 days, 6:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2370, "total_steps": 9627, "loss": 1.8368, "learning_rate": 8.577679171280537e-05, "epoch": 0.24618261140542225, "percentage": 24.62, "elapsed_time": "17:47:50", "remaining_time": "2 days, 6:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2371, "total_steps": 9627, "loss": 1.6665, "learning_rate": 8.57653914423725e-05, "epoch": 0.2462864859250026, "percentage": 24.63, "elapsed_time": "17:48:17", "remaining_time": "2 days, 6:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2372, "total_steps": 9627, "loss": 1.8557, "learning_rate": 8.575398736320442e-05, "epoch": 0.24639036044458296, "percentage": 24.64, "elapsed_time": "17:48:43", "remaining_time": "2 days, 6:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2373, "total_steps": 9627, "loss": 1.6039, "learning_rate": 8.574257947651558e-05, "epoch": 0.24649423496416328, "percentage": 24.65, "elapsed_time": "17:49:09", "remaining_time": "2 days, 6:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2374, "total_steps": 9627, "loss": 1.85, "learning_rate": 8.573116778352084e-05, "epoch": 0.24659810948374364, "percentage": 24.66, "elapsed_time": "17:49:34", "remaining_time": "2 days, 6:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2375, "total_steps": 9627, "loss": 1.8249, "learning_rate": 8.571975228543543e-05, "epoch": 0.246701984003324, "percentage": 24.67, "elapsed_time": "17:50:00", "remaining_time": "2 days, 6:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2376, "total_steps": 9627, "loss": 1.7355, "learning_rate": 8.570833298347502e-05, "epoch": 0.24680585852290432, "percentage": 24.68, "elapsed_time": "17:50:25", "remaining_time": "2 days, 6:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2377, "total_steps": 9627, "loss": 1.5235, "learning_rate": 8.56969098788557e-05, "epoch": 0.24690973304248467, "percentage": 24.69, "elapsed_time": "17:50:52", "remaining_time": "2 days, 6:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2378, "total_steps": 9627, "loss": 1.8553, "learning_rate": 8.568548297279392e-05, "epoch": 0.24701360756206503, "percentage": 24.7, "elapsed_time": "17:51:17", "remaining_time": "2 days, 6:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2379, "total_steps": 9627, "loss": 1.4544, "learning_rate": 8.567405226650656e-05, "epoch": 0.24711748208164538, "percentage": 24.71, "elapsed_time": "17:51:42", "remaining_time": "2 days, 6:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2380, "total_steps": 9627, "loss": 1.7564, "learning_rate": 8.56626177612109e-05, "epoch": 0.2472213566012257, "percentage": 24.72, "elapsed_time": "17:52:08", "remaining_time": "2 days, 6:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2381, "total_steps": 9627, "loss": 1.8172, "learning_rate": 8.565117945812463e-05, "epoch": 0.24732523112080607, "percentage": 24.73, "elapsed_time": "17:52:34", "remaining_time": "2 days, 6:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2382, "total_steps": 9627, "loss": 1.6763, "learning_rate": 8.563973735846583e-05, "epoch": 0.24742910564038642, "percentage": 24.74, "elapsed_time": "17:52:59", "remaining_time": "2 days, 6:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2383, "total_steps": 9627, "loss": 1.7017, "learning_rate": 8.562829146345301e-05, "epoch": 0.24753298015996675, "percentage": 24.75, "elapsed_time": "17:53:25", "remaining_time": "2 days, 6:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2384, "total_steps": 9627, "loss": 1.6087, "learning_rate": 8.561684177430507e-05, "epoch": 0.2476368546795471, "percentage": 24.76, "elapsed_time": "17:53:51", "remaining_time": "2 days, 6:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2385, "total_steps": 9627, "loss": 1.6795, "learning_rate": 8.560538829224129e-05, "epoch": 0.24774072919912746, "percentage": 24.77, "elapsed_time": "17:54:17", "remaining_time": "2 days, 6:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2386, "total_steps": 9627, "loss": 1.7984, "learning_rate": 8.559393101848139e-05, "epoch": 0.2478446037187078, "percentage": 24.78, "elapsed_time": "17:54:42", "remaining_time": "2 days, 6:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2387, "total_steps": 9627, "loss": 1.5587, "learning_rate": 8.558246995424548e-05, "epoch": 0.24794847823828814, "percentage": 24.79, "elapsed_time": "17:55:08", "remaining_time": "2 days, 6:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2388, "total_steps": 9627, "loss": 1.6269, "learning_rate": 8.557100510075406e-05, "epoch": 0.2480523527578685, "percentage": 24.81, "elapsed_time": "17:55:34", "remaining_time": "2 days, 6:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2389, "total_steps": 9627, "loss": 2.0851, "learning_rate": 8.555953645922809e-05, "epoch": 0.24815622727744885, "percentage": 24.82, "elapsed_time": "17:55:59", "remaining_time": "2 days, 6:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2390, "total_steps": 9627, "loss": 1.5321, "learning_rate": 8.554806403088884e-05, "epoch": 0.24826010179702918, "percentage": 24.83, "elapsed_time": "17:56:26", "remaining_time": "2 days, 6:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2391, "total_steps": 9627, "loss": 1.7002, "learning_rate": 8.553658781695807e-05, "epoch": 0.24836397631660953, "percentage": 24.84, "elapsed_time": "17:56:52", "remaining_time": "2 days, 6:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2392, "total_steps": 9627, "loss": 1.74, "learning_rate": 8.552510781865788e-05, "epoch": 0.24846785083618989, "percentage": 24.85, "elapsed_time": "17:57:17", "remaining_time": "2 days, 6:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2393, "total_steps": 9627, "loss": 1.7332, "learning_rate": 8.551362403721084e-05, "epoch": 0.24857172535577024, "percentage": 24.86, "elapsed_time": "17:57:43", "remaining_time": "2 days, 6:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2394, "total_steps": 9627, "loss": 1.8173, "learning_rate": 8.550213647383982e-05, "epoch": 0.24867559987535057, "percentage": 24.87, "elapsed_time": "17:58:08", "remaining_time": "2 days, 6:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2395, "total_steps": 9627, "loss": 1.824, "learning_rate": 8.549064512976822e-05, "epoch": 0.24877947439493092, "percentage": 24.88, "elapsed_time": "17:58:35", "remaining_time": "2 days, 6:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2396, "total_steps": 9627, "loss": 1.7691, "learning_rate": 8.547915000621974e-05, "epoch": 0.24888334891451128, "percentage": 24.89, "elapsed_time": "17:58:59", "remaining_time": "2 days, 6:16:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2397, "total_steps": 9627, "loss": 1.7228, "learning_rate": 8.546765110441855e-05, "epoch": 0.2489872234340916, "percentage": 24.9, "elapsed_time": "17:59:27", "remaining_time": "2 days, 6:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2398, "total_steps": 9627, "loss": 1.613, "learning_rate": 8.545614842558915e-05, "epoch": 0.24909109795367196, "percentage": 24.91, "elapsed_time": "17:59:51", "remaining_time": "2 days, 6:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2399, "total_steps": 9627, "loss": 1.6443, "learning_rate": 8.544464197095651e-05, "epoch": 0.2491949724732523, "percentage": 24.92, "elapsed_time": "18:00:18", "remaining_time": "2 days, 6:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 9627, "loss": 1.7364, "learning_rate": 8.5433131741746e-05, "epoch": 0.24929884699283267, "percentage": 24.93, "elapsed_time": "18:00:44", "remaining_time": "2 days, 6:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2401, "total_steps": 9627, "loss": 1.8304, "learning_rate": 8.542161773918334e-05, "epoch": 0.249402721512413, "percentage": 24.94, "elapsed_time": "18:01:08", "remaining_time": "2 days, 6:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2402, "total_steps": 9627, "loss": 1.7448, "learning_rate": 8.54100999644947e-05, "epoch": 0.24950659603199335, "percentage": 24.95, "elapsed_time": "18:01:35", "remaining_time": "2 days, 6:13:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2403, "total_steps": 9627, "loss": 1.7384, "learning_rate": 8.53985784189066e-05, "epoch": 0.2496104705515737, "percentage": 24.96, "elapsed_time": "18:02:00", "remaining_time": "2 days, 6:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2404, "total_steps": 9627, "loss": 1.8425, "learning_rate": 8.538705310364603e-05, "epoch": 0.24971434507115406, "percentage": 24.97, "elapsed_time": "18:02:26", "remaining_time": "2 days, 6:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2405, "total_steps": 9627, "loss": 1.7596, "learning_rate": 8.537552401994034e-05, "epoch": 0.24981821959073439, "percentage": 24.98, "elapsed_time": "18:02:51", "remaining_time": "2 days, 6:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2406, "total_steps": 9627, "loss": 1.8014, "learning_rate": 8.536399116901728e-05, "epoch": 0.24992209411031474, "percentage": 24.99, "elapsed_time": "18:03:17", "remaining_time": "2 days, 6:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2407, "total_steps": 9627, "loss": 1.5849, "learning_rate": 8.535245455210501e-05, "epoch": 0.25002596862989507, "percentage": 25.0, "elapsed_time": "18:03:43", "remaining_time": "2 days, 6:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2408, "total_steps": 9627, "loss": 1.9111, "learning_rate": 8.534091417043208e-05, "epoch": 0.25012984314947545, "percentage": 25.01, "elapsed_time": "18:04:09", "remaining_time": "2 days, 6:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2409, "total_steps": 9627, "loss": 1.6662, "learning_rate": 8.532937002522747e-05, "epoch": 0.2502337176690558, "percentage": 25.02, "elapsed_time": "18:04:35", "remaining_time": "2 days, 6:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2410, "total_steps": 9627, "loss": 1.5775, "learning_rate": 8.531782211772052e-05, "epoch": 0.2503375921886361, "percentage": 25.03, "elapsed_time": "18:05:00", "remaining_time": "2 days, 6:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2411, "total_steps": 9627, "loss": 1.796, "learning_rate": 8.530627044914101e-05, "epoch": 0.2504414667082165, "percentage": 25.04, "elapsed_time": "18:05:26", "remaining_time": "2 days, 6:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2412, "total_steps": 9627, "loss": 1.8143, "learning_rate": 8.52947150207191e-05, "epoch": 0.2505453412277968, "percentage": 25.05, "elapsed_time": "18:05:52", "remaining_time": "2 days, 6:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2413, "total_steps": 9627, "loss": 1.7078, "learning_rate": 8.528315583368536e-05, "epoch": 0.25064921574737714, "percentage": 25.06, "elapsed_time": "18:06:17", "remaining_time": "2 days, 6:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2414, "total_steps": 9627, "loss": 1.876, "learning_rate": 8.527159288927074e-05, "epoch": 0.2507530902669575, "percentage": 25.08, "elapsed_time": "18:06:42", "remaining_time": "2 days, 6:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2415, "total_steps": 9627, "loss": 1.646, "learning_rate": 8.526002618870659e-05, "epoch": 0.25085696478653785, "percentage": 25.09, "elapsed_time": "18:07:09", "remaining_time": "2 days, 6:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2416, "total_steps": 9627, "loss": 1.8018, "learning_rate": 8.52484557332247e-05, "epoch": 0.25096083930611823, "percentage": 25.1, "elapsed_time": "18:07:34", "remaining_time": "2 days, 6:06:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2417, "total_steps": 9627, "loss": 1.6909, "learning_rate": 8.523688152405722e-05, "epoch": 0.25106471382569856, "percentage": 25.11, "elapsed_time": "18:08:01", "remaining_time": "2 days, 6:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2418, "total_steps": 9627, "loss": 1.6112, "learning_rate": 8.522530356243671e-05, "epoch": 0.2511685883452789, "percentage": 25.12, "elapsed_time": "18:08:25", "remaining_time": "2 days, 6:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2419, "total_steps": 9627, "loss": 1.9221, "learning_rate": 8.521372184959615e-05, "epoch": 0.25127246286485927, "percentage": 25.13, "elapsed_time": "18:08:51", "remaining_time": "2 days, 6:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2420, "total_steps": 9627, "loss": 1.6999, "learning_rate": 8.520213638676889e-05, "epoch": 0.2513763373844396, "percentage": 25.14, "elapsed_time": "18:09:17", "remaining_time": "2 days, 6:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2421, "total_steps": 9627, "loss": 1.8009, "learning_rate": 8.519054717518868e-05, "epoch": 0.2514802119040199, "percentage": 25.15, "elapsed_time": "18:09:43", "remaining_time": "2 days, 6:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2422, "total_steps": 9627, "loss": 1.6935, "learning_rate": 8.517895421608972e-05, "epoch": 0.2515840864236003, "percentage": 25.16, "elapsed_time": "18:10:08", "remaining_time": "2 days, 6:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2423, "total_steps": 9627, "loss": 1.7611, "learning_rate": 8.516735751070652e-05, "epoch": 0.25168796094318063, "percentage": 25.17, "elapsed_time": "18:10:34", "remaining_time": "2 days, 6:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2424, "total_steps": 9627, "loss": 1.7451, "learning_rate": 8.515575706027406e-05, "epoch": 0.25179183546276096, "percentage": 25.18, "elapsed_time": "18:10:59", "remaining_time": "2 days, 6:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2425, "total_steps": 9627, "loss": 1.6652, "learning_rate": 8.514415286602771e-05, "epoch": 0.25189570998234134, "percentage": 25.19, "elapsed_time": "18:11:26", "remaining_time": "2 days, 6:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2426, "total_steps": 9627, "loss": 1.7082, "learning_rate": 8.51325449292032e-05, "epoch": 0.25199958450192167, "percentage": 25.2, "elapsed_time": "18:11:51", "remaining_time": "2 days, 6:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2427, "total_steps": 9627, "loss": 1.6654, "learning_rate": 8.512093325103671e-05, "epoch": 0.25210345902150205, "percentage": 25.21, "elapsed_time": "18:12:17", "remaining_time": "2 days, 6:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2428, "total_steps": 9627, "loss": 1.9137, "learning_rate": 8.510931783276477e-05, "epoch": 0.2522073335410824, "percentage": 25.22, "elapsed_time": "18:12:43", "remaining_time": "2 days, 5:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2429, "total_steps": 9627, "loss": 2.0342, "learning_rate": 8.509769867562436e-05, "epoch": 0.2523112080606627, "percentage": 25.23, "elapsed_time": "18:13:08", "remaining_time": "2 days, 5:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2430, "total_steps": 9627, "loss": 1.7393, "learning_rate": 8.508607578085282e-05, "epoch": 0.2524150825802431, "percentage": 25.24, "elapsed_time": "18:13:35", "remaining_time": "2 days, 5:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2431, "total_steps": 9627, "loss": 1.8187, "learning_rate": 8.507444914968788e-05, "epoch": 0.2525189570998234, "percentage": 25.25, "elapsed_time": "18:14:00", "remaining_time": "2 days, 5:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2432, "total_steps": 9627, "loss": 1.733, "learning_rate": 8.506281878336768e-05, "epoch": 0.25262283161940374, "percentage": 25.26, "elapsed_time": "18:14:25", "remaining_time": "2 days, 5:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2433, "total_steps": 9627, "loss": 1.691, "learning_rate": 8.50511846831308e-05, "epoch": 0.2527267061389841, "percentage": 25.27, "elapsed_time": "18:14:51", "remaining_time": "2 days, 5:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2434, "total_steps": 9627, "loss": 1.7962, "learning_rate": 8.503954685021616e-05, "epoch": 0.25283058065856445, "percentage": 25.28, "elapsed_time": "18:15:16", "remaining_time": "2 days, 5:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2435, "total_steps": 9627, "loss": 1.8226, "learning_rate": 8.50279052858631e-05, "epoch": 0.2529344551781448, "percentage": 25.29, "elapsed_time": "18:15:42", "remaining_time": "2 days, 5:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2436, "total_steps": 9627, "loss": 1.8345, "learning_rate": 8.501625999131134e-05, "epoch": 0.25303832969772516, "percentage": 25.3, "elapsed_time": "18:16:08", "remaining_time": "2 days, 5:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2437, "total_steps": 9627, "loss": 1.6779, "learning_rate": 8.500461096780105e-05, "epoch": 0.2531422042173055, "percentage": 25.31, "elapsed_time": "18:16:32", "remaining_time": "2 days, 5:55:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2438, "total_steps": 9627, "loss": 1.8124, "learning_rate": 8.499295821657273e-05, "epoch": 0.2532460787368858, "percentage": 25.32, "elapsed_time": "18:16:59", "remaining_time": "2 days, 5:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2439, "total_steps": 9627, "loss": 1.9252, "learning_rate": 8.498130173886731e-05, "epoch": 0.2533499532564662, "percentage": 25.33, "elapsed_time": "18:17:25", "remaining_time": "2 days, 5:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2440, "total_steps": 9627, "loss": 1.7423, "learning_rate": 8.496964153592613e-05, "epoch": 0.2534538277760465, "percentage": 25.35, "elapsed_time": "18:17:49", "remaining_time": "2 days, 5:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2441, "total_steps": 9627, "loss": 1.4438, "learning_rate": 8.495797760899088e-05, "epoch": 0.2535577022956269, "percentage": 25.36, "elapsed_time": "18:18:16", "remaining_time": "2 days, 5:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2442, "total_steps": 9627, "loss": 1.5389, "learning_rate": 8.494630995930372e-05, "epoch": 0.25366157681520723, "percentage": 25.37, "elapsed_time": "18:18:41", "remaining_time": "2 days, 5:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2443, "total_steps": 9627, "loss": 1.8215, "learning_rate": 8.493463858810713e-05, "epoch": 0.25376545133478756, "percentage": 25.38, "elapsed_time": "18:19:07", "remaining_time": "2 days, 5:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2444, "total_steps": 9627, "loss": 1.8385, "learning_rate": 8.492296349664401e-05, "epoch": 0.25386932585436794, "percentage": 25.39, "elapsed_time": "18:19:32", "remaining_time": "2 days, 5:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2445, "total_steps": 9627, "loss": 1.642, "learning_rate": 8.491128468615772e-05, "epoch": 0.25397320037394827, "percentage": 25.4, "elapsed_time": "18:19:58", "remaining_time": "2 days, 5:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2446, "total_steps": 9627, "loss": 1.8311, "learning_rate": 8.489960215789192e-05, "epoch": 0.2540770748935286, "percentage": 25.41, "elapsed_time": "18:20:23", "remaining_time": "2 days, 5:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2447, "total_steps": 9627, "loss": 1.7373, "learning_rate": 8.488791591309072e-05, "epoch": 0.254180949413109, "percentage": 25.42, "elapsed_time": "18:20:48", "remaining_time": "2 days, 5:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2448, "total_steps": 9627, "loss": 1.7054, "learning_rate": 8.48762259529986e-05, "epoch": 0.2542848239326893, "percentage": 25.43, "elapsed_time": "18:21:15", "remaining_time": "2 days, 5:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2449, "total_steps": 9627, "loss": 1.6371, "learning_rate": 8.486453227886049e-05, "epoch": 0.25438869845226963, "percentage": 25.44, "elapsed_time": "18:21:40", "remaining_time": "2 days, 5:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 9627, "loss": 1.5869, "learning_rate": 8.485283489192162e-05, "epoch": 0.25449257297185, "percentage": 25.45, "elapsed_time": "18:22:06", "remaining_time": "2 days, 5:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2451, "total_steps": 9627, "loss": 1.5886, "learning_rate": 8.48411337934277e-05, "epoch": 0.25459644749143034, "percentage": 25.46, "elapsed_time": "18:22:31", "remaining_time": "2 days, 5:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2452, "total_steps": 9627, "loss": 1.8044, "learning_rate": 8.48294289846248e-05, "epoch": 0.25470032201101067, "percentage": 25.47, "elapsed_time": "18:22:57", "remaining_time": "2 days, 5:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2453, "total_steps": 9627, "loss": 1.8413, "learning_rate": 8.48177204667594e-05, "epoch": 0.25480419653059105, "percentage": 25.48, "elapsed_time": "18:23:23", "remaining_time": "2 days, 5:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2454, "total_steps": 9627, "loss": 1.6651, "learning_rate": 8.480600824107837e-05, "epoch": 0.2549080710501714, "percentage": 25.49, "elapsed_time": "18:23:47", "remaining_time": "2 days, 5:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2455, "total_steps": 9627, "loss": 1.558, "learning_rate": 8.479429230882893e-05, "epoch": 0.25501194556975176, "percentage": 25.5, "elapsed_time": "18:24:14", "remaining_time": "2 days, 5:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2456, "total_steps": 9627, "loss": 1.7901, "learning_rate": 8.478257267125878e-05, "epoch": 0.2551158200893321, "percentage": 25.51, "elapsed_time": "18:24:40", "remaining_time": "2 days, 5:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2457, "total_steps": 9627, "loss": 1.6559, "learning_rate": 8.477084932961596e-05, "epoch": 0.2552196946089124, "percentage": 25.52, "elapsed_time": "18:25:05", "remaining_time": "2 days, 5:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2458, "total_steps": 9627, "loss": 1.7842, "learning_rate": 8.475912228514889e-05, "epoch": 0.2553235691284928, "percentage": 25.53, "elapsed_time": "18:25:31", "remaining_time": "2 days, 5:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2459, "total_steps": 9627, "loss": 1.6281, "learning_rate": 8.474739153910646e-05, "epoch": 0.2554274436480731, "percentage": 25.54, "elapsed_time": "18:25:56", "remaining_time": "2 days, 5:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2460, "total_steps": 9627, "loss": 1.8031, "learning_rate": 8.473565709273785e-05, "epoch": 0.25553131816765345, "percentage": 25.55, "elapsed_time": "18:26:22", "remaining_time": "2 days, 5:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2461, "total_steps": 9627, "loss": 1.9434, "learning_rate": 8.47239189472927e-05, "epoch": 0.25563519268723384, "percentage": 25.56, "elapsed_time": "18:26:48", "remaining_time": "2 days, 5:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2462, "total_steps": 9627, "loss": 1.8198, "learning_rate": 8.471217710402106e-05, "epoch": 0.25573906720681416, "percentage": 25.57, "elapsed_time": "18:27:13", "remaining_time": "2 days, 5:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2463, "total_steps": 9627, "loss": 1.8017, "learning_rate": 8.470043156417333e-05, "epoch": 0.2558429417263945, "percentage": 25.58, "elapsed_time": "18:27:38", "remaining_time": "2 days, 5:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2464, "total_steps": 9627, "loss": 1.7512, "learning_rate": 8.46886823290003e-05, "epoch": 0.2559468162459749, "percentage": 25.59, "elapsed_time": "18:28:05", "remaining_time": "2 days, 5:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2465, "total_steps": 9627, "loss": 1.9163, "learning_rate": 8.467692939975316e-05, "epoch": 0.2560506907655552, "percentage": 25.61, "elapsed_time": "18:28:31", "remaining_time": "2 days, 5:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2466, "total_steps": 9627, "loss": 1.9303, "learning_rate": 8.466517277768355e-05, "epoch": 0.2561545652851356, "percentage": 25.62, "elapsed_time": "18:28:56", "remaining_time": "2 days, 5:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2467, "total_steps": 9627, "loss": 1.6991, "learning_rate": 8.465341246404345e-05, "epoch": 0.2562584398047159, "percentage": 25.63, "elapsed_time": "18:29:21", "remaining_time": "2 days, 5:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2468, "total_steps": 9627, "loss": 1.7796, "learning_rate": 8.464164846008522e-05, "epoch": 0.25636231432429624, "percentage": 25.64, "elapsed_time": "18:29:47", "remaining_time": "2 days, 5:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2469, "total_steps": 9627, "loss": 1.7226, "learning_rate": 8.462988076706164e-05, "epoch": 0.2564661888438766, "percentage": 25.65, "elapsed_time": "18:30:13", "remaining_time": "2 days, 5:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2470, "total_steps": 9627, "loss": 1.7105, "learning_rate": 8.461810938622589e-05, "epoch": 0.25657006336345695, "percentage": 25.66, "elapsed_time": "18:30:38", "remaining_time": "2 days, 5:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2471, "total_steps": 9627, "loss": 1.6964, "learning_rate": 8.460633431883151e-05, "epoch": 0.2566739378830373, "percentage": 25.67, "elapsed_time": "18:31:04", "remaining_time": "2 days, 5:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2472, "total_steps": 9627, "loss": 1.7889, "learning_rate": 8.459455556613247e-05, "epoch": 0.25677781240261766, "percentage": 25.68, "elapsed_time": "18:31:29", "remaining_time": "2 days, 5:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2473, "total_steps": 9627, "loss": 2.066, "learning_rate": 8.458277312938312e-05, "epoch": 0.256881686922198, "percentage": 25.69, "elapsed_time": "18:31:56", "remaining_time": "2 days, 5:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2474, "total_steps": 9627, "loss": 1.8605, "learning_rate": 8.457098700983818e-05, "epoch": 0.2569855614417783, "percentage": 25.7, "elapsed_time": "18:32:21", "remaining_time": "2 days, 5:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2475, "total_steps": 9627, "loss": 1.8728, "learning_rate": 8.455919720875279e-05, "epoch": 0.2570894359613587, "percentage": 25.71, "elapsed_time": "18:32:47", "remaining_time": "2 days, 5:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2476, "total_steps": 9627, "loss": 1.6178, "learning_rate": 8.454740372738246e-05, "epoch": 0.257193310480939, "percentage": 25.72, "elapsed_time": "18:33:13", "remaining_time": "2 days, 5:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2477, "total_steps": 9627, "loss": 1.5962, "learning_rate": 8.453560656698311e-05, "epoch": 0.25729718500051935, "percentage": 25.73, "elapsed_time": "18:33:38", "remaining_time": "2 days, 5:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2478, "total_steps": 9627, "loss": 1.6725, "learning_rate": 8.452380572881107e-05, "epoch": 0.25740105952009973, "percentage": 25.74, "elapsed_time": "18:34:04", "remaining_time": "2 days, 5:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2479, "total_steps": 9627, "loss": 1.731, "learning_rate": 8.451200121412299e-05, "epoch": 0.25750493403968006, "percentage": 25.75, "elapsed_time": "18:34:29", "remaining_time": "2 days, 5:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2480, "total_steps": 9627, "loss": 1.5419, "learning_rate": 8.4500193024176e-05, "epoch": 0.25760880855926044, "percentage": 25.76, "elapsed_time": "18:34:55", "remaining_time": "2 days, 5:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2481, "total_steps": 9627, "loss": 1.6488, "learning_rate": 8.448838116022758e-05, "epoch": 0.25771268307884077, "percentage": 25.77, "elapsed_time": "18:35:20", "remaining_time": "2 days, 5:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2482, "total_steps": 9627, "loss": 1.8325, "learning_rate": 8.447656562353557e-05, "epoch": 0.2578165575984211, "percentage": 25.78, "elapsed_time": "18:35:46", "remaining_time": "2 days, 5:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2483, "total_steps": 9627, "loss": 1.5927, "learning_rate": 8.446474641535824e-05, "epoch": 0.2579204321180015, "percentage": 25.79, "elapsed_time": "18:36:11", "remaining_time": "2 days, 5:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2484, "total_steps": 9627, "loss": 1.7471, "learning_rate": 8.445292353695427e-05, "epoch": 0.2580243066375818, "percentage": 25.8, "elapsed_time": "18:36:37", "remaining_time": "2 days, 5:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2485, "total_steps": 9627, "loss": 1.7668, "learning_rate": 8.444109698958267e-05, "epoch": 0.25812818115716213, "percentage": 25.81, "elapsed_time": "18:37:03", "remaining_time": "2 days, 5:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2486, "total_steps": 9627, "loss": 1.7104, "learning_rate": 8.44292667745029e-05, "epoch": 0.2582320556767425, "percentage": 25.82, "elapsed_time": "18:37:29", "remaining_time": "2 days, 5:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2487, "total_steps": 9627, "loss": 1.8359, "learning_rate": 8.441743289297476e-05, "epoch": 0.25833593019632284, "percentage": 25.83, "elapsed_time": "18:37:54", "remaining_time": "2 days, 5:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2488, "total_steps": 9627, "loss": 1.6393, "learning_rate": 8.440559534625851e-05, "epoch": 0.25843980471590317, "percentage": 25.84, "elapsed_time": "18:38:20", "remaining_time": "2 days, 5:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2489, "total_steps": 9627, "loss": 1.6612, "learning_rate": 8.439375413561472e-05, "epoch": 0.25854367923548355, "percentage": 25.85, "elapsed_time": "18:38:45", "remaining_time": "2 days, 5:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2490, "total_steps": 9627, "loss": 1.7044, "learning_rate": 8.43819092623044e-05, "epoch": 0.2586475537550639, "percentage": 25.86, "elapsed_time": "18:39:10", "remaining_time": "2 days, 5:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2491, "total_steps": 9627, "loss": 1.608, "learning_rate": 8.437006072758891e-05, "epoch": 0.25875142827464426, "percentage": 25.88, "elapsed_time": "18:39:37", "remaining_time": "2 days, 5:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2492, "total_steps": 9627, "loss": 1.7361, "learning_rate": 8.435820853273007e-05, "epoch": 0.2588553027942246, "percentage": 25.89, "elapsed_time": "18:40:02", "remaining_time": "2 days, 5:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2493, "total_steps": 9627, "loss": 1.799, "learning_rate": 8.434635267899002e-05, "epoch": 0.2589591773138049, "percentage": 25.9, "elapsed_time": "18:40:28", "remaining_time": "2 days, 5:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2494, "total_steps": 9627, "loss": 1.8073, "learning_rate": 8.433449316763133e-05, "epoch": 0.2590630518333853, "percentage": 25.91, "elapsed_time": "18:40:53", "remaining_time": "2 days, 5:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2495, "total_steps": 9627, "loss": 2.0099, "learning_rate": 8.432262999991694e-05, "epoch": 0.2591669263529656, "percentage": 25.92, "elapsed_time": "18:41:19", "remaining_time": "2 days, 5:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2496, "total_steps": 9627, "loss": 1.6813, "learning_rate": 8.431076317711017e-05, "epoch": 0.25927080087254595, "percentage": 25.93, "elapsed_time": "18:41:44", "remaining_time": "2 days, 5:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2497, "total_steps": 9627, "loss": 1.6921, "learning_rate": 8.429889270047475e-05, "epoch": 0.25937467539212633, "percentage": 25.94, "elapsed_time": "18:42:11", "remaining_time": "2 days, 5:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2498, "total_steps": 9627, "loss": 1.8239, "learning_rate": 8.428701857127481e-05, "epoch": 0.25947854991170666, "percentage": 25.95, "elapsed_time": "18:42:36", "remaining_time": "2 days, 5:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2499, "total_steps": 9627, "loss": 1.6058, "learning_rate": 8.427514079077485e-05, "epoch": 0.259582424431287, "percentage": 25.96, "elapsed_time": "18:43:02", "remaining_time": "2 days, 5:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 9627, "loss": 1.8754, "learning_rate": 8.426325936023974e-05, "epoch": 0.25968629895086737, "percentage": 25.97, "elapsed_time": "18:43:28", "remaining_time": "2 days, 5:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2501, "total_steps": 9627, "loss": 1.7336, "learning_rate": 8.425137428093477e-05, "epoch": 0.2597901734704477, "percentage": 25.98, "elapsed_time": "18:43:53", "remaining_time": "2 days, 5:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2502, "total_steps": 9627, "loss": 1.7356, "learning_rate": 8.423948555412562e-05, "epoch": 0.259894047990028, "percentage": 25.99, "elapsed_time": "18:44:19", "remaining_time": "2 days, 5:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2503, "total_steps": 9627, "loss": 1.8169, "learning_rate": 8.422759318107832e-05, "epoch": 0.2599979225096084, "percentage": 26.0, "elapsed_time": "18:44:44", "remaining_time": "2 days, 5:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2504, "total_steps": 9627, "loss": 1.904, "learning_rate": 8.421569716305934e-05, "epoch": 0.26010179702918873, "percentage": 26.01, "elapsed_time": "18:45:10", "remaining_time": "2 days, 5:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2505, "total_steps": 9627, "loss": 1.809, "learning_rate": 8.42037975013355e-05, "epoch": 0.2602056715487691, "percentage": 26.02, "elapsed_time": "18:45:35", "remaining_time": "2 days, 5:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2506, "total_steps": 9627, "loss": 1.7811, "learning_rate": 8.419189419717404e-05, "epoch": 0.26030954606834944, "percentage": 26.03, "elapsed_time": "18:46:01", "remaining_time": "2 days, 5:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2507, "total_steps": 9627, "loss": 1.7371, "learning_rate": 8.417998725184254e-05, "epoch": 0.26041342058792977, "percentage": 26.04, "elapsed_time": "18:46:27", "remaining_time": "2 days, 5:19:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2508, "total_steps": 9627, "loss": 1.719, "learning_rate": 8.416807666660901e-05, "epoch": 0.26051729510751015, "percentage": 26.05, "elapsed_time": "18:46:53", "remaining_time": "2 days, 5:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2509, "total_steps": 9627, "loss": 1.6887, "learning_rate": 8.415616244274185e-05, "epoch": 0.2606211696270905, "percentage": 26.06, "elapsed_time": "18:47:18", "remaining_time": "2 days, 5:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2510, "total_steps": 9627, "loss": 1.7395, "learning_rate": 8.414424458150983e-05, "epoch": 0.2607250441466708, "percentage": 26.07, "elapsed_time": "18:47:44", "remaining_time": "2 days, 5:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2511, "total_steps": 9627, "loss": 1.6363, "learning_rate": 8.413232308418206e-05, "epoch": 0.2608289186662512, "percentage": 26.08, "elapsed_time": "18:48:09", "remaining_time": "2 days, 5:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2512, "total_steps": 9627, "loss": 1.91, "learning_rate": 8.412039795202816e-05, "epoch": 0.2609327931858315, "percentage": 26.09, "elapsed_time": "18:48:36", "remaining_time": "2 days, 5:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2513, "total_steps": 9627, "loss": 1.7341, "learning_rate": 8.4108469186318e-05, "epoch": 0.26103666770541184, "percentage": 26.1, "elapsed_time": "18:49:01", "remaining_time": "2 days, 5:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2514, "total_steps": 9627, "loss": 1.6744, "learning_rate": 8.409653678832194e-05, "epoch": 0.2611405422249922, "percentage": 26.11, "elapsed_time": "18:49:26", "remaining_time": "2 days, 5:15:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2515, "total_steps": 9627, "loss": 1.6597, "learning_rate": 8.408460075931068e-05, "epoch": 0.26124441674457255, "percentage": 26.12, "elapsed_time": "18:49:53", "remaining_time": "2 days, 5:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2516, "total_steps": 9627, "loss": 1.6995, "learning_rate": 8.407266110055531e-05, "epoch": 0.2613482912641529, "percentage": 26.13, "elapsed_time": "18:50:18", "remaining_time": "2 days, 5:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2517, "total_steps": 9627, "loss": 1.657, "learning_rate": 8.40607178133273e-05, "epoch": 0.26145216578373326, "percentage": 26.15, "elapsed_time": "18:50:44", "remaining_time": "2 days, 5:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2518, "total_steps": 9627, "loss": 1.7071, "learning_rate": 8.404877089889853e-05, "epoch": 0.2615560403033136, "percentage": 26.16, "elapsed_time": "18:51:09", "remaining_time": "2 days, 5:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2519, "total_steps": 9627, "loss": 1.5713, "learning_rate": 8.403682035854125e-05, "epoch": 0.26165991482289397, "percentage": 26.17, "elapsed_time": "18:51:35", "remaining_time": "2 days, 5:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2520, "total_steps": 9627, "loss": 1.6968, "learning_rate": 8.40248661935281e-05, "epoch": 0.2617637893424743, "percentage": 26.18, "elapsed_time": "18:52:01", "remaining_time": "2 days, 5:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2521, "total_steps": 9627, "loss": 1.5176, "learning_rate": 8.40129084051321e-05, "epoch": 0.2618676638620546, "percentage": 26.19, "elapsed_time": "18:52:26", "remaining_time": "2 days, 5:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2522, "total_steps": 9627, "loss": 1.84, "learning_rate": 8.400094699462667e-05, "epoch": 0.261971538381635, "percentage": 26.2, "elapsed_time": "18:52:52", "remaining_time": "2 days, 5:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2523, "total_steps": 9627, "loss": 1.818, "learning_rate": 8.398898196328561e-05, "epoch": 0.26207541290121533, "percentage": 26.21, "elapsed_time": "18:53:17", "remaining_time": "2 days, 5:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2524, "total_steps": 9627, "loss": 1.764, "learning_rate": 8.39770133123831e-05, "epoch": 0.26217928742079566, "percentage": 26.22, "elapsed_time": "18:53:44", "remaining_time": "2 days, 5:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2525, "total_steps": 9627, "loss": 1.8256, "learning_rate": 8.396504104319366e-05, "epoch": 0.26228316194037604, "percentage": 26.23, "elapsed_time": "18:54:09", "remaining_time": "2 days, 5:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2526, "total_steps": 9627, "loss": 1.5408, "learning_rate": 8.395306515699234e-05, "epoch": 0.26238703645995637, "percentage": 26.24, "elapsed_time": "18:54:35", "remaining_time": "2 days, 5:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2527, "total_steps": 9627, "loss": 1.6385, "learning_rate": 8.394108565505441e-05, "epoch": 0.2624909109795367, "percentage": 26.25, "elapsed_time": "18:55:01", "remaining_time": "2 days, 5:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2528, "total_steps": 9627, "loss": 1.6302, "learning_rate": 8.392910253865557e-05, "epoch": 0.2625947854991171, "percentage": 26.26, "elapsed_time": "18:55:26", "remaining_time": "2 days, 5:08:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2529, "total_steps": 9627, "loss": 1.8292, "learning_rate": 8.391711580907202e-05, "epoch": 0.2626986600186974, "percentage": 26.27, "elapsed_time": "18:55:52", "remaining_time": "2 days, 5:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2530, "total_steps": 9627, "loss": 1.8284, "learning_rate": 8.390512546758016e-05, "epoch": 0.2628025345382778, "percentage": 26.28, "elapsed_time": "18:56:17", "remaining_time": "2 days, 5:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2531, "total_steps": 9627, "loss": 1.8026, "learning_rate": 8.389313151545694e-05, "epoch": 0.2629064090578581, "percentage": 26.29, "elapsed_time": "18:56:43", "remaining_time": "2 days, 5:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2532, "total_steps": 9627, "loss": 1.7194, "learning_rate": 8.388113395397957e-05, "epoch": 0.26301028357743844, "percentage": 26.3, "elapsed_time": "18:57:09", "remaining_time": "2 days, 5:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2533, "total_steps": 9627, "loss": 1.703, "learning_rate": 8.386913278442571e-05, "epoch": 0.2631141580970188, "percentage": 26.31, "elapsed_time": "18:57:34", "remaining_time": "2 days, 5:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2534, "total_steps": 9627, "loss": 1.8659, "learning_rate": 8.385712800807343e-05, "epoch": 0.26321803261659915, "percentage": 26.32, "elapsed_time": "18:57:59", "remaining_time": "2 days, 5:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2535, "total_steps": 9627, "loss": 1.8752, "learning_rate": 8.38451196262011e-05, "epoch": 0.2633219071361795, "percentage": 26.33, "elapsed_time": "18:58:25", "remaining_time": "2 days, 5:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2536, "total_steps": 9627, "loss": 1.765, "learning_rate": 8.383310764008751e-05, "epoch": 0.26342578165575986, "percentage": 26.34, "elapsed_time": "18:58:50", "remaining_time": "2 days, 5:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2537, "total_steps": 9627, "loss": 1.6668, "learning_rate": 8.382109205101188e-05, "epoch": 0.2635296561753402, "percentage": 26.35, "elapsed_time": "18:59:16", "remaining_time": "2 days, 5:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2538, "total_steps": 9627, "loss": 1.6682, "learning_rate": 8.380907286025377e-05, "epoch": 0.2636335306949205, "percentage": 26.36, "elapsed_time": "18:59:41", "remaining_time": "2 days, 5:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2539, "total_steps": 9627, "loss": 1.6501, "learning_rate": 8.37970500690931e-05, "epoch": 0.2637374052145009, "percentage": 26.37, "elapsed_time": "19:00:06", "remaining_time": "2 days, 5:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2540, "total_steps": 9627, "loss": 1.6854, "learning_rate": 8.378502367881025e-05, "epoch": 0.2638412797340812, "percentage": 26.38, "elapsed_time": "19:00:32", "remaining_time": "2 days, 5:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2541, "total_steps": 9627, "loss": 1.8676, "learning_rate": 8.37729936906859e-05, "epoch": 0.26394515425366155, "percentage": 26.39, "elapsed_time": "19:00:58", "remaining_time": "2 days, 5:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2542, "total_steps": 9627, "loss": 1.7777, "learning_rate": 8.376096010600116e-05, "epoch": 0.26404902877324193, "percentage": 26.4, "elapsed_time": "19:01:23", "remaining_time": "2 days, 5:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2543, "total_steps": 9627, "loss": 1.7512, "learning_rate": 8.374892292603751e-05, "epoch": 0.26415290329282226, "percentage": 26.42, "elapsed_time": "19:01:49", "remaining_time": "2 days, 5:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2544, "total_steps": 9627, "loss": 1.7389, "learning_rate": 8.373688215207682e-05, "epoch": 0.26425677781240264, "percentage": 26.43, "elapsed_time": "19:02:14", "remaining_time": "2 days, 5:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2545, "total_steps": 9627, "loss": 1.9784, "learning_rate": 8.372483778540134e-05, "epoch": 0.26436065233198297, "percentage": 26.44, "elapsed_time": "19:02:40", "remaining_time": "2 days, 4:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2546, "total_steps": 9627, "loss": 1.8175, "learning_rate": 8.371278982729371e-05, "epoch": 0.2644645268515633, "percentage": 26.45, "elapsed_time": "19:03:06", "remaining_time": "2 days, 4:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2547, "total_steps": 9627, "loss": 1.8014, "learning_rate": 8.370073827903693e-05, "epoch": 0.2645684013711437, "percentage": 26.46, "elapsed_time": "19:03:31", "remaining_time": "2 days, 4:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2548, "total_steps": 9627, "loss": 1.8389, "learning_rate": 8.368868314191439e-05, "epoch": 0.264672275890724, "percentage": 26.47, "elapsed_time": "19:03:57", "remaining_time": "2 days, 4:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2549, "total_steps": 9627, "loss": 1.7975, "learning_rate": 8.367662441720989e-05, "epoch": 0.26477615041030433, "percentage": 26.48, "elapsed_time": "19:04:23", "remaining_time": "2 days, 4:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 9627, "loss": 1.7531, "learning_rate": 8.366456210620757e-05, "epoch": 0.2648800249298847, "percentage": 26.49, "elapsed_time": "19:04:48", "remaining_time": "2 days, 4:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2551, "total_steps": 9627, "loss": 1.6416, "learning_rate": 8.365249621019197e-05, "epoch": 0.26498389944946504, "percentage": 26.5, "elapsed_time": "19:05:14", "remaining_time": "2 days, 4:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2552, "total_steps": 9627, "loss": 1.775, "learning_rate": 8.364042673044803e-05, "epoch": 0.26508777396904537, "percentage": 26.51, "elapsed_time": "19:05:40", "remaining_time": "2 days, 4:56:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2553, "total_steps": 9627, "loss": 1.6302, "learning_rate": 8.362835366826105e-05, "epoch": 0.26519164848862575, "percentage": 26.52, "elapsed_time": "19:06:05", "remaining_time": "2 days, 4:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2554, "total_steps": 9627, "loss": 1.8325, "learning_rate": 8.361627702491673e-05, "epoch": 0.2652955230082061, "percentage": 26.53, "elapsed_time": "19:06:31", "remaining_time": "2 days, 4:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2555, "total_steps": 9627, "loss": 1.6433, "learning_rate": 8.360419680170111e-05, "epoch": 0.2653993975277864, "percentage": 26.54, "elapsed_time": "19:06:57", "remaining_time": "2 days, 4:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2556, "total_steps": 9627, "loss": 1.5261, "learning_rate": 8.359211299990064e-05, "epoch": 0.2655032720473668, "percentage": 26.55, "elapsed_time": "19:07:23", "remaining_time": "2 days, 4:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2557, "total_steps": 9627, "loss": 1.7036, "learning_rate": 8.358002562080219e-05, "epoch": 0.2656071465669471, "percentage": 26.56, "elapsed_time": "19:07:47", "remaining_time": "2 days, 4:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2558, "total_steps": 9627, "loss": 1.801, "learning_rate": 8.356793466569293e-05, "epoch": 0.2657110210865275, "percentage": 26.57, "elapsed_time": "19:08:14", "remaining_time": "2 days, 4:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2559, "total_steps": 9627, "loss": 2.0989, "learning_rate": 8.355584013586047e-05, "epoch": 0.2658148956061078, "percentage": 26.58, "elapsed_time": "19:08:39", "remaining_time": "2 days, 4:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2560, "total_steps": 9627, "loss": 1.8125, "learning_rate": 8.354374203259278e-05, "epoch": 0.26591877012568815, "percentage": 26.59, "elapsed_time": "19:09:05", "remaining_time": "2 days, 4:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2561, "total_steps": 9627, "loss": 1.6731, "learning_rate": 8.353164035717822e-05, "epoch": 0.26602264464526854, "percentage": 26.6, "elapsed_time": "19:09:30", "remaining_time": "2 days, 4:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2562, "total_steps": 9627, "loss": 1.7634, "learning_rate": 8.351953511090551e-05, "epoch": 0.26612651916484886, "percentage": 26.61, "elapsed_time": "19:09:56", "remaining_time": "2 days, 4:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2563, "total_steps": 9627, "loss": 1.8874, "learning_rate": 8.350742629506378e-05, "epoch": 0.2662303936844292, "percentage": 26.62, "elapsed_time": "19:10:22", "remaining_time": "2 days, 4:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2564, "total_steps": 9627, "loss": 1.7228, "learning_rate": 8.349531391094251e-05, "epoch": 0.26633426820400957, "percentage": 26.63, "elapsed_time": "19:10:47", "remaining_time": "2 days, 4:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2565, "total_steps": 9627, "loss": 1.6236, "learning_rate": 8.34831979598316e-05, "epoch": 0.2664381427235899, "percentage": 26.64, "elapsed_time": "19:11:13", "remaining_time": "2 days, 4:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2566, "total_steps": 9627, "loss": 1.8109, "learning_rate": 8.347107844302129e-05, "epoch": 0.2665420172431702, "percentage": 26.65, "elapsed_time": "19:11:38", "remaining_time": "2 days, 4:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2567, "total_steps": 9627, "loss": 1.7463, "learning_rate": 8.345895536180219e-05, "epoch": 0.2666458917627506, "percentage": 26.66, "elapsed_time": "19:12:05", "remaining_time": "2 days, 4:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2568, "total_steps": 9627, "loss": 1.8362, "learning_rate": 8.344682871746534e-05, "epoch": 0.26674976628233094, "percentage": 26.67, "elapsed_time": "19:12:30", "remaining_time": "2 days, 4:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2569, "total_steps": 9627, "loss": 1.845, "learning_rate": 8.343469851130212e-05, "epoch": 0.2668536408019113, "percentage": 26.69, "elapsed_time": "19:12:56", "remaining_time": "2 days, 4:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2570, "total_steps": 9627, "loss": 1.6763, "learning_rate": 8.342256474460431e-05, "epoch": 0.26695751532149165, "percentage": 26.7, "elapsed_time": "19:13:21", "remaining_time": "2 days, 4:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2571, "total_steps": 9627, "loss": 1.8428, "learning_rate": 8.341042741866408e-05, "epoch": 0.26706138984107197, "percentage": 26.71, "elapsed_time": "19:13:47", "remaining_time": "2 days, 4:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2572, "total_steps": 9627, "loss": 1.5346, "learning_rate": 8.339828653477391e-05, "epoch": 0.26716526436065235, "percentage": 26.72, "elapsed_time": "19:14:11", "remaining_time": "2 days, 4:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2573, "total_steps": 9627, "loss": 1.7763, "learning_rate": 8.338614209422677e-05, "epoch": 0.2672691388802327, "percentage": 26.73, "elapsed_time": "19:14:39", "remaining_time": "2 days, 4:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2574, "total_steps": 9627, "loss": 1.9153, "learning_rate": 8.33739940983159e-05, "epoch": 0.267373013399813, "percentage": 26.74, "elapsed_time": "19:15:03", "remaining_time": "2 days, 4:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2575, "total_steps": 9627, "loss": 1.4252, "learning_rate": 8.336184254833499e-05, "epoch": 0.2674768879193934, "percentage": 26.75, "elapsed_time": "19:15:30", "remaining_time": "2 days, 4:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2576, "total_steps": 9627, "loss": 1.8131, "learning_rate": 8.33496874455781e-05, "epoch": 0.2675807624389737, "percentage": 26.76, "elapsed_time": "19:15:55", "remaining_time": "2 days, 4:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2577, "total_steps": 9627, "loss": 1.769, "learning_rate": 8.33375287913396e-05, "epoch": 0.26768463695855405, "percentage": 26.77, "elapsed_time": "19:16:20", "remaining_time": "2 days, 4:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2578, "total_steps": 9627, "loss": 1.806, "learning_rate": 8.332536658691435e-05, "epoch": 0.26778851147813443, "percentage": 26.78, "elapsed_time": "19:16:47", "remaining_time": "2 days, 4:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2579, "total_steps": 9627, "loss": 1.8308, "learning_rate": 8.331320083359751e-05, "epoch": 0.26789238599771475, "percentage": 26.79, "elapsed_time": "19:17:12", "remaining_time": "2 days, 4:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2580, "total_steps": 9627, "loss": 1.6708, "learning_rate": 8.330103153268462e-05, "epoch": 0.2679962605172951, "percentage": 26.8, "elapsed_time": "19:17:38", "remaining_time": "2 days, 4:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2581, "total_steps": 9627, "loss": 1.6567, "learning_rate": 8.328885868547164e-05, "epoch": 0.26810013503687546, "percentage": 26.81, "elapsed_time": "19:18:03", "remaining_time": "2 days, 4:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2582, "total_steps": 9627, "loss": 1.9518, "learning_rate": 8.327668229325487e-05, "epoch": 0.2682040095564558, "percentage": 26.82, "elapsed_time": "19:18:29", "remaining_time": "2 days, 4:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2583, "total_steps": 9627, "loss": 1.8429, "learning_rate": 8.326450235733098e-05, "epoch": 0.2683078840760362, "percentage": 26.83, "elapsed_time": "19:18:54", "remaining_time": "2 days, 4:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2584, "total_steps": 9627, "loss": 1.5773, "learning_rate": 8.32523188789971e-05, "epoch": 0.2684117585956165, "percentage": 26.84, "elapsed_time": "19:19:20", "remaining_time": "2 days, 4:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2585, "total_steps": 9627, "loss": 1.685, "learning_rate": 8.324013185955062e-05, "epoch": 0.26851563311519683, "percentage": 26.85, "elapsed_time": "19:19:45", "remaining_time": "2 days, 4:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2586, "total_steps": 9627, "loss": 1.8974, "learning_rate": 8.322794130028938e-05, "epoch": 0.2686195076347772, "percentage": 26.86, "elapsed_time": "19:20:12", "remaining_time": "2 days, 4:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2587, "total_steps": 9627, "loss": 1.6507, "learning_rate": 8.321574720251158e-05, "epoch": 0.26872338215435754, "percentage": 26.87, "elapsed_time": "19:20:37", "remaining_time": "2 days, 4:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2588, "total_steps": 9627, "loss": 1.7104, "learning_rate": 8.32035495675158e-05, "epoch": 0.26882725667393786, "percentage": 26.88, "elapsed_time": "19:21:03", "remaining_time": "2 days, 4:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2589, "total_steps": 9627, "loss": 1.6052, "learning_rate": 8.3191348396601e-05, "epoch": 0.26893113119351825, "percentage": 26.89, "elapsed_time": "19:21:28", "remaining_time": "2 days, 4:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2590, "total_steps": 9627, "loss": 1.9357, "learning_rate": 8.317914369106648e-05, "epoch": 0.2690350057130986, "percentage": 26.9, "elapsed_time": "19:21:54", "remaining_time": "2 days, 4:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2591, "total_steps": 9627, "loss": 1.7948, "learning_rate": 8.316693545221196e-05, "epoch": 0.2691388802326789, "percentage": 26.91, "elapsed_time": "19:22:19", "remaining_time": "2 days, 4:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2592, "total_steps": 9627, "loss": 1.6696, "learning_rate": 8.315472368133754e-05, "epoch": 0.2692427547522593, "percentage": 26.92, "elapsed_time": "19:22:46", "remaining_time": "2 days, 4:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2593, "total_steps": 9627, "loss": 1.8025, "learning_rate": 8.314250837974364e-05, "epoch": 0.2693466292718396, "percentage": 26.93, "elapsed_time": "19:23:11", "remaining_time": "2 days, 4:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2594, "total_steps": 9627, "loss": 1.725, "learning_rate": 8.313028954873114e-05, "epoch": 0.26945050379141994, "percentage": 26.95, "elapsed_time": "19:23:37", "remaining_time": "2 days, 4:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2595, "total_steps": 9627, "loss": 1.5303, "learning_rate": 8.311806718960124e-05, "epoch": 0.2695543783110003, "percentage": 26.96, "elapsed_time": "19:24:02", "remaining_time": "2 days, 4:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2596, "total_steps": 9627, "loss": 1.9351, "learning_rate": 8.310584130365551e-05, "epoch": 0.26965825283058065, "percentage": 26.97, "elapsed_time": "19:24:28", "remaining_time": "2 days, 4:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2597, "total_steps": 9627, "loss": 1.6705, "learning_rate": 8.309361189219589e-05, "epoch": 0.26976212735016103, "percentage": 26.98, "elapsed_time": "19:24:53", "remaining_time": "2 days, 4:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2598, "total_steps": 9627, "loss": 1.7879, "learning_rate": 8.308137895652477e-05, "epoch": 0.26986600186974136, "percentage": 26.99, "elapsed_time": "19:25:20", "remaining_time": "2 days, 4:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2599, "total_steps": 9627, "loss": 1.7799, "learning_rate": 8.306914249794483e-05, "epoch": 0.2699698763893217, "percentage": 27.0, "elapsed_time": "19:25:45", "remaining_time": "2 days, 4:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 9627, "loss": 1.6268, "learning_rate": 8.305690251775915e-05, "epoch": 0.27007375090890207, "percentage": 27.01, "elapsed_time": "19:26:11", "remaining_time": "2 days, 4:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2601, "total_steps": 9627, "loss": 1.7004, "learning_rate": 8.304465901727123e-05, "epoch": 0.2701776254284824, "percentage": 27.02, "elapsed_time": "19:26:37", "remaining_time": "2 days, 4:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2602, "total_steps": 9627, "loss": 1.7739, "learning_rate": 8.303241199778486e-05, "epoch": 0.2702814999480627, "percentage": 27.03, "elapsed_time": "19:27:02", "remaining_time": "2 days, 4:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2603, "total_steps": 9627, "loss": 1.5496, "learning_rate": 8.30201614606043e-05, "epoch": 0.2703853744676431, "percentage": 27.04, "elapsed_time": "19:27:27", "remaining_time": "2 days, 4:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2604, "total_steps": 9627, "loss": 1.7503, "learning_rate": 8.300790740703409e-05, "epoch": 0.27048924898722343, "percentage": 27.05, "elapsed_time": "19:27:53", "remaining_time": "2 days, 4:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2605, "total_steps": 9627, "loss": 1.7856, "learning_rate": 8.299564983837922e-05, "epoch": 0.27059312350680376, "percentage": 27.06, "elapsed_time": "19:28:18", "remaining_time": "2 days, 4:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2606, "total_steps": 9627, "loss": 1.7488, "learning_rate": 8.298338875594501e-05, "epoch": 0.27069699802638414, "percentage": 27.07, "elapsed_time": "19:28:44", "remaining_time": "2 days, 4:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2607, "total_steps": 9627, "loss": 1.6934, "learning_rate": 8.29711241610372e-05, "epoch": 0.27080087254596447, "percentage": 27.08, "elapsed_time": "19:29:10", "remaining_time": "2 days, 4:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2608, "total_steps": 9627, "loss": 1.785, "learning_rate": 8.295885605496184e-05, "epoch": 0.27090474706554485, "percentage": 27.09, "elapsed_time": "19:29:35", "remaining_time": "2 days, 4:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2609, "total_steps": 9627, "loss": 1.7482, "learning_rate": 8.294658443902539e-05, "epoch": 0.2710086215851252, "percentage": 27.1, "elapsed_time": "19:30:00", "remaining_time": "2 days, 4:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2610, "total_steps": 9627, "loss": 1.7077, "learning_rate": 8.29343093145347e-05, "epoch": 0.2711124961047055, "percentage": 27.11, "elapsed_time": "19:30:26", "remaining_time": "2 days, 4:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2611, "total_steps": 9627, "loss": 1.8574, "learning_rate": 8.292203068279695e-05, "epoch": 0.2712163706242859, "percentage": 27.12, "elapsed_time": "19:30:52", "remaining_time": "2 days, 4:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2612, "total_steps": 9627, "loss": 1.7988, "learning_rate": 8.290974854511974e-05, "epoch": 0.2713202451438662, "percentage": 27.13, "elapsed_time": "19:31:17", "remaining_time": "2 days, 4:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2613, "total_steps": 9627, "loss": 1.6488, "learning_rate": 8.289746290281104e-05, "epoch": 0.27142411966344654, "percentage": 27.14, "elapsed_time": "19:31:43", "remaining_time": "2 days, 4:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2614, "total_steps": 9627, "loss": 1.8813, "learning_rate": 8.288517375717913e-05, "epoch": 0.2715279941830269, "percentage": 27.15, "elapsed_time": "19:32:08", "remaining_time": "2 days, 4:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2615, "total_steps": 9627, "loss": 1.4855, "learning_rate": 8.287288110953274e-05, "epoch": 0.27163186870260725, "percentage": 27.16, "elapsed_time": "19:32:35", "remaining_time": "2 days, 4:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2616, "total_steps": 9627, "loss": 1.921, "learning_rate": 8.286058496118091e-05, "epoch": 0.2717357432221876, "percentage": 27.17, "elapsed_time": "19:32:59", "remaining_time": "2 days, 4:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2617, "total_steps": 9627, "loss": 1.6206, "learning_rate": 8.284828531343312e-05, "epoch": 0.27183961774176796, "percentage": 27.18, "elapsed_time": "19:33:25", "remaining_time": "2 days, 4:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2618, "total_steps": 9627, "loss": 1.8668, "learning_rate": 8.283598216759915e-05, "epoch": 0.2719434922613483, "percentage": 27.19, "elapsed_time": "19:33:51", "remaining_time": "2 days, 4:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2619, "total_steps": 9627, "loss": 1.6809, "learning_rate": 8.282367552498925e-05, "epoch": 0.2720473667809286, "percentage": 27.2, "elapsed_time": "19:34:16", "remaining_time": "2 days, 4:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2620, "total_steps": 9627, "loss": 1.922, "learning_rate": 8.28113653869139e-05, "epoch": 0.272151241300509, "percentage": 27.22, "elapsed_time": "19:34:42", "remaining_time": "2 days, 4:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2621, "total_steps": 9627, "loss": 1.8944, "learning_rate": 8.27990517546841e-05, "epoch": 0.2722551158200893, "percentage": 27.23, "elapsed_time": "19:35:08", "remaining_time": "2 days, 4:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2622, "total_steps": 9627, "loss": 1.8936, "learning_rate": 8.278673462961112e-05, "epoch": 0.2723589903396697, "percentage": 27.24, "elapsed_time": "19:35:34", "remaining_time": "2 days, 4:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2623, "total_steps": 9627, "loss": 1.9192, "learning_rate": 8.277441401300665e-05, "epoch": 0.27246286485925003, "percentage": 27.25, "elapsed_time": "19:35:59", "remaining_time": "2 days, 4:20:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2624, "total_steps": 9627, "loss": 1.6761, "learning_rate": 8.276208990618274e-05, "epoch": 0.27256673937883036, "percentage": 27.26, "elapsed_time": "19:36:24", "remaining_time": "2 days, 4:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2625, "total_steps": 9627, "loss": 1.7843, "learning_rate": 8.27497623104518e-05, "epoch": 0.27267061389841074, "percentage": 27.27, "elapsed_time": "19:36:51", "remaining_time": "2 days, 4:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2626, "total_steps": 9627, "loss": 1.5891, "learning_rate": 8.273743122712664e-05, "epoch": 0.27277448841799107, "percentage": 27.28, "elapsed_time": "19:37:16", "remaining_time": "2 days, 4:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2627, "total_steps": 9627, "loss": 1.793, "learning_rate": 8.272509665752041e-05, "epoch": 0.2728783629375714, "percentage": 27.29, "elapsed_time": "19:37:41", "remaining_time": "2 days, 4:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2628, "total_steps": 9627, "loss": 1.9712, "learning_rate": 8.271275860294667e-05, "epoch": 0.2729822374571518, "percentage": 27.3, "elapsed_time": "19:38:07", "remaining_time": "2 days, 4:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2629, "total_steps": 9627, "loss": 1.6459, "learning_rate": 8.27004170647193e-05, "epoch": 0.2730861119767321, "percentage": 27.31, "elapsed_time": "19:38:33", "remaining_time": "2 days, 4:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2630, "total_steps": 9627, "loss": 1.6445, "learning_rate": 8.268807204415258e-05, "epoch": 0.27318998649631243, "percentage": 27.32, "elapsed_time": "19:38:58", "remaining_time": "2 days, 4:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2631, "total_steps": 9627, "loss": 1.6357, "learning_rate": 8.267572354256117e-05, "epoch": 0.2732938610158928, "percentage": 27.33, "elapsed_time": "19:39:24", "remaining_time": "2 days, 4:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2632, "total_steps": 9627, "loss": 1.7254, "learning_rate": 8.266337156126008e-05, "epoch": 0.27339773553547314, "percentage": 27.34, "elapsed_time": "19:39:49", "remaining_time": "2 days, 4:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2633, "total_steps": 9627, "loss": 1.7073, "learning_rate": 8.26510161015647e-05, "epoch": 0.27350161005505347, "percentage": 27.35, "elapsed_time": "19:40:14", "remaining_time": "2 days, 4:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2634, "total_steps": 9627, "loss": 1.8689, "learning_rate": 8.263865716479078e-05, "epoch": 0.27360548457463385, "percentage": 27.36, "elapsed_time": "19:40:40", "remaining_time": "2 days, 4:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2635, "total_steps": 9627, "loss": 1.8721, "learning_rate": 8.262629475225448e-05, "epoch": 0.2737093590942142, "percentage": 27.37, "elapsed_time": "19:41:05", "remaining_time": "2 days, 4:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2636, "total_steps": 9627, "loss": 1.7335, "learning_rate": 8.261392886527229e-05, "epoch": 0.27381323361379456, "percentage": 27.38, "elapsed_time": "19:41:32", "remaining_time": "2 days, 4:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2637, "total_steps": 9627, "loss": 1.8539, "learning_rate": 8.260155950516106e-05, "epoch": 0.2739171081333749, "percentage": 27.39, "elapsed_time": "19:41:57", "remaining_time": "2 days, 4:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2638, "total_steps": 9627, "loss": 1.6214, "learning_rate": 8.258918667323806e-05, "epoch": 0.2740209826529552, "percentage": 27.4, "elapsed_time": "19:42:22", "remaining_time": "2 days, 4:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2639, "total_steps": 9627, "loss": 1.7361, "learning_rate": 8.257681037082085e-05, "epoch": 0.2741248571725356, "percentage": 27.41, "elapsed_time": "19:42:47", "remaining_time": "2 days, 4:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2640, "total_steps": 9627, "loss": 1.8081, "learning_rate": 8.256443059922749e-05, "epoch": 0.2742287316921159, "percentage": 27.42, "elapsed_time": "19:43:14", "remaining_time": "2 days, 4:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2641, "total_steps": 9627, "loss": 1.7, "learning_rate": 8.255204735977626e-05, "epoch": 0.27433260621169625, "percentage": 27.43, "elapsed_time": "19:43:38", "remaining_time": "2 days, 4:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2642, "total_steps": 9627, "loss": 1.5137, "learning_rate": 8.25396606537859e-05, "epoch": 0.27443648073127663, "percentage": 27.44, "elapsed_time": "19:44:05", "remaining_time": "2 days, 4:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2643, "total_steps": 9627, "loss": 1.7127, "learning_rate": 8.252727048257551e-05, "epoch": 0.27454035525085696, "percentage": 27.45, "elapsed_time": "19:44:31", "remaining_time": "2 days, 4:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2644, "total_steps": 9627, "loss": 1.8356, "learning_rate": 8.251487684746453e-05, "epoch": 0.2746442297704373, "percentage": 27.46, "elapsed_time": "19:44:56", "remaining_time": "2 days, 4:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2645, "total_steps": 9627, "loss": 1.6803, "learning_rate": 8.250247974977279e-05, "epoch": 0.27474810429001767, "percentage": 27.47, "elapsed_time": "19:45:22", "remaining_time": "2 days, 4:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2646, "total_steps": 9627, "loss": 1.7868, "learning_rate": 8.249007919082048e-05, "epoch": 0.274851978809598, "percentage": 27.49, "elapsed_time": "19:45:47", "remaining_time": "2 days, 4:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2647, "total_steps": 9627, "loss": 1.8521, "learning_rate": 8.247767517192818e-05, "epoch": 0.2749558533291784, "percentage": 27.5, "elapsed_time": "19:46:12", "remaining_time": "2 days, 4:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2648, "total_steps": 9627, "loss": 1.7785, "learning_rate": 8.246526769441681e-05, "epoch": 0.2750597278487587, "percentage": 27.51, "elapsed_time": "19:46:39", "remaining_time": "2 days, 4:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2649, "total_steps": 9627, "loss": 1.8763, "learning_rate": 8.245285675960767e-05, "epoch": 0.27516360236833903, "percentage": 27.52, "elapsed_time": "19:47:04", "remaining_time": "2 days, 4:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 9627, "loss": 1.4576, "learning_rate": 8.244044236882242e-05, "epoch": 0.2752674768879194, "percentage": 27.53, "elapsed_time": "19:47:29", "remaining_time": "2 days, 4:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2651, "total_steps": 9627, "loss": 1.7468, "learning_rate": 8.24280245233831e-05, "epoch": 0.27537135140749974, "percentage": 27.54, "elapsed_time": "19:47:55", "remaining_time": "2 days, 4:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2652, "total_steps": 9627, "loss": 1.92, "learning_rate": 8.241560322461212e-05, "epoch": 0.27547522592708007, "percentage": 27.55, "elapsed_time": "19:48:20", "remaining_time": "2 days, 4:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2653, "total_steps": 9627, "loss": 1.6042, "learning_rate": 8.240317847383226e-05, "epoch": 0.27557910044666045, "percentage": 27.56, "elapsed_time": "19:48:47", "remaining_time": "2 days, 4:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2654, "total_steps": 9627, "loss": 1.8099, "learning_rate": 8.239075027236663e-05, "epoch": 0.2756829749662408, "percentage": 27.57, "elapsed_time": "19:49:11", "remaining_time": "2 days, 4:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2655, "total_steps": 9627, "loss": 1.7363, "learning_rate": 8.237831862153877e-05, "epoch": 0.2757868494858211, "percentage": 27.58, "elapsed_time": "19:49:37", "remaining_time": "2 days, 4:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2656, "total_steps": 9627, "loss": 1.8691, "learning_rate": 8.236588352267252e-05, "epoch": 0.2758907240054015, "percentage": 27.59, "elapsed_time": "19:50:03", "remaining_time": "2 days, 4:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2657, "total_steps": 9627, "loss": 1.8538, "learning_rate": 8.235344497709214e-05, "epoch": 0.2759945985249818, "percentage": 27.6, "elapsed_time": "19:50:29", "remaining_time": "2 days, 4:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2658, "total_steps": 9627, "loss": 1.28, "learning_rate": 8.234100298612226e-05, "epoch": 0.27609847304456214, "percentage": 27.61, "elapsed_time": "19:50:54", "remaining_time": "2 days, 4:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2659, "total_steps": 9627, "loss": 1.9326, "learning_rate": 8.23285575510878e-05, "epoch": 0.2762023475641425, "percentage": 27.62, "elapsed_time": "19:51:20", "remaining_time": "2 days, 4:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2660, "total_steps": 9627, "loss": 1.7221, "learning_rate": 8.231610867331415e-05, "epoch": 0.27630622208372285, "percentage": 27.63, "elapsed_time": "19:51:46", "remaining_time": "2 days, 4:01:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2661, "total_steps": 9627, "loss": 1.9031, "learning_rate": 8.2303656354127e-05, "epoch": 0.27641009660330323, "percentage": 27.64, "elapsed_time": "19:52:11", "remaining_time": "2 days, 4:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2662, "total_steps": 9627, "loss": 1.6825, "learning_rate": 8.229120059485243e-05, "epoch": 0.27651397112288356, "percentage": 27.65, "elapsed_time": "19:52:36", "remaining_time": "2 days, 4:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2663, "total_steps": 9627, "loss": 1.7172, "learning_rate": 8.227874139681688e-05, "epoch": 0.2766178456424639, "percentage": 27.66, "elapsed_time": "19:53:02", "remaining_time": "2 days, 3:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2664, "total_steps": 9627, "loss": 1.8136, "learning_rate": 8.226627876134714e-05, "epoch": 0.27672172016204427, "percentage": 27.67, "elapsed_time": "19:53:28", "remaining_time": "2 days, 3:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2665, "total_steps": 9627, "loss": 1.7346, "learning_rate": 8.22538126897704e-05, "epoch": 0.2768255946816246, "percentage": 27.68, "elapsed_time": "19:53:53", "remaining_time": "2 days, 3:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2666, "total_steps": 9627, "loss": 1.925, "learning_rate": 8.224134318341421e-05, "epoch": 0.2769294692012049, "percentage": 27.69, "elapsed_time": "19:54:19", "remaining_time": "2 days, 3:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2667, "total_steps": 9627, "loss": 1.7681, "learning_rate": 8.222887024360646e-05, "epoch": 0.2770333437207853, "percentage": 27.7, "elapsed_time": "19:54:44", "remaining_time": "2 days, 3:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2668, "total_steps": 9627, "loss": 1.8118, "learning_rate": 8.221639387167543e-05, "epoch": 0.27713721824036563, "percentage": 27.71, "elapsed_time": "19:55:11", "remaining_time": "2 days, 3:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2669, "total_steps": 9627, "loss": 1.8121, "learning_rate": 8.220391406894973e-05, "epoch": 0.27724109275994596, "percentage": 27.72, "elapsed_time": "19:55:35", "remaining_time": "2 days, 3:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2670, "total_steps": 9627, "loss": 1.7102, "learning_rate": 8.21914308367584e-05, "epoch": 0.27734496727952634, "percentage": 27.73, "elapsed_time": "19:56:02", "remaining_time": "2 days, 3:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2671, "total_steps": 9627, "loss": 1.6396, "learning_rate": 8.217894417643078e-05, "epoch": 0.27744884179910667, "percentage": 27.74, "elapsed_time": "19:56:28", "remaining_time": "2 days, 3:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2672, "total_steps": 9627, "loss": 1.8278, "learning_rate": 8.216645408929661e-05, "epoch": 0.277552716318687, "percentage": 27.76, "elapsed_time": "19:56:53", "remaining_time": "2 days, 3:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2673, "total_steps": 9627, "loss": 1.7567, "learning_rate": 8.215396057668598e-05, "epoch": 0.2776565908382674, "percentage": 27.77, "elapsed_time": "19:57:19", "remaining_time": "2 days, 3:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2674, "total_steps": 9627, "loss": 1.7282, "learning_rate": 8.214146363992939e-05, "epoch": 0.2777604653578477, "percentage": 27.78, "elapsed_time": "19:57:44", "remaining_time": "2 days, 3:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2675, "total_steps": 9627, "loss": 1.6675, "learning_rate": 8.21289632803576e-05, "epoch": 0.2778643398774281, "percentage": 27.79, "elapsed_time": "19:58:10", "remaining_time": "2 days, 3:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2676, "total_steps": 9627, "loss": 1.6311, "learning_rate": 8.211645949930187e-05, "epoch": 0.2779682143970084, "percentage": 27.8, "elapsed_time": "19:58:35", "remaining_time": "2 days, 3:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2677, "total_steps": 9627, "loss": 1.7166, "learning_rate": 8.210395229809369e-05, "epoch": 0.27807208891658874, "percentage": 27.81, "elapsed_time": "19:59:01", "remaining_time": "2 days, 3:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2678, "total_steps": 9627, "loss": 1.7207, "learning_rate": 8.209144167806502e-05, "epoch": 0.2781759634361691, "percentage": 27.82, "elapsed_time": "19:59:26", "remaining_time": "2 days, 3:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2679, "total_steps": 9627, "loss": 1.7495, "learning_rate": 8.207892764054814e-05, "epoch": 0.27827983795574945, "percentage": 27.83, "elapsed_time": "19:59:51", "remaining_time": "2 days, 3:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2680, "total_steps": 9627, "loss": 1.6362, "learning_rate": 8.20664101868757e-05, "epoch": 0.2783837124753298, "percentage": 27.84, "elapsed_time": "20:00:18", "remaining_time": "2 days, 3:51:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2681, "total_steps": 9627, "loss": 1.594, "learning_rate": 8.205388931838068e-05, "epoch": 0.27848758699491016, "percentage": 27.85, "elapsed_time": "20:00:43", "remaining_time": "2 days, 3:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2682, "total_steps": 9627, "loss": 1.9431, "learning_rate": 8.20413650363965e-05, "epoch": 0.2785914615144905, "percentage": 27.86, "elapsed_time": "20:01:08", "remaining_time": "2 days, 3:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2683, "total_steps": 9627, "loss": 1.7749, "learning_rate": 8.202883734225686e-05, "epoch": 0.2786953360340708, "percentage": 27.87, "elapsed_time": "20:01:35", "remaining_time": "2 days, 3:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2684, "total_steps": 9627, "loss": 1.8466, "learning_rate": 8.201630623729588e-05, "epoch": 0.2787992105536512, "percentage": 27.88, "elapsed_time": "20:01:59", "remaining_time": "2 days, 3:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2685, "total_steps": 9627, "loss": 2.0036, "learning_rate": 8.200377172284803e-05, "epoch": 0.2789030850732315, "percentage": 27.89, "elapsed_time": "20:02:26", "remaining_time": "2 days, 3:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2686, "total_steps": 9627, "loss": 1.6884, "learning_rate": 8.199123380024812e-05, "epoch": 0.2790069595928119, "percentage": 27.9, "elapsed_time": "20:02:51", "remaining_time": "2 days, 3:48:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2687, "total_steps": 9627, "loss": 1.6512, "learning_rate": 8.197869247083136e-05, "epoch": 0.27911083411239224, "percentage": 27.91, "elapsed_time": "20:03:17", "remaining_time": "2 days, 3:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2688, "total_steps": 9627, "loss": 1.6059, "learning_rate": 8.196614773593329e-05, "epoch": 0.27921470863197256, "percentage": 27.92, "elapsed_time": "20:03:42", "remaining_time": "2 days, 3:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2689, "total_steps": 9627, "loss": 1.6252, "learning_rate": 8.195359959688985e-05, "epoch": 0.27931858315155295, "percentage": 27.93, "elapsed_time": "20:04:08", "remaining_time": "2 days, 3:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2690, "total_steps": 9627, "loss": 1.7011, "learning_rate": 8.194104805503728e-05, "epoch": 0.2794224576711333, "percentage": 27.94, "elapsed_time": "20:04:33", "remaining_time": "2 days, 3:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2691, "total_steps": 9627, "loss": 1.6864, "learning_rate": 8.192849311171225e-05, "epoch": 0.2795263321907136, "percentage": 27.95, "elapsed_time": "20:04:59", "remaining_time": "2 days, 3:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2692, "total_steps": 9627, "loss": 1.5545, "learning_rate": 8.191593476825174e-05, "epoch": 0.279630206710294, "percentage": 27.96, "elapsed_time": "20:05:25", "remaining_time": "2 days, 3:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2693, "total_steps": 9627, "loss": 1.7473, "learning_rate": 8.190337302599314e-05, "epoch": 0.2797340812298743, "percentage": 27.97, "elapsed_time": "20:05:50", "remaining_time": "2 days, 3:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2694, "total_steps": 9627, "loss": 1.6099, "learning_rate": 8.189080788627419e-05, "epoch": 0.27983795574945464, "percentage": 27.98, "elapsed_time": "20:06:15", "remaining_time": "2 days, 3:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2695, "total_steps": 9627, "loss": 1.6274, "learning_rate": 8.187823935043292e-05, "epoch": 0.279941830269035, "percentage": 27.99, "elapsed_time": "20:06:41", "remaining_time": "2 days, 3:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2696, "total_steps": 9627, "loss": 1.8226, "learning_rate": 8.186566741980786e-05, "epoch": 0.28004570478861535, "percentage": 28.0, "elapsed_time": "20:07:06", "remaining_time": "2 days, 3:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2697, "total_steps": 9627, "loss": 1.6987, "learning_rate": 8.185309209573775e-05, "epoch": 0.2801495793081957, "percentage": 28.01, "elapsed_time": "20:07:32", "remaining_time": "2 days, 3:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2698, "total_steps": 9627, "loss": 1.7248, "learning_rate": 8.18405133795618e-05, "epoch": 0.28025345382777606, "percentage": 28.03, "elapsed_time": "20:07:58", "remaining_time": "2 days, 3:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2699, "total_steps": 9627, "loss": 1.8529, "learning_rate": 8.182793127261955e-05, "epoch": 0.2803573283473564, "percentage": 28.04, "elapsed_time": "20:08:23", "remaining_time": "2 days, 3:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 9627, "loss": 1.8915, "learning_rate": 8.181534577625088e-05, "epoch": 0.28046120286693677, "percentage": 28.05, "elapsed_time": "20:08:49", "remaining_time": "2 days, 3:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2701, "total_steps": 9627, "loss": 1.7146, "learning_rate": 8.180275689179607e-05, "epoch": 0.2805650773865171, "percentage": 28.06, "elapsed_time": "20:09:14", "remaining_time": "2 days, 3:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2702, "total_steps": 9627, "loss": 1.5943, "learning_rate": 8.17901646205957e-05, "epoch": 0.2806689519060974, "percentage": 28.07, "elapsed_time": "20:09:40", "remaining_time": "2 days, 3:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2703, "total_steps": 9627, "loss": 1.7849, "learning_rate": 8.177756896399078e-05, "epoch": 0.2807728264256778, "percentage": 28.08, "elapsed_time": "20:10:05", "remaining_time": "2 days, 3:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2704, "total_steps": 9627, "loss": 1.7837, "learning_rate": 8.176496992332265e-05, "epoch": 0.28087670094525813, "percentage": 28.09, "elapsed_time": "20:10:31", "remaining_time": "2 days, 3:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2705, "total_steps": 9627, "loss": 1.9918, "learning_rate": 8.175236749993298e-05, "epoch": 0.28098057546483846, "percentage": 28.1, "elapsed_time": "20:10:56", "remaining_time": "2 days, 3:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2706, "total_steps": 9627, "loss": 1.8577, "learning_rate": 8.173976169516386e-05, "epoch": 0.28108444998441884, "percentage": 28.11, "elapsed_time": "20:11:22", "remaining_time": "2 days, 3:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2707, "total_steps": 9627, "loss": 1.6675, "learning_rate": 8.17271525103577e-05, "epoch": 0.28118832450399917, "percentage": 28.12, "elapsed_time": "20:11:48", "remaining_time": "2 days, 3:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2708, "total_steps": 9627, "loss": 1.8988, "learning_rate": 8.171453994685728e-05, "epoch": 0.2812921990235795, "percentage": 28.13, "elapsed_time": "20:12:14", "remaining_time": "2 days, 3:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2709, "total_steps": 9627, "loss": 1.6811, "learning_rate": 8.170192400600574e-05, "epoch": 0.2813960735431599, "percentage": 28.14, "elapsed_time": "20:12:40", "remaining_time": "2 days, 3:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2710, "total_steps": 9627, "loss": 1.5888, "learning_rate": 8.168930468914658e-05, "epoch": 0.2814999480627402, "percentage": 28.15, "elapsed_time": "20:13:05", "remaining_time": "2 days, 3:36:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2711, "total_steps": 9627, "loss": 1.5904, "learning_rate": 8.167668199762364e-05, "epoch": 0.2816038225823206, "percentage": 28.16, "elapsed_time": "20:13:31", "remaining_time": "2 days, 3:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2712, "total_steps": 9627, "loss": 1.7703, "learning_rate": 8.166405593278116e-05, "epoch": 0.2817076971019009, "percentage": 28.17, "elapsed_time": "20:13:57", "remaining_time": "2 days, 3:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2713, "total_steps": 9627, "loss": 1.6956, "learning_rate": 8.165142649596372e-05, "epoch": 0.28181157162148124, "percentage": 28.18, "elapsed_time": "20:14:23", "remaining_time": "2 days, 3:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2714, "total_steps": 9627, "loss": 1.9759, "learning_rate": 8.163879368851623e-05, "epoch": 0.2819154461410616, "percentage": 28.19, "elapsed_time": "20:14:48", "remaining_time": "2 days, 3:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2715, "total_steps": 9627, "loss": 1.6924, "learning_rate": 8.162615751178405e-05, "epoch": 0.28201932066064195, "percentage": 28.2, "elapsed_time": "20:15:13", "remaining_time": "2 days, 3:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2716, "total_steps": 9627, "loss": 1.8406, "learning_rate": 8.161351796711274e-05, "epoch": 0.2821231951802223, "percentage": 28.21, "elapsed_time": "20:15:39", "remaining_time": "2 days, 3:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2717, "total_steps": 9627, "loss": 1.7651, "learning_rate": 8.16008750558484e-05, "epoch": 0.28222706969980266, "percentage": 28.22, "elapsed_time": "20:16:04", "remaining_time": "2 days, 3:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2718, "total_steps": 9627, "loss": 1.7538, "learning_rate": 8.158822877933733e-05, "epoch": 0.282330944219383, "percentage": 28.23, "elapsed_time": "20:16:29", "remaining_time": "2 days, 3:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2719, "total_steps": 9627, "loss": 1.7825, "learning_rate": 8.15755791389263e-05, "epoch": 0.2824348187389633, "percentage": 28.24, "elapsed_time": "20:16:55", "remaining_time": "2 days, 3:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2720, "total_steps": 9627, "loss": 1.737, "learning_rate": 8.15629261359624e-05, "epoch": 0.2825386932585437, "percentage": 28.25, "elapsed_time": "20:17:22", "remaining_time": "2 days, 3:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2721, "total_steps": 9627, "loss": 1.774, "learning_rate": 8.155026977179307e-05, "epoch": 0.282642567778124, "percentage": 28.26, "elapsed_time": "20:17:47", "remaining_time": "2 days, 3:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2722, "total_steps": 9627, "loss": 1.7034, "learning_rate": 8.15376100477661e-05, "epoch": 0.28274644229770435, "percentage": 28.27, "elapsed_time": "20:18:12", "remaining_time": "2 days, 3:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2723, "total_steps": 9627, "loss": 1.5747, "learning_rate": 8.152494696522965e-05, "epoch": 0.28285031681728473, "percentage": 28.29, "elapsed_time": "20:18:38", "remaining_time": "2 days, 3:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2724, "total_steps": 9627, "loss": 1.7802, "learning_rate": 8.151228052553228e-05, "epoch": 0.28295419133686506, "percentage": 28.3, "elapsed_time": "20:19:03", "remaining_time": "2 days, 3:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2725, "total_steps": 9627, "loss": 1.7353, "learning_rate": 8.149961073002283e-05, "epoch": 0.28305806585644544, "percentage": 28.31, "elapsed_time": "20:19:29", "remaining_time": "2 days, 3:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2726, "total_steps": 9627, "loss": 1.8108, "learning_rate": 8.148693758005054e-05, "epoch": 0.28316194037602577, "percentage": 28.32, "elapsed_time": "20:19:55", "remaining_time": "2 days, 3:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2727, "total_steps": 9627, "loss": 1.7521, "learning_rate": 8.1474261076965e-05, "epoch": 0.2832658148956061, "percentage": 28.33, "elapsed_time": "20:20:20", "remaining_time": "2 days, 3:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2728, "total_steps": 9627, "loss": 1.6139, "learning_rate": 8.146158122211618e-05, "epoch": 0.2833696894151865, "percentage": 28.34, "elapsed_time": "20:20:45", "remaining_time": "2 days, 3:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2729, "total_steps": 9627, "loss": 1.9751, "learning_rate": 8.144889801685436e-05, "epoch": 0.2834735639347668, "percentage": 28.35, "elapsed_time": "20:21:12", "remaining_time": "2 days, 3:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2730, "total_steps": 9627, "loss": 1.7618, "learning_rate": 8.143621146253022e-05, "epoch": 0.28357743845434713, "percentage": 28.36, "elapsed_time": "20:21:37", "remaining_time": "2 days, 3:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2731, "total_steps": 9627, "loss": 1.7756, "learning_rate": 8.142352156049475e-05, "epoch": 0.2836813129739275, "percentage": 28.37, "elapsed_time": "20:22:02", "remaining_time": "2 days, 3:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2732, "total_steps": 9627, "loss": 1.8868, "learning_rate": 8.141082831209938e-05, "epoch": 0.28378518749350784, "percentage": 28.38, "elapsed_time": "20:22:29", "remaining_time": "2 days, 3:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2733, "total_steps": 9627, "loss": 1.9038, "learning_rate": 8.139813171869579e-05, "epoch": 0.28388906201308817, "percentage": 28.39, "elapsed_time": "20:22:54", "remaining_time": "2 days, 3:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2734, "total_steps": 9627, "loss": 1.5568, "learning_rate": 8.138543178163607e-05, "epoch": 0.28399293653266855, "percentage": 28.4, "elapsed_time": "20:23:20", "remaining_time": "2 days, 3:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2735, "total_steps": 9627, "loss": 1.6809, "learning_rate": 8.137272850227271e-05, "epoch": 0.2840968110522489, "percentage": 28.41, "elapsed_time": "20:23:46", "remaining_time": "2 days, 3:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2736, "total_steps": 9627, "loss": 1.7479, "learning_rate": 8.136002188195846e-05, "epoch": 0.2842006855718292, "percentage": 28.42, "elapsed_time": "20:24:11", "remaining_time": "2 days, 3:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2737, "total_steps": 9627, "loss": 1.8751, "learning_rate": 8.13473119220465e-05, "epoch": 0.2843045600914096, "percentage": 28.43, "elapsed_time": "20:24:37", "remaining_time": "2 days, 3:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2738, "total_steps": 9627, "loss": 1.8787, "learning_rate": 8.133459862389036e-05, "epoch": 0.2844084346109899, "percentage": 28.44, "elapsed_time": "20:25:03", "remaining_time": "2 days, 3:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2739, "total_steps": 9627, "loss": 1.827, "learning_rate": 8.132188198884386e-05, "epoch": 0.2845123091305703, "percentage": 28.45, "elapsed_time": "20:25:28", "remaining_time": "2 days, 3:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2740, "total_steps": 9627, "loss": 1.5635, "learning_rate": 8.130916201826126e-05, "epoch": 0.2846161836501506, "percentage": 28.46, "elapsed_time": "20:25:53", "remaining_time": "2 days, 3:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2741, "total_steps": 9627, "loss": 2.0049, "learning_rate": 8.129643871349712e-05, "epoch": 0.28472005816973095, "percentage": 28.47, "elapsed_time": "20:26:20", "remaining_time": "2 days, 3:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2742, "total_steps": 9627, "loss": 1.6739, "learning_rate": 8.128371207590639e-05, "epoch": 0.28482393268931133, "percentage": 28.48, "elapsed_time": "20:26:45", "remaining_time": "2 days, 3:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2743, "total_steps": 9627, "loss": 1.9091, "learning_rate": 8.127098210684434e-05, "epoch": 0.28492780720889166, "percentage": 28.49, "elapsed_time": "20:27:11", "remaining_time": "2 days, 3:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2744, "total_steps": 9627, "loss": 1.7084, "learning_rate": 8.125824880766661e-05, "epoch": 0.285031681728472, "percentage": 28.5, "elapsed_time": "20:27:35", "remaining_time": "2 days, 3:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2745, "total_steps": 9627, "loss": 1.7252, "learning_rate": 8.124551217972922e-05, "epoch": 0.28513555624805237, "percentage": 28.51, "elapsed_time": "20:28:03", "remaining_time": "2 days, 3:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2746, "total_steps": 9627, "loss": 1.8441, "learning_rate": 8.12327722243885e-05, "epoch": 0.2852394307676327, "percentage": 28.52, "elapsed_time": "20:28:28", "remaining_time": "2 days, 3:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2747, "total_steps": 9627, "loss": 1.506, "learning_rate": 8.122002894300117e-05, "epoch": 0.285343305287213, "percentage": 28.53, "elapsed_time": "20:28:53", "remaining_time": "2 days, 3:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2748, "total_steps": 9627, "loss": 1.6598, "learning_rate": 8.120728233692428e-05, "epoch": 0.2854471798067934, "percentage": 28.54, "elapsed_time": "20:29:19", "remaining_time": "2 days, 3:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2749, "total_steps": 9627, "loss": 1.6315, "learning_rate": 8.119453240751525e-05, "epoch": 0.28555105432637373, "percentage": 28.56, "elapsed_time": "20:29:44", "remaining_time": "2 days, 3:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 9627, "loss": 1.562, "learning_rate": 8.118177915613182e-05, "epoch": 0.2856549288459541, "percentage": 28.57, "elapsed_time": "20:30:10", "remaining_time": "2 days, 3:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2751, "total_steps": 9627, "loss": 1.9186, "learning_rate": 8.116902258413216e-05, "epoch": 0.28575880336553444, "percentage": 28.58, "elapsed_time": "20:30:36", "remaining_time": "2 days, 3:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2752, "total_steps": 9627, "loss": 1.862, "learning_rate": 8.115626269287473e-05, "epoch": 0.28586267788511477, "percentage": 28.59, "elapsed_time": "20:31:01", "remaining_time": "2 days, 3:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2753, "total_steps": 9627, "loss": 1.7655, "learning_rate": 8.114349948371833e-05, "epoch": 0.28596655240469515, "percentage": 28.6, "elapsed_time": "20:31:27", "remaining_time": "2 days, 3:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2754, "total_steps": 9627, "loss": 1.5148, "learning_rate": 8.113073295802219e-05, "epoch": 0.2860704269242755, "percentage": 28.61, "elapsed_time": "20:31:53", "remaining_time": "2 days, 3:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2755, "total_steps": 9627, "loss": 1.5992, "learning_rate": 8.111796311714579e-05, "epoch": 0.2861743014438558, "percentage": 28.62, "elapsed_time": "20:32:18", "remaining_time": "2 days, 3:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2756, "total_steps": 9627, "loss": 1.7642, "learning_rate": 8.110518996244907e-05, "epoch": 0.2862781759634362, "percentage": 28.63, "elapsed_time": "20:32:45", "remaining_time": "2 days, 3:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2757, "total_steps": 9627, "loss": 1.9091, "learning_rate": 8.109241349529223e-05, "epoch": 0.2863820504830165, "percentage": 28.64, "elapsed_time": "20:33:10", "remaining_time": "2 days, 3:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2758, "total_steps": 9627, "loss": 1.7881, "learning_rate": 8.107963371703589e-05, "epoch": 0.28648592500259684, "percentage": 28.65, "elapsed_time": "20:33:36", "remaining_time": "2 days, 3:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2759, "total_steps": 9627, "loss": 1.6742, "learning_rate": 8.1066850629041e-05, "epoch": 0.2865897995221772, "percentage": 28.66, "elapsed_time": "20:34:01", "remaining_time": "2 days, 3:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2760, "total_steps": 9627, "loss": 1.6718, "learning_rate": 8.105406423266884e-05, "epoch": 0.28669367404175755, "percentage": 28.67, "elapsed_time": "20:34:27", "remaining_time": "2 days, 3:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2761, "total_steps": 9627, "loss": 1.7174, "learning_rate": 8.104127452928107e-05, "epoch": 0.2867975485613379, "percentage": 28.68, "elapsed_time": "20:34:53", "remaining_time": "2 days, 3:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2762, "total_steps": 9627, "loss": 1.7269, "learning_rate": 8.10284815202397e-05, "epoch": 0.28690142308091826, "percentage": 28.69, "elapsed_time": "20:35:18", "remaining_time": "2 days, 3:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2763, "total_steps": 9627, "loss": 1.7251, "learning_rate": 8.101568520690708e-05, "epoch": 0.2870052976004986, "percentage": 28.7, "elapsed_time": "20:35:45", "remaining_time": "2 days, 3:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2764, "total_steps": 9627, "loss": 1.7643, "learning_rate": 8.10028855906459e-05, "epoch": 0.28710917212007897, "percentage": 28.71, "elapsed_time": "20:36:10", "remaining_time": "2 days, 3:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2765, "total_steps": 9627, "loss": 1.7648, "learning_rate": 8.099008267281924e-05, "epoch": 0.2872130466396593, "percentage": 28.72, "elapsed_time": "20:36:36", "remaining_time": "2 days, 3:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2766, "total_steps": 9627, "loss": 1.7988, "learning_rate": 8.097727645479053e-05, "epoch": 0.2873169211592396, "percentage": 28.73, "elapsed_time": "20:37:02", "remaining_time": "2 days, 3:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2767, "total_steps": 9627, "loss": 1.857, "learning_rate": 8.096446693792347e-05, "epoch": 0.28742079567882, "percentage": 28.74, "elapsed_time": "20:37:28", "remaining_time": "2 days, 3:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2768, "total_steps": 9627, "loss": 1.5582, "learning_rate": 8.095165412358225e-05, "epoch": 0.28752467019840033, "percentage": 28.75, "elapsed_time": "20:37:53", "remaining_time": "2 days, 3:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2769, "total_steps": 9627, "loss": 1.6839, "learning_rate": 8.093883801313129e-05, "epoch": 0.28762854471798066, "percentage": 28.76, "elapsed_time": "20:38:19", "remaining_time": "2 days, 3:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2770, "total_steps": 9627, "loss": 1.7254, "learning_rate": 8.09260186079354e-05, "epoch": 0.28773241923756104, "percentage": 28.77, "elapsed_time": "20:38:44", "remaining_time": "2 days, 3:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2771, "total_steps": 9627, "loss": 1.6938, "learning_rate": 8.091319590935978e-05, "epoch": 0.28783629375714137, "percentage": 28.78, "elapsed_time": "20:39:10", "remaining_time": "2 days, 3:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2772, "total_steps": 9627, "loss": 1.7066, "learning_rate": 8.090036991876992e-05, "epoch": 0.2879401682767217, "percentage": 28.79, "elapsed_time": "20:39:36", "remaining_time": "2 days, 3:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2773, "total_steps": 9627, "loss": 2.0641, "learning_rate": 8.08875406375317e-05, "epoch": 0.2880440427963021, "percentage": 28.8, "elapsed_time": "20:40:02", "remaining_time": "2 days, 3:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2774, "total_steps": 9627, "loss": 1.9339, "learning_rate": 8.087470806701131e-05, "epoch": 0.2881479173158824, "percentage": 28.81, "elapsed_time": "20:40:28", "remaining_time": "2 days, 3:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2775, "total_steps": 9627, "loss": 1.6855, "learning_rate": 8.086187220857537e-05, "epoch": 0.28825179183546273, "percentage": 28.83, "elapsed_time": "20:40:54", "remaining_time": "2 days, 3:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2776, "total_steps": 9627, "loss": 1.786, "learning_rate": 8.084903306359078e-05, "epoch": 0.2883556663550431, "percentage": 28.84, "elapsed_time": "20:41:19", "remaining_time": "2 days, 3:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2777, "total_steps": 9627, "loss": 1.796, "learning_rate": 8.083619063342477e-05, "epoch": 0.28845954087462344, "percentage": 28.85, "elapsed_time": "20:41:44", "remaining_time": "2 days, 3:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2778, "total_steps": 9627, "loss": 1.8309, "learning_rate": 8.0823344919445e-05, "epoch": 0.2885634153942038, "percentage": 28.86, "elapsed_time": "20:42:10", "remaining_time": "2 days, 3:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2779, "total_steps": 9627, "loss": 1.8686, "learning_rate": 8.081049592301944e-05, "epoch": 0.28866728991378415, "percentage": 28.87, "elapsed_time": "20:42:36", "remaining_time": "2 days, 3:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2780, "total_steps": 9627, "loss": 1.7419, "learning_rate": 8.079764364551638e-05, "epoch": 0.2887711644333645, "percentage": 28.88, "elapsed_time": "20:43:02", "remaining_time": "2 days, 3:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2781, "total_steps": 9627, "loss": 1.478, "learning_rate": 8.07847880883045e-05, "epoch": 0.28887503895294486, "percentage": 28.89, "elapsed_time": "20:43:27", "remaining_time": "2 days, 3:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2782, "total_steps": 9627, "loss": 1.8183, "learning_rate": 8.077192925275283e-05, "epoch": 0.2889789134725252, "percentage": 28.9, "elapsed_time": "20:43:53", "remaining_time": "2 days, 3:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2783, "total_steps": 9627, "loss": 1.7757, "learning_rate": 8.075906714023073e-05, "epoch": 0.2890827879921055, "percentage": 28.91, "elapsed_time": "20:44:19", "remaining_time": "2 days, 3:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2784, "total_steps": 9627, "loss": 1.6917, "learning_rate": 8.07462017521079e-05, "epoch": 0.2891866625116859, "percentage": 28.92, "elapsed_time": "20:44:44", "remaining_time": "2 days, 2:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2785, "total_steps": 9627, "loss": 1.7787, "learning_rate": 8.073333308975442e-05, "epoch": 0.2892905370312662, "percentage": 28.93, "elapsed_time": "20:45:11", "remaining_time": "2 days, 2:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2786, "total_steps": 9627, "loss": 1.9255, "learning_rate": 8.072046115454069e-05, "epoch": 0.28939441155084655, "percentage": 28.94, "elapsed_time": "20:45:36", "remaining_time": "2 days, 2:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2787, "total_steps": 9627, "loss": 1.6905, "learning_rate": 8.070758594783748e-05, "epoch": 0.28949828607042694, "percentage": 28.95, "elapsed_time": "20:46:02", "remaining_time": "2 days, 2:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2788, "total_steps": 9627, "loss": 1.784, "learning_rate": 8.069470747101588e-05, "epoch": 0.28960216059000726, "percentage": 28.96, "elapsed_time": "20:46:27", "remaining_time": "2 days, 2:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2789, "total_steps": 9627, "loss": 1.7567, "learning_rate": 8.068182572544736e-05, "epoch": 0.28970603510958765, "percentage": 28.97, "elapsed_time": "20:46:54", "remaining_time": "2 days, 2:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2790, "total_steps": 9627, "loss": 1.8726, "learning_rate": 8.066894071250375e-05, "epoch": 0.28980990962916797, "percentage": 28.98, "elapsed_time": "20:47:19", "remaining_time": "2 days, 2:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2791, "total_steps": 9627, "loss": 1.7629, "learning_rate": 8.065605243355717e-05, "epoch": 0.2899137841487483, "percentage": 28.99, "elapsed_time": "20:47:45", "remaining_time": "2 days, 2:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2792, "total_steps": 9627, "loss": 1.7499, "learning_rate": 8.064316088998012e-05, "epoch": 0.2900176586683287, "percentage": 29.0, "elapsed_time": "20:48:11", "remaining_time": "2 days, 2:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2793, "total_steps": 9627, "loss": 1.7148, "learning_rate": 8.063026608314547e-05, "epoch": 0.290121533187909, "percentage": 29.01, "elapsed_time": "20:48:36", "remaining_time": "2 days, 2:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2794, "total_steps": 9627, "loss": 1.8031, "learning_rate": 8.061736801442643e-05, "epoch": 0.29022540770748934, "percentage": 29.02, "elapsed_time": "20:49:02", "remaining_time": "2 days, 2:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2795, "total_steps": 9627, "loss": 1.718, "learning_rate": 8.06044666851965e-05, "epoch": 0.2903292822270697, "percentage": 29.03, "elapsed_time": "20:49:28", "remaining_time": "2 days, 2:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2796, "total_steps": 9627, "loss": 1.7655, "learning_rate": 8.059156209682959e-05, "epoch": 0.29043315674665005, "percentage": 29.04, "elapsed_time": "20:49:53", "remaining_time": "2 days, 2:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2797, "total_steps": 9627, "loss": 1.7541, "learning_rate": 8.057865425069995e-05, "epoch": 0.29053703126623037, "percentage": 29.05, "elapsed_time": "20:50:20", "remaining_time": "2 days, 2:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2798, "total_steps": 9627, "loss": 1.747, "learning_rate": 8.056574314818215e-05, "epoch": 0.29064090578581075, "percentage": 29.06, "elapsed_time": "20:50:45", "remaining_time": "2 days, 2:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2799, "total_steps": 9627, "loss": 1.6764, "learning_rate": 8.055282879065114e-05, "epoch": 0.2907447803053911, "percentage": 29.07, "elapsed_time": "20:51:11", "remaining_time": "2 days, 2:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 9627, "loss": 1.7869, "learning_rate": 8.053991117948216e-05, "epoch": 0.2908486548249714, "percentage": 29.08, "elapsed_time": "20:51:36", "remaining_time": "2 days, 2:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2801, "total_steps": 9627, "loss": 1.8845, "learning_rate": 8.052699031605087e-05, "epoch": 0.2909525293445518, "percentage": 29.1, "elapsed_time": "20:52:02", "remaining_time": "2 days, 2:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2802, "total_steps": 9627, "loss": 1.6482, "learning_rate": 8.051406620173323e-05, "epoch": 0.2910564038641321, "percentage": 29.11, "elapsed_time": "20:52:27", "remaining_time": "2 days, 2:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2803, "total_steps": 9627, "loss": 1.6466, "learning_rate": 8.050113883790556e-05, "epoch": 0.2911602783837125, "percentage": 29.12, "elapsed_time": "20:52:53", "remaining_time": "2 days, 2:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2804, "total_steps": 9627, "loss": 1.8663, "learning_rate": 8.048820822594452e-05, "epoch": 0.29126415290329283, "percentage": 29.13, "elapsed_time": "20:53:19", "remaining_time": "2 days, 2:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2805, "total_steps": 9627, "loss": 1.7933, "learning_rate": 8.047527436722713e-05, "epoch": 0.29136802742287315, "percentage": 29.14, "elapsed_time": "20:53:45", "remaining_time": "2 days, 2:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2806, "total_steps": 9627, "loss": 1.6788, "learning_rate": 8.046233726313073e-05, "epoch": 0.29147190194245354, "percentage": 29.15, "elapsed_time": "20:54:10", "remaining_time": "2 days, 2:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2807, "total_steps": 9627, "loss": 1.7392, "learning_rate": 8.044939691503304e-05, "epoch": 0.29157577646203386, "percentage": 29.16, "elapsed_time": "20:54:37", "remaining_time": "2 days, 2:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2808, "total_steps": 9627, "loss": 1.6476, "learning_rate": 8.043645332431206e-05, "epoch": 0.2916796509816142, "percentage": 29.17, "elapsed_time": "20:55:02", "remaining_time": "2 days, 2:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2809, "total_steps": 9627, "loss": 1.7906, "learning_rate": 8.042350649234625e-05, "epoch": 0.2917835255011946, "percentage": 29.18, "elapsed_time": "20:55:28", "remaining_time": "2 days, 2:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2810, "total_steps": 9627, "loss": 1.5869, "learning_rate": 8.041055642051429e-05, "epoch": 0.2918874000207749, "percentage": 29.19, "elapsed_time": "20:55:53", "remaining_time": "2 days, 2:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2811, "total_steps": 9627, "loss": 1.7447, "learning_rate": 8.039760311019529e-05, "epoch": 0.29199127454035523, "percentage": 29.2, "elapsed_time": "20:56:20", "remaining_time": "2 days, 2:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2812, "total_steps": 9627, "loss": 1.8424, "learning_rate": 8.038464656276867e-05, "epoch": 0.2920951490599356, "percentage": 29.21, "elapsed_time": "20:56:46", "remaining_time": "2 days, 2:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2813, "total_steps": 9627, "loss": 1.6962, "learning_rate": 8.03716867796142e-05, "epoch": 0.29219902357951594, "percentage": 29.22, "elapsed_time": "20:57:11", "remaining_time": "2 days, 2:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2814, "total_steps": 9627, "loss": 1.6874, "learning_rate": 8.035872376211199e-05, "epoch": 0.29230289809909626, "percentage": 29.23, "elapsed_time": "20:57:37", "remaining_time": "2 days, 2:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2815, "total_steps": 9627, "loss": 1.8638, "learning_rate": 8.03457575116425e-05, "epoch": 0.29240677261867665, "percentage": 29.24, "elapsed_time": "20:58:03", "remaining_time": "2 days, 2:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2816, "total_steps": 9627, "loss": 1.808, "learning_rate": 8.033278802958656e-05, "epoch": 0.292510647138257, "percentage": 29.25, "elapsed_time": "20:58:29", "remaining_time": "2 days, 2:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2817, "total_steps": 9627, "loss": 1.6983, "learning_rate": 8.031981531732529e-05, "epoch": 0.29261452165783736, "percentage": 29.26, "elapsed_time": "20:58:55", "remaining_time": "2 days, 2:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2818, "total_steps": 9627, "loss": 1.7543, "learning_rate": 8.03068393762402e-05, "epoch": 0.2927183961774177, "percentage": 29.27, "elapsed_time": "20:59:20", "remaining_time": "2 days, 2:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2819, "total_steps": 9627, "loss": 1.8414, "learning_rate": 8.02938602077131e-05, "epoch": 0.292822270696998, "percentage": 29.28, "elapsed_time": "20:59:45", "remaining_time": "2 days, 2:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2820, "total_steps": 9627, "loss": 1.8325, "learning_rate": 8.02808778131262e-05, "epoch": 0.2929261452165784, "percentage": 29.29, "elapsed_time": "21:00:11", "remaining_time": "2 days, 2:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2821, "total_steps": 9627, "loss": 1.7774, "learning_rate": 8.026789219386201e-05, "epoch": 0.2930300197361587, "percentage": 29.3, "elapsed_time": "21:00:36", "remaining_time": "2 days, 2:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2822, "total_steps": 9627, "loss": 1.7133, "learning_rate": 8.025490335130341e-05, "epoch": 0.29313389425573905, "percentage": 29.31, "elapsed_time": "21:01:02", "remaining_time": "2 days, 2:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2823, "total_steps": 9627, "loss": 1.7046, "learning_rate": 8.02419112868336e-05, "epoch": 0.29323776877531943, "percentage": 29.32, "elapsed_time": "21:01:28", "remaining_time": "2 days, 2:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2824, "total_steps": 9627, "loss": 1.6936, "learning_rate": 8.022891600183613e-05, "epoch": 0.29334164329489976, "percentage": 29.33, "elapsed_time": "21:01:54", "remaining_time": "2 days, 2:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2825, "total_steps": 9627, "loss": 1.7645, "learning_rate": 8.021591749769489e-05, "epoch": 0.2934455178144801, "percentage": 29.34, "elapsed_time": "21:02:19", "remaining_time": "2 days, 2:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2826, "total_steps": 9627, "loss": 1.8886, "learning_rate": 8.020291577579413e-05, "epoch": 0.29354939233406047, "percentage": 29.35, "elapsed_time": "21:02:45", "remaining_time": "2 days, 2:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2827, "total_steps": 9627, "loss": 1.7208, "learning_rate": 8.018991083751846e-05, "epoch": 0.2936532668536408, "percentage": 29.37, "elapsed_time": "21:03:11", "remaining_time": "2 days, 2:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2828, "total_steps": 9627, "loss": 1.6585, "learning_rate": 8.017690268425276e-05, "epoch": 0.2937571413732212, "percentage": 29.38, "elapsed_time": "21:03:36", "remaining_time": "2 days, 2:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2829, "total_steps": 9627, "loss": 1.7227, "learning_rate": 8.016389131738229e-05, "epoch": 0.2938610158928015, "percentage": 29.39, "elapsed_time": "21:04:03", "remaining_time": "2 days, 2:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2830, "total_steps": 9627, "loss": 1.8273, "learning_rate": 8.015087673829271e-05, "epoch": 0.29396489041238183, "percentage": 29.4, "elapsed_time": "21:04:28", "remaining_time": "2 days, 2:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2831, "total_steps": 9627, "loss": 1.6725, "learning_rate": 8.013785894836993e-05, "epoch": 0.2940687649319622, "percentage": 29.41, "elapsed_time": "21:04:54", "remaining_time": "2 days, 2:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2832, "total_steps": 9627, "loss": 1.729, "learning_rate": 8.012483794900026e-05, "epoch": 0.29417263945154254, "percentage": 29.42, "elapsed_time": "21:05:20", "remaining_time": "2 days, 2:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2833, "total_steps": 9627, "loss": 1.6771, "learning_rate": 8.011181374157034e-05, "epoch": 0.29427651397112287, "percentage": 29.43, "elapsed_time": "21:05:45", "remaining_time": "2 days, 2:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2834, "total_steps": 9627, "loss": 1.8316, "learning_rate": 8.009878632746712e-05, "epoch": 0.29438038849070325, "percentage": 29.44, "elapsed_time": "21:06:11", "remaining_time": "2 days, 2:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2835, "total_steps": 9627, "loss": 1.7071, "learning_rate": 8.008575570807795e-05, "epoch": 0.2944842630102836, "percentage": 29.45, "elapsed_time": "21:06:37", "remaining_time": "2 days, 2:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2836, "total_steps": 9627, "loss": 1.8557, "learning_rate": 8.007272188479049e-05, "epoch": 0.2945881375298639, "percentage": 29.46, "elapsed_time": "21:07:02", "remaining_time": "2 days, 2:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2837, "total_steps": 9627, "loss": 1.7695, "learning_rate": 8.005968485899269e-05, "epoch": 0.2946920120494443, "percentage": 29.47, "elapsed_time": "21:07:28", "remaining_time": "2 days, 2:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2838, "total_steps": 9627, "loss": 1.6902, "learning_rate": 8.004664463207294e-05, "epoch": 0.2947958865690246, "percentage": 29.48, "elapsed_time": "21:07:54", "remaining_time": "2 days, 2:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2839, "total_steps": 9627, "loss": 1.7109, "learning_rate": 8.003360120541992e-05, "epoch": 0.29489976108860494, "percentage": 29.49, "elapsed_time": "21:08:20", "remaining_time": "2 days, 2:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2840, "total_steps": 9627, "loss": 1.8152, "learning_rate": 8.002055458042264e-05, "epoch": 0.2950036356081853, "percentage": 29.5, "elapsed_time": "21:08:46", "remaining_time": "2 days, 2:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2841, "total_steps": 9627, "loss": 1.8906, "learning_rate": 8.000750475847045e-05, "epoch": 0.29510751012776565, "percentage": 29.51, "elapsed_time": "21:09:11", "remaining_time": "2 days, 2:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2842, "total_steps": 9627, "loss": 1.6325, "learning_rate": 7.999445174095308e-05, "epoch": 0.29521138464734603, "percentage": 29.52, "elapsed_time": "21:09:37", "remaining_time": "2 days, 2:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2843, "total_steps": 9627, "loss": 1.6156, "learning_rate": 7.998139552926057e-05, "epoch": 0.29531525916692636, "percentage": 29.53, "elapsed_time": "21:10:03", "remaining_time": "2 days, 2:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2844, "total_steps": 9627, "loss": 1.71, "learning_rate": 7.996833612478331e-05, "epoch": 0.2954191336865067, "percentage": 29.54, "elapsed_time": "21:10:28", "remaining_time": "2 days, 2:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2845, "total_steps": 9627, "loss": 1.7186, "learning_rate": 7.9955273528912e-05, "epoch": 0.29552300820608707, "percentage": 29.55, "elapsed_time": "21:10:55", "remaining_time": "2 days, 2:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2846, "total_steps": 9627, "loss": 1.5034, "learning_rate": 7.994220774303771e-05, "epoch": 0.2956268827256674, "percentage": 29.56, "elapsed_time": "21:11:20", "remaining_time": "2 days, 2:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2847, "total_steps": 9627, "loss": 1.6271, "learning_rate": 7.992913876855188e-05, "epoch": 0.2957307572452477, "percentage": 29.57, "elapsed_time": "21:11:46", "remaining_time": "2 days, 2:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2848, "total_steps": 9627, "loss": 1.7693, "learning_rate": 7.99160666068462e-05, "epoch": 0.2958346317648281, "percentage": 29.58, "elapsed_time": "21:12:11", "remaining_time": "2 days, 2:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2849, "total_steps": 9627, "loss": 1.5047, "learning_rate": 7.99029912593128e-05, "epoch": 0.29593850628440843, "percentage": 29.59, "elapsed_time": "21:12:38", "remaining_time": "2 days, 2:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 9627, "loss": 1.6688, "learning_rate": 7.988991272734407e-05, "epoch": 0.29604238080398876, "percentage": 29.6, "elapsed_time": "21:13:03", "remaining_time": "2 days, 2:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2851, "total_steps": 9627, "loss": 1.7687, "learning_rate": 7.987683101233279e-05, "epoch": 0.29614625532356914, "percentage": 29.61, "elapsed_time": "21:13:29", "remaining_time": "2 days, 2:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2852, "total_steps": 9627, "loss": 1.7141, "learning_rate": 7.986374611567207e-05, "epoch": 0.29625012984314947, "percentage": 29.63, "elapsed_time": "21:13:55", "remaining_time": "2 days, 2:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2853, "total_steps": 9627, "loss": 1.9484, "learning_rate": 7.985065803875532e-05, "epoch": 0.2963540043627298, "percentage": 29.64, "elapsed_time": "21:14:21", "remaining_time": "2 days, 2:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2854, "total_steps": 9627, "loss": 1.6849, "learning_rate": 7.983756678297633e-05, "epoch": 0.2964578788823102, "percentage": 29.65, "elapsed_time": "21:14:47", "remaining_time": "2 days, 2:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2855, "total_steps": 9627, "loss": 1.7369, "learning_rate": 7.982447234972922e-05, "epoch": 0.2965617534018905, "percentage": 29.66, "elapsed_time": "21:15:12", "remaining_time": "2 days, 2:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2856, "total_steps": 9627, "loss": 1.7769, "learning_rate": 7.981137474040845e-05, "epoch": 0.2966656279214709, "percentage": 29.67, "elapsed_time": "21:15:38", "remaining_time": "2 days, 2:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2857, "total_steps": 9627, "loss": 1.6387, "learning_rate": 7.979827395640883e-05, "epoch": 0.2967695024410512, "percentage": 29.68, "elapsed_time": "21:16:04", "remaining_time": "2 days, 2:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2858, "total_steps": 9627, "loss": 1.7448, "learning_rate": 7.978516999912544e-05, "epoch": 0.29687337696063154, "percentage": 29.69, "elapsed_time": "21:16:30", "remaining_time": "2 days, 2:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2859, "total_steps": 9627, "loss": 1.7705, "learning_rate": 7.977206286995379e-05, "epoch": 0.2969772514802119, "percentage": 29.7, "elapsed_time": "21:16:56", "remaining_time": "2 days, 2:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2860, "total_steps": 9627, "loss": 1.9017, "learning_rate": 7.975895257028965e-05, "epoch": 0.29708112599979225, "percentage": 29.71, "elapsed_time": "21:17:21", "remaining_time": "2 days, 2:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2861, "total_steps": 9627, "loss": 1.5924, "learning_rate": 7.974583910152922e-05, "epoch": 0.2971850005193726, "percentage": 29.72, "elapsed_time": "21:17:47", "remaining_time": "2 days, 2:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2862, "total_steps": 9627, "loss": 1.7093, "learning_rate": 7.973272246506893e-05, "epoch": 0.29728887503895296, "percentage": 29.73, "elapsed_time": "21:18:13", "remaining_time": "2 days, 2:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2863, "total_steps": 9627, "loss": 1.7662, "learning_rate": 7.971960266230565e-05, "epoch": 0.2973927495585333, "percentage": 29.74, "elapsed_time": "21:18:38", "remaining_time": "2 days, 2:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2864, "total_steps": 9627, "loss": 1.6753, "learning_rate": 7.97064796946365e-05, "epoch": 0.2974966240781136, "percentage": 29.75, "elapsed_time": "21:19:04", "remaining_time": "2 days, 2:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2865, "total_steps": 9627, "loss": 2.0455, "learning_rate": 7.969335356345894e-05, "epoch": 0.297600498597694, "percentage": 29.76, "elapsed_time": "21:19:30", "remaining_time": "2 days, 2:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2866, "total_steps": 9627, "loss": 1.4737, "learning_rate": 7.968022427017088e-05, "epoch": 0.2977043731172743, "percentage": 29.77, "elapsed_time": "21:19:56", "remaining_time": "2 days, 2:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2867, "total_steps": 9627, "loss": 1.8034, "learning_rate": 7.966709181617045e-05, "epoch": 0.2978082476368547, "percentage": 29.78, "elapsed_time": "21:20:21", "remaining_time": "2 days, 2:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2868, "total_steps": 9627, "loss": 1.7262, "learning_rate": 7.965395620285616e-05, "epoch": 0.29791212215643503, "percentage": 29.79, "elapsed_time": "21:20:47", "remaining_time": "2 days, 2:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2869, "total_steps": 9627, "loss": 1.8834, "learning_rate": 7.964081743162684e-05, "epoch": 0.29801599667601536, "percentage": 29.8, "elapsed_time": "21:21:13", "remaining_time": "2 days, 2:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2870, "total_steps": 9627, "loss": 1.6383, "learning_rate": 7.962767550388166e-05, "epoch": 0.29811987119559574, "percentage": 29.81, "elapsed_time": "21:21:38", "remaining_time": "2 days, 2:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2871, "total_steps": 9627, "loss": 1.6704, "learning_rate": 7.961453042102014e-05, "epoch": 0.29822374571517607, "percentage": 29.82, "elapsed_time": "21:22:05", "remaining_time": "2 days, 2:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2872, "total_steps": 9627, "loss": 1.8623, "learning_rate": 7.960138218444215e-05, "epoch": 0.2983276202347564, "percentage": 29.83, "elapsed_time": "21:22:30", "remaining_time": "2 days, 2:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2873, "total_steps": 9627, "loss": 1.7932, "learning_rate": 7.958823079554785e-05, "epoch": 0.2984314947543368, "percentage": 29.84, "elapsed_time": "21:22:56", "remaining_time": "2 days, 2:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2874, "total_steps": 9627, "loss": 1.7049, "learning_rate": 7.957507625573776e-05, "epoch": 0.2985353692739171, "percentage": 29.85, "elapsed_time": "21:23:22", "remaining_time": "2 days, 2:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2875, "total_steps": 9627, "loss": 1.682, "learning_rate": 7.956191856641276e-05, "epoch": 0.29863924379349743, "percentage": 29.86, "elapsed_time": "21:23:47", "remaining_time": "2 days, 2:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2876, "total_steps": 9627, "loss": 1.9822, "learning_rate": 7.9548757728974e-05, "epoch": 0.2987431183130778, "percentage": 29.87, "elapsed_time": "21:24:13", "remaining_time": "2 days, 2:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2877, "total_steps": 9627, "loss": 1.8279, "learning_rate": 7.953559374482305e-05, "epoch": 0.29884699283265814, "percentage": 29.88, "elapsed_time": "21:24:38", "remaining_time": "2 days, 2:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2878, "total_steps": 9627, "loss": 1.6634, "learning_rate": 7.952242661536175e-05, "epoch": 0.29895086735223847, "percentage": 29.9, "elapsed_time": "21:25:05", "remaining_time": "2 days, 2:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2879, "total_steps": 9627, "loss": 1.7705, "learning_rate": 7.950925634199228e-05, "epoch": 0.29905474187181885, "percentage": 29.91, "elapsed_time": "21:25:30", "remaining_time": "2 days, 2:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2880, "total_steps": 9627, "loss": 1.7795, "learning_rate": 7.949608292611721e-05, "epoch": 0.2991586163913992, "percentage": 29.92, "elapsed_time": "21:25:56", "remaining_time": "2 days, 2:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2881, "total_steps": 9627, "loss": 1.9119, "learning_rate": 7.948290636913939e-05, "epoch": 0.29926249091097956, "percentage": 29.93, "elapsed_time": "21:26:21", "remaining_time": "2 days, 2:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2882, "total_steps": 9627, "loss": 1.5662, "learning_rate": 7.946972667246201e-05, "epoch": 0.2993663654305599, "percentage": 29.94, "elapsed_time": "21:26:48", "remaining_time": "2 days, 2:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2883, "total_steps": 9627, "loss": 1.5546, "learning_rate": 7.945654383748861e-05, "epoch": 0.2994702399501402, "percentage": 29.95, "elapsed_time": "21:27:13", "remaining_time": "2 days, 2:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2884, "total_steps": 9627, "loss": 1.5994, "learning_rate": 7.944335786562307e-05, "epoch": 0.2995741144697206, "percentage": 29.96, "elapsed_time": "21:27:40", "remaining_time": "2 days, 2:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2885, "total_steps": 9627, "loss": 1.829, "learning_rate": 7.943016875826957e-05, "epoch": 0.2996779889893009, "percentage": 29.97, "elapsed_time": "21:28:05", "remaining_time": "2 days, 2:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2886, "total_steps": 9627, "loss": 1.6141, "learning_rate": 7.941697651683267e-05, "epoch": 0.29978186350888125, "percentage": 29.98, "elapsed_time": "21:28:30", "remaining_time": "2 days, 2:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2887, "total_steps": 9627, "loss": 1.837, "learning_rate": 7.940378114271723e-05, "epoch": 0.29988573802846163, "percentage": 29.99, "elapsed_time": "21:28:57", "remaining_time": "2 days, 2:09:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2888, "total_steps": 9627, "loss": 1.5883, "learning_rate": 7.939058263732846e-05, "epoch": 0.29998961254804196, "percentage": 30.0, "elapsed_time": "21:29:22", "remaining_time": "2 days, 2:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2889, "total_steps": 9627, "loss": 1.7448, "learning_rate": 7.93773810020719e-05, "epoch": 0.3000934870676223, "percentage": 30.01, "elapsed_time": "21:29:47", "remaining_time": "2 days, 2:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2890, "total_steps": 9627, "loss": 1.7747, "learning_rate": 7.93641762383534e-05, "epoch": 0.30019736158720267, "percentage": 30.02, "elapsed_time": "21:30:14", "remaining_time": "2 days, 2:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2891, "total_steps": 9627, "loss": 1.6808, "learning_rate": 7.93509683475792e-05, "epoch": 0.300301236106783, "percentage": 30.03, "elapsed_time": "21:30:40", "remaining_time": "2 days, 2:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2892, "total_steps": 9627, "loss": 1.6966, "learning_rate": 7.93377573311558e-05, "epoch": 0.3004051106263634, "percentage": 30.04, "elapsed_time": "21:31:05", "remaining_time": "2 days, 2:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2893, "total_steps": 9627, "loss": 1.6517, "learning_rate": 7.932454319049008e-05, "epoch": 0.3005089851459437, "percentage": 30.05, "elapsed_time": "21:31:31", "remaining_time": "2 days, 2:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2894, "total_steps": 9627, "loss": 1.5688, "learning_rate": 7.931132592698927e-05, "epoch": 0.30061285966552403, "percentage": 30.06, "elapsed_time": "21:31:56", "remaining_time": "2 days, 2:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2895, "total_steps": 9627, "loss": 1.7309, "learning_rate": 7.929810554206088e-05, "epoch": 0.3007167341851044, "percentage": 30.07, "elapsed_time": "21:32:23", "remaining_time": "2 days, 2:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2896, "total_steps": 9627, "loss": 1.7323, "learning_rate": 7.928488203711279e-05, "epoch": 0.30082060870468474, "percentage": 30.08, "elapsed_time": "21:32:48", "remaining_time": "2 days, 2:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2897, "total_steps": 9627, "loss": 1.6411, "learning_rate": 7.927165541355319e-05, "epoch": 0.30092448322426507, "percentage": 30.09, "elapsed_time": "21:33:13", "remaining_time": "2 days, 2:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2898, "total_steps": 9627, "loss": 1.6233, "learning_rate": 7.92584256727906e-05, "epoch": 0.30102835774384545, "percentage": 30.1, "elapsed_time": "21:33:40", "remaining_time": "2 days, 2:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2899, "total_steps": 9627, "loss": 1.8847, "learning_rate": 7.924519281623393e-05, "epoch": 0.3011322322634258, "percentage": 30.11, "elapsed_time": "21:34:05", "remaining_time": "2 days, 2:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 9627, "loss": 1.6344, "learning_rate": 7.923195684529232e-05, "epoch": 0.3012361067830061, "percentage": 30.12, "elapsed_time": "21:34:30", "remaining_time": "2 days, 2:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2901, "total_steps": 9627, "loss": 1.9062, "learning_rate": 7.921871776137533e-05, "epoch": 0.3013399813025865, "percentage": 30.13, "elapsed_time": "21:34:57", "remaining_time": "2 days, 2:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2902, "total_steps": 9627, "loss": 1.8971, "learning_rate": 7.920547556589282e-05, "epoch": 0.3014438558221668, "percentage": 30.14, "elapsed_time": "21:35:22", "remaining_time": "2 days, 2:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2903, "total_steps": 9627, "loss": 1.7381, "learning_rate": 7.919223026025498e-05, "epoch": 0.30154773034174714, "percentage": 30.15, "elapsed_time": "21:35:47", "remaining_time": "2 days, 2:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2904, "total_steps": 9627, "loss": 1.8914, "learning_rate": 7.917898184587231e-05, "epoch": 0.3016516048613275, "percentage": 30.17, "elapsed_time": "21:36:14", "remaining_time": "2 days, 2:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2905, "total_steps": 9627, "loss": 1.8567, "learning_rate": 7.916573032415569e-05, "epoch": 0.30175547938090785, "percentage": 30.18, "elapsed_time": "21:36:39", "remaining_time": "2 days, 2:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2906, "total_steps": 9627, "loss": 1.5998, "learning_rate": 7.915247569651627e-05, "epoch": 0.30185935390048824, "percentage": 30.19, "elapsed_time": "21:37:05", "remaining_time": "2 days, 1:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2907, "total_steps": 9627, "loss": 1.5639, "learning_rate": 7.913921796436561e-05, "epoch": 0.30196322842006856, "percentage": 30.2, "elapsed_time": "21:37:31", "remaining_time": "2 days, 1:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2908, "total_steps": 9627, "loss": 1.7428, "learning_rate": 7.912595712911552e-05, "epoch": 0.3020671029396489, "percentage": 30.21, "elapsed_time": "21:37:56", "remaining_time": "2 days, 1:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2909, "total_steps": 9627, "loss": 1.7877, "learning_rate": 7.91126931921782e-05, "epoch": 0.3021709774592293, "percentage": 30.22, "elapsed_time": "21:38:22", "remaining_time": "2 days, 1:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2910, "total_steps": 9627, "loss": 1.8667, "learning_rate": 7.909942615496613e-05, "epoch": 0.3022748519788096, "percentage": 30.23, "elapsed_time": "21:38:48", "remaining_time": "2 days, 1:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2911, "total_steps": 9627, "loss": 1.6627, "learning_rate": 7.908615601889218e-05, "epoch": 0.3023787264983899, "percentage": 30.24, "elapsed_time": "21:39:14", "remaining_time": "2 days, 1:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2912, "total_steps": 9627, "loss": 1.6026, "learning_rate": 7.907288278536947e-05, "epoch": 0.3024826010179703, "percentage": 30.25, "elapsed_time": "21:39:40", "remaining_time": "2 days, 1:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2913, "total_steps": 9627, "loss": 1.7998, "learning_rate": 7.905960645581152e-05, "epoch": 0.30258647553755064, "percentage": 30.26, "elapsed_time": "21:40:05", "remaining_time": "2 days, 1:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2914, "total_steps": 9627, "loss": 1.6253, "learning_rate": 7.904632703163218e-05, "epoch": 0.30269035005713096, "percentage": 30.27, "elapsed_time": "21:40:32", "remaining_time": "2 days, 1:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2915, "total_steps": 9627, "loss": 1.7304, "learning_rate": 7.903304451424556e-05, "epoch": 0.30279422457671135, "percentage": 30.28, "elapsed_time": "21:40:57", "remaining_time": "2 days, 1:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2916, "total_steps": 9627, "loss": 1.7403, "learning_rate": 7.901975890506616e-05, "epoch": 0.3028980990962917, "percentage": 30.29, "elapsed_time": "21:41:22", "remaining_time": "2 days, 1:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2917, "total_steps": 9627, "loss": 1.7706, "learning_rate": 7.900647020550882e-05, "epoch": 0.303001973615872, "percentage": 30.3, "elapsed_time": "21:41:48", "remaining_time": "2 days, 1:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2918, "total_steps": 9627, "loss": 1.7351, "learning_rate": 7.899317841698864e-05, "epoch": 0.3031058481354524, "percentage": 30.31, "elapsed_time": "21:42:15", "remaining_time": "2 days, 1:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2919, "total_steps": 9627, "loss": 1.8509, "learning_rate": 7.897988354092113e-05, "epoch": 0.3032097226550327, "percentage": 30.32, "elapsed_time": "21:42:40", "remaining_time": "2 days, 1:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2920, "total_steps": 9627, "loss": 1.6496, "learning_rate": 7.896658557872207e-05, "epoch": 0.3033135971746131, "percentage": 30.33, "elapsed_time": "21:43:07", "remaining_time": "2 days, 1:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2921, "total_steps": 9627, "loss": 1.4942, "learning_rate": 7.89532845318076e-05, "epoch": 0.3034174716941934, "percentage": 30.34, "elapsed_time": "21:43:32", "remaining_time": "2 days, 1:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2922, "total_steps": 9627, "loss": 1.5979, "learning_rate": 7.893998040159418e-05, "epoch": 0.30352134621377375, "percentage": 30.35, "elapsed_time": "21:43:58", "remaining_time": "2 days, 1:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2923, "total_steps": 9627, "loss": 1.5617, "learning_rate": 7.892667318949855e-05, "epoch": 0.30362522073335413, "percentage": 30.36, "elapsed_time": "21:44:23", "remaining_time": "2 days, 1:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2924, "total_steps": 9627, "loss": 1.6198, "learning_rate": 7.891336289693789e-05, "epoch": 0.30372909525293446, "percentage": 30.37, "elapsed_time": "21:44:50", "remaining_time": "2 days, 1:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2925, "total_steps": 9627, "loss": 1.7494, "learning_rate": 7.890004952532962e-05, "epoch": 0.3038329697725148, "percentage": 30.38, "elapsed_time": "21:45:16", "remaining_time": "2 days, 1:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2926, "total_steps": 9627, "loss": 1.5492, "learning_rate": 7.888673307609149e-05, "epoch": 0.30393684429209517, "percentage": 30.39, "elapsed_time": "21:45:41", "remaining_time": "2 days, 1:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2927, "total_steps": 9627, "loss": 1.6222, "learning_rate": 7.887341355064162e-05, "epoch": 0.3040407188116755, "percentage": 30.4, "elapsed_time": "21:46:07", "remaining_time": "2 days, 1:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2928, "total_steps": 9627, "loss": 1.8504, "learning_rate": 7.886009095039843e-05, "epoch": 0.3041445933312558, "percentage": 30.41, "elapsed_time": "21:46:32", "remaining_time": "2 days, 1:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2929, "total_steps": 9627, "loss": 2.1015, "learning_rate": 7.884676527678068e-05, "epoch": 0.3042484678508362, "percentage": 30.42, "elapsed_time": "21:46:58", "remaining_time": "2 days, 1:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2930, "total_steps": 9627, "loss": 1.6364, "learning_rate": 7.883343653120743e-05, "epoch": 0.30435234237041653, "percentage": 30.44, "elapsed_time": "21:47:24", "remaining_time": "2 days, 1:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2931, "total_steps": 9627, "loss": 1.5827, "learning_rate": 7.882010471509809e-05, "epoch": 0.3044562168899969, "percentage": 30.45, "elapsed_time": "21:47:50", "remaining_time": "2 days, 1:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2932, "total_steps": 9627, "loss": 1.9797, "learning_rate": 7.88067698298724e-05, "epoch": 0.30456009140957724, "percentage": 30.46, "elapsed_time": "21:48:15", "remaining_time": "2 days, 1:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2933, "total_steps": 9627, "loss": 1.7037, "learning_rate": 7.879343187695045e-05, "epoch": 0.30466396592915757, "percentage": 30.47, "elapsed_time": "21:48:41", "remaining_time": "2 days, 1:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2934, "total_steps": 9627, "loss": 1.7411, "learning_rate": 7.878009085775257e-05, "epoch": 0.30476784044873795, "percentage": 30.48, "elapsed_time": "21:49:08", "remaining_time": "2 days, 1:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2935, "total_steps": 9627, "loss": 1.7444, "learning_rate": 7.876674677369954e-05, "epoch": 0.3048717149683183, "percentage": 30.49, "elapsed_time": "21:49:33", "remaining_time": "2 days, 1:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2936, "total_steps": 9627, "loss": 1.8388, "learning_rate": 7.875339962621235e-05, "epoch": 0.3049755894878986, "percentage": 30.5, "elapsed_time": "21:50:00", "remaining_time": "2 days, 1:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2937, "total_steps": 9627, "loss": 1.7877, "learning_rate": 7.874004941671239e-05, "epoch": 0.305079464007479, "percentage": 30.51, "elapsed_time": "21:50:25", "remaining_time": "2 days, 1:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2938, "total_steps": 9627, "loss": 1.7491, "learning_rate": 7.872669614662135e-05, "epoch": 0.3051833385270593, "percentage": 30.52, "elapsed_time": "21:50:51", "remaining_time": "2 days, 1:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2939, "total_steps": 9627, "loss": 1.7892, "learning_rate": 7.871333981736124e-05, "epoch": 0.30528721304663964, "percentage": 30.53, "elapsed_time": "21:51:18", "remaining_time": "2 days, 1:44:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2940, "total_steps": 9627, "loss": 1.7247, "learning_rate": 7.869998043035442e-05, "epoch": 0.30539108756622, "percentage": 30.54, "elapsed_time": "21:51:43", "remaining_time": "2 days, 1:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2941, "total_steps": 9627, "loss": 1.767, "learning_rate": 7.868661798702355e-05, "epoch": 0.30549496208580035, "percentage": 30.55, "elapsed_time": "21:52:09", "remaining_time": "2 days, 1:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2942, "total_steps": 9627, "loss": 1.6133, "learning_rate": 7.867325248879163e-05, "epoch": 0.3055988366053807, "percentage": 30.56, "elapsed_time": "21:52:35", "remaining_time": "2 days, 1:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2943, "total_steps": 9627, "loss": 1.6876, "learning_rate": 7.865988393708197e-05, "epoch": 0.30570271112496106, "percentage": 30.57, "elapsed_time": "21:53:01", "remaining_time": "2 days, 1:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2944, "total_steps": 9627, "loss": 1.7866, "learning_rate": 7.864651233331823e-05, "epoch": 0.3058065856445414, "percentage": 30.58, "elapsed_time": "21:53:26", "remaining_time": "2 days, 1:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2945, "total_steps": 9627, "loss": 1.5605, "learning_rate": 7.863313767892438e-05, "epoch": 0.30591046016412177, "percentage": 30.59, "elapsed_time": "21:53:53", "remaining_time": "2 days, 1:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2946, "total_steps": 9627, "loss": 1.8965, "learning_rate": 7.861975997532471e-05, "epoch": 0.3060143346837021, "percentage": 30.6, "elapsed_time": "21:54:18", "remaining_time": "2 days, 1:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2947, "total_steps": 9627, "loss": 1.8668, "learning_rate": 7.860637922394387e-05, "epoch": 0.3061182092032824, "percentage": 30.61, "elapsed_time": "21:54:45", "remaining_time": "2 days, 1:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2948, "total_steps": 9627, "loss": 1.8258, "learning_rate": 7.859299542620675e-05, "epoch": 0.3062220837228628, "percentage": 30.62, "elapsed_time": "21:55:11", "remaining_time": "2 days, 1:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2949, "total_steps": 9627, "loss": 1.8309, "learning_rate": 7.857960858353866e-05, "epoch": 0.30632595824244313, "percentage": 30.63, "elapsed_time": "21:55:37", "remaining_time": "2 days, 1:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 9627, "loss": 1.7936, "learning_rate": 7.85662186973652e-05, "epoch": 0.30642983276202346, "percentage": 30.64, "elapsed_time": "21:56:02", "remaining_time": "2 days, 1:38:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2951, "total_steps": 9627, "loss": 1.7259, "learning_rate": 7.855282576911224e-05, "epoch": 0.30653370728160384, "percentage": 30.65, "elapsed_time": "21:56:29", "remaining_time": "2 days, 1:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2952, "total_steps": 9627, "loss": 1.7949, "learning_rate": 7.85394298002061e-05, "epoch": 0.30663758180118417, "percentage": 30.66, "elapsed_time": "21:56:55", "remaining_time": "2 days, 1:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2953, "total_steps": 9627, "loss": 1.6679, "learning_rate": 7.852603079207328e-05, "epoch": 0.3067414563207645, "percentage": 30.67, "elapsed_time": "21:57:20", "remaining_time": "2 days, 1:37:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2954, "total_steps": 9627, "loss": 1.6965, "learning_rate": 7.851262874614069e-05, "epoch": 0.3068453308403449, "percentage": 30.68, "elapsed_time": "21:57:46", "remaining_time": "2 days, 1:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2955, "total_steps": 9627, "loss": 1.6044, "learning_rate": 7.849922366383555e-05, "epoch": 0.3069492053599252, "percentage": 30.69, "elapsed_time": "21:58:12", "remaining_time": "2 days, 1:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2956, "total_steps": 9627, "loss": 2.1448, "learning_rate": 7.848581554658539e-05, "epoch": 0.30705307987950553, "percentage": 30.71, "elapsed_time": "21:58:39", "remaining_time": "2 days, 1:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2957, "total_steps": 9627, "loss": 1.7972, "learning_rate": 7.847240439581806e-05, "epoch": 0.3071569543990859, "percentage": 30.72, "elapsed_time": "21:59:04", "remaining_time": "2 days, 1:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2958, "total_steps": 9627, "loss": 1.732, "learning_rate": 7.845899021296178e-05, "epoch": 0.30726082891866624, "percentage": 30.73, "elapsed_time": "21:59:30", "remaining_time": "2 days, 1:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2959, "total_steps": 9627, "loss": 1.7266, "learning_rate": 7.844557299944501e-05, "epoch": 0.3073647034382466, "percentage": 30.74, "elapsed_time": "21:59:56", "remaining_time": "2 days, 1:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2960, "total_steps": 9627, "loss": 1.7042, "learning_rate": 7.843215275669663e-05, "epoch": 0.30746857795782695, "percentage": 30.75, "elapsed_time": "22:00:21", "remaining_time": "2 days, 1:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2961, "total_steps": 9627, "loss": 1.7086, "learning_rate": 7.841872948614573e-05, "epoch": 0.3075724524774073, "percentage": 30.76, "elapsed_time": "22:00:48", "remaining_time": "2 days, 1:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2962, "total_steps": 9627, "loss": 1.7215, "learning_rate": 7.840530318922181e-05, "epoch": 0.30767632699698766, "percentage": 30.77, "elapsed_time": "22:01:13", "remaining_time": "2 days, 1:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2963, "total_steps": 9627, "loss": 1.7995, "learning_rate": 7.839187386735469e-05, "epoch": 0.307780201516568, "percentage": 30.78, "elapsed_time": "22:01:38", "remaining_time": "2 days, 1:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2964, "total_steps": 9627, "loss": 1.7028, "learning_rate": 7.837844152197447e-05, "epoch": 0.3078840760361483, "percentage": 30.79, "elapsed_time": "22:02:06", "remaining_time": "2 days, 1:32:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2965, "total_steps": 9627, "loss": 1.4274, "learning_rate": 7.836500615451156e-05, "epoch": 0.3079879505557287, "percentage": 30.8, "elapsed_time": "22:02:31", "remaining_time": "2 days, 1:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2966, "total_steps": 9627, "loss": 1.5747, "learning_rate": 7.835156776639679e-05, "epoch": 0.308091825075309, "percentage": 30.81, "elapsed_time": "22:02:58", "remaining_time": "2 days, 1:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2967, "total_steps": 9627, "loss": 1.6061, "learning_rate": 7.833812635906118e-05, "epoch": 0.30819569959488935, "percentage": 30.82, "elapsed_time": "22:03:23", "remaining_time": "2 days, 1:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2968, "total_steps": 9627, "loss": 1.8704, "learning_rate": 7.832468193393616e-05, "epoch": 0.30829957411446973, "percentage": 30.83, "elapsed_time": "22:03:50", "remaining_time": "2 days, 1:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2969, "total_steps": 9627, "loss": 1.7132, "learning_rate": 7.831123449245345e-05, "epoch": 0.30840344863405006, "percentage": 30.84, "elapsed_time": "22:04:15", "remaining_time": "2 days, 1:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2970, "total_steps": 9627, "loss": 1.8511, "learning_rate": 7.829778403604513e-05, "epoch": 0.30850732315363044, "percentage": 30.85, "elapsed_time": "22:04:41", "remaining_time": "2 days, 1:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2971, "total_steps": 9627, "loss": 1.8369, "learning_rate": 7.828433056614351e-05, "epoch": 0.30861119767321077, "percentage": 30.86, "elapsed_time": "22:05:06", "remaining_time": "2 days, 1:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2972, "total_steps": 9627, "loss": 1.7907, "learning_rate": 7.827087408418132e-05, "epoch": 0.3087150721927911, "percentage": 30.87, "elapsed_time": "22:05:33", "remaining_time": "2 days, 1:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2973, "total_steps": 9627, "loss": 1.7639, "learning_rate": 7.825741459159157e-05, "epoch": 0.3088189467123715, "percentage": 30.88, "elapsed_time": "22:05:59", "remaining_time": "2 days, 1:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2974, "total_steps": 9627, "loss": 1.7871, "learning_rate": 7.824395208980758e-05, "epoch": 0.3089228212319518, "percentage": 30.89, "elapsed_time": "22:06:25", "remaining_time": "2 days, 1:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2975, "total_steps": 9627, "loss": 1.988, "learning_rate": 7.8230486580263e-05, "epoch": 0.30902669575153213, "percentage": 30.9, "elapsed_time": "22:06:51", "remaining_time": "2 days, 1:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2976, "total_steps": 9627, "loss": 1.812, "learning_rate": 7.821701806439179e-05, "epoch": 0.3091305702711125, "percentage": 30.91, "elapsed_time": "22:07:17", "remaining_time": "2 days, 1:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2977, "total_steps": 9627, "loss": 1.7231, "learning_rate": 7.820354654362828e-05, "epoch": 0.30923444479069284, "percentage": 30.92, "elapsed_time": "22:07:43", "remaining_time": "2 days, 1:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2978, "total_steps": 9627, "loss": 1.7493, "learning_rate": 7.819007201940706e-05, "epoch": 0.30933831931027317, "percentage": 30.93, "elapsed_time": "22:08:09", "remaining_time": "2 days, 1:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2979, "total_steps": 9627, "loss": 1.621, "learning_rate": 7.817659449316305e-05, "epoch": 0.30944219382985355, "percentage": 30.94, "elapsed_time": "22:08:35", "remaining_time": "2 days, 1:24:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2980, "total_steps": 9627, "loss": 1.7622, "learning_rate": 7.816311396633152e-05, "epoch": 0.3095460683494339, "percentage": 30.95, "elapsed_time": "22:09:01", "remaining_time": "2 days, 1:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2981, "total_steps": 9627, "loss": 1.615, "learning_rate": 7.814963044034802e-05, "epoch": 0.3096499428690142, "percentage": 30.96, "elapsed_time": "22:09:27", "remaining_time": "2 days, 1:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2982, "total_steps": 9627, "loss": 1.9264, "learning_rate": 7.813614391664847e-05, "epoch": 0.3097538173885946, "percentage": 30.98, "elapsed_time": "22:09:52", "remaining_time": "2 days, 1:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2983, "total_steps": 9627, "loss": 1.6321, "learning_rate": 7.812265439666906e-05, "epoch": 0.3098576919081749, "percentage": 30.99, "elapsed_time": "22:10:18", "remaining_time": "2 days, 1:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2984, "total_steps": 9627, "loss": 1.902, "learning_rate": 7.81091618818463e-05, "epoch": 0.3099615664277553, "percentage": 31.0, "elapsed_time": "22:10:45", "remaining_time": "2 days, 1:22:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2985, "total_steps": 9627, "loss": 1.8288, "learning_rate": 7.80956663736171e-05, "epoch": 0.3100654409473356, "percentage": 31.01, "elapsed_time": "22:11:10", "remaining_time": "2 days, 1:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2986, "total_steps": 9627, "loss": 1.7853, "learning_rate": 7.808216787341855e-05, "epoch": 0.31016931546691595, "percentage": 31.02, "elapsed_time": "22:11:36", "remaining_time": "2 days, 1:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2987, "total_steps": 9627, "loss": 1.702, "learning_rate": 7.806866638268818e-05, "epoch": 0.31027318998649633, "percentage": 31.03, "elapsed_time": "22:12:03", "remaining_time": "2 days, 1:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2988, "total_steps": 9627, "loss": 1.7776, "learning_rate": 7.80551619028638e-05, "epoch": 0.31037706450607666, "percentage": 31.04, "elapsed_time": "22:12:28", "remaining_time": "2 days, 1:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2989, "total_steps": 9627, "loss": 1.6451, "learning_rate": 7.80416544353835e-05, "epoch": 0.310480939025657, "percentage": 31.05, "elapsed_time": "22:12:55", "remaining_time": "2 days, 1:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2990, "total_steps": 9627, "loss": 1.8862, "learning_rate": 7.802814398168572e-05, "epoch": 0.31058481354523737, "percentage": 31.06, "elapsed_time": "22:13:20", "remaining_time": "2 days, 1:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2991, "total_steps": 9627, "loss": 1.7783, "learning_rate": 7.801463054320927e-05, "epoch": 0.3106886880648177, "percentage": 31.07, "elapsed_time": "22:13:47", "remaining_time": "2 days, 1:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2992, "total_steps": 9627, "loss": 1.654, "learning_rate": 7.800111412139318e-05, "epoch": 0.310792562584398, "percentage": 31.08, "elapsed_time": "22:14:12", "remaining_time": "2 days, 1:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2993, "total_steps": 9627, "loss": 1.7425, "learning_rate": 7.798759471767684e-05, "epoch": 0.3108964371039784, "percentage": 31.09, "elapsed_time": "22:14:39", "remaining_time": "2 days, 1:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2994, "total_steps": 9627, "loss": 1.7184, "learning_rate": 7.797407233349998e-05, "epoch": 0.31100031162355873, "percentage": 31.1, "elapsed_time": "22:15:04", "remaining_time": "2 days, 1:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2995, "total_steps": 9627, "loss": 1.5123, "learning_rate": 7.796054697030262e-05, "epoch": 0.31110418614313906, "percentage": 31.11, "elapsed_time": "22:15:31", "remaining_time": "2 days, 1:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2996, "total_steps": 9627, "loss": 1.7482, "learning_rate": 7.794701862952512e-05, "epoch": 0.31120806066271944, "percentage": 31.12, "elapsed_time": "22:15:57", "remaining_time": "2 days, 1:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2997, "total_steps": 9627, "loss": 1.8343, "learning_rate": 7.793348731260813e-05, "epoch": 0.31131193518229977, "percentage": 31.13, "elapsed_time": "22:16:23", "remaining_time": "2 days, 1:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2998, "total_steps": 9627, "loss": 1.655, "learning_rate": 7.79199530209926e-05, "epoch": 0.31141580970188015, "percentage": 31.14, "elapsed_time": "22:16:49", "remaining_time": "2 days, 1:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2999, "total_steps": 9627, "loss": 1.7954, "learning_rate": 7.79064157561199e-05, "epoch": 0.3115196842214605, "percentage": 31.15, "elapsed_time": "22:17:15", "remaining_time": "2 days, 1:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 9627, "loss": 1.5854, "learning_rate": 7.789287551943158e-05, "epoch": 0.3116235587410408, "percentage": 31.16, "elapsed_time": "22:17:41", "remaining_time": "2 days, 1:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3001, "total_steps": 9627, "loss": 1.6898, "learning_rate": 7.787933231236958e-05, "epoch": 0.3117274332606212, "percentage": 31.17, "elapsed_time": "22:18:08", "remaining_time": "2 days, 1:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3002, "total_steps": 9627, "loss": 1.6463, "learning_rate": 7.786578613637617e-05, "epoch": 0.3118313077802015, "percentage": 31.18, "elapsed_time": "22:18:34", "remaining_time": "2 days, 1:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3003, "total_steps": 9627, "loss": 1.951, "learning_rate": 7.78522369928939e-05, "epoch": 0.31193518229978184, "percentage": 31.19, "elapsed_time": "22:19:00", "remaining_time": "2 days, 1:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3004, "total_steps": 9627, "loss": 1.6597, "learning_rate": 7.783868488336563e-05, "epoch": 0.3120390568193622, "percentage": 31.2, "elapsed_time": "22:19:25", "remaining_time": "2 days, 1:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3005, "total_steps": 9627, "loss": 1.8036, "learning_rate": 7.782512980923459e-05, "epoch": 0.31214293133894255, "percentage": 31.21, "elapsed_time": "22:19:52", "remaining_time": "2 days, 1:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3006, "total_steps": 9627, "loss": 1.6382, "learning_rate": 7.781157177194426e-05, "epoch": 0.3122468058585229, "percentage": 31.22, "elapsed_time": "22:20:17", "remaining_time": "2 days, 1:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3007, "total_steps": 9627, "loss": 1.7521, "learning_rate": 7.779801077293847e-05, "epoch": 0.31235068037810326, "percentage": 31.24, "elapsed_time": "22:20:44", "remaining_time": "2 days, 1:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3008, "total_steps": 9627, "loss": 1.7019, "learning_rate": 7.778444681366137e-05, "epoch": 0.3124545548976836, "percentage": 31.25, "elapsed_time": "22:21:10", "remaining_time": "2 days, 1:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3009, "total_steps": 9627, "loss": 1.7686, "learning_rate": 7.777087989555741e-05, "epoch": 0.31255842941726397, "percentage": 31.26, "elapsed_time": "22:21:36", "remaining_time": "2 days, 1:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3010, "total_steps": 9627, "loss": 1.5242, "learning_rate": 7.775731002007138e-05, "epoch": 0.3126623039368443, "percentage": 31.27, "elapsed_time": "22:22:01", "remaining_time": "2 days, 1:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3011, "total_steps": 9627, "loss": 1.771, "learning_rate": 7.774373718864833e-05, "epoch": 0.3127661784564246, "percentage": 31.28, "elapsed_time": "22:22:28", "remaining_time": "2 days, 1:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3012, "total_steps": 9627, "loss": 1.8089, "learning_rate": 7.773016140273368e-05, "epoch": 0.312870052976005, "percentage": 31.29, "elapsed_time": "22:22:53", "remaining_time": "2 days, 1:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3013, "total_steps": 9627, "loss": 1.6336, "learning_rate": 7.771658266377315e-05, "epoch": 0.31297392749558534, "percentage": 31.3, "elapsed_time": "22:23:20", "remaining_time": "2 days, 1:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3014, "total_steps": 9627, "loss": 1.4883, "learning_rate": 7.770300097321276e-05, "epoch": 0.31307780201516566, "percentage": 31.31, "elapsed_time": "22:23:45", "remaining_time": "2 days, 1:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3015, "total_steps": 9627, "loss": 1.8948, "learning_rate": 7.768941633249884e-05, "epoch": 0.31318167653474605, "percentage": 31.32, "elapsed_time": "22:24:11", "remaining_time": "2 days, 1:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3016, "total_steps": 9627, "loss": 1.702, "learning_rate": 7.76758287430781e-05, "epoch": 0.31328555105432637, "percentage": 31.33, "elapsed_time": "22:24:38", "remaining_time": "2 days, 1:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3017, "total_steps": 9627, "loss": 1.687, "learning_rate": 7.766223820639747e-05, "epoch": 0.3133894255739067, "percentage": 31.34, "elapsed_time": "22:25:04", "remaining_time": "2 days, 1:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3018, "total_steps": 9627, "loss": 1.7333, "learning_rate": 7.764864472390423e-05, "epoch": 0.3134933000934871, "percentage": 31.35, "elapsed_time": "22:25:30", "remaining_time": "2 days, 1:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3019, "total_steps": 9627, "loss": 1.6883, "learning_rate": 7.7635048297046e-05, "epoch": 0.3135971746130674, "percentage": 31.36, "elapsed_time": "22:25:56", "remaining_time": "2 days, 1:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3020, "total_steps": 9627, "loss": 1.9121, "learning_rate": 7.762144892727069e-05, "epoch": 0.31370104913264774, "percentage": 31.37, "elapsed_time": "22:26:22", "remaining_time": "2 days, 1:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3021, "total_steps": 9627, "loss": 1.8525, "learning_rate": 7.760784661602653e-05, "epoch": 0.3138049236522281, "percentage": 31.38, "elapsed_time": "22:26:48", "remaining_time": "2 days, 1:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3022, "total_steps": 9627, "loss": 1.529, "learning_rate": 7.759424136476206e-05, "epoch": 0.31390879817180845, "percentage": 31.39, "elapsed_time": "22:27:15", "remaining_time": "2 days, 1:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3023, "total_steps": 9627, "loss": 1.8153, "learning_rate": 7.75806331749261e-05, "epoch": 0.31401267269138883, "percentage": 31.4, "elapsed_time": "22:27:40", "remaining_time": "2 days, 1:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3024, "total_steps": 9627, "loss": 1.6807, "learning_rate": 7.756702204796786e-05, "epoch": 0.31411654721096915, "percentage": 31.41, "elapsed_time": "22:28:05", "remaining_time": "2 days, 1:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3025, "total_steps": 9627, "loss": 1.8526, "learning_rate": 7.75534079853368e-05, "epoch": 0.3142204217305495, "percentage": 31.42, "elapsed_time": "22:28:33", "remaining_time": "2 days, 1:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3026, "total_steps": 9627, "loss": 1.6186, "learning_rate": 7.753979098848272e-05, "epoch": 0.31432429625012986, "percentage": 31.43, "elapsed_time": "22:28:58", "remaining_time": "2 days, 1:02:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3027, "total_steps": 9627, "loss": 1.6896, "learning_rate": 7.752617105885574e-05, "epoch": 0.3144281707697102, "percentage": 31.44, "elapsed_time": "22:29:25", "remaining_time": "2 days, 1:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3028, "total_steps": 9627, "loss": 1.719, "learning_rate": 7.751254819790623e-05, "epoch": 0.3145320452892905, "percentage": 31.45, "elapsed_time": "22:29:50", "remaining_time": "2 days, 1:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3029, "total_steps": 9627, "loss": 1.7155, "learning_rate": 7.749892240708494e-05, "epoch": 0.3146359198088709, "percentage": 31.46, "elapsed_time": "22:30:16", "remaining_time": "2 days, 1:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3030, "total_steps": 9627, "loss": 1.8792, "learning_rate": 7.748529368784292e-05, "epoch": 0.31473979432845123, "percentage": 31.47, "elapsed_time": "22:30:42", "remaining_time": "2 days, 1:00:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3031, "total_steps": 9627, "loss": 1.8348, "learning_rate": 7.747166204163152e-05, "epoch": 0.31484366884803155, "percentage": 31.48, "elapsed_time": "22:31:08", "remaining_time": "2 days, 1:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3032, "total_steps": 9627, "loss": 1.7037, "learning_rate": 7.745802746990239e-05, "epoch": 0.31494754336761194, "percentage": 31.49, "elapsed_time": "22:31:35", "remaining_time": "2 days, 0:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3033, "total_steps": 9627, "loss": 1.6523, "learning_rate": 7.744438997410752e-05, "epoch": 0.31505141788719226, "percentage": 31.51, "elapsed_time": "22:32:00", "remaining_time": "2 days, 0:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3034, "total_steps": 9627, "loss": 1.705, "learning_rate": 7.74307495556992e-05, "epoch": 0.3151552924067726, "percentage": 31.52, "elapsed_time": "22:32:26", "remaining_time": "2 days, 0:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3035, "total_steps": 9627, "loss": 1.9339, "learning_rate": 7.741710621613002e-05, "epoch": 0.315259166926353, "percentage": 31.53, "elapsed_time": "22:32:53", "remaining_time": "2 days, 0:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3036, "total_steps": 9627, "loss": 1.8712, "learning_rate": 7.740345995685287e-05, "epoch": 0.3153630414459333, "percentage": 31.54, "elapsed_time": "22:33:18", "remaining_time": "2 days, 0:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3037, "total_steps": 9627, "loss": 1.8456, "learning_rate": 7.738981077932099e-05, "epoch": 0.3154669159655137, "percentage": 31.55, "elapsed_time": "22:33:45", "remaining_time": "2 days, 0:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3038, "total_steps": 9627, "loss": 1.7126, "learning_rate": 7.737615868498793e-05, "epoch": 0.315570790485094, "percentage": 31.56, "elapsed_time": "22:34:10", "remaining_time": "2 days, 0:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3039, "total_steps": 9627, "loss": 1.6292, "learning_rate": 7.736250367530751e-05, "epoch": 0.31567466500467434, "percentage": 31.57, "elapsed_time": "22:34:37", "remaining_time": "2 days, 0:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3040, "total_steps": 9627, "loss": 1.7703, "learning_rate": 7.734884575173387e-05, "epoch": 0.3157785395242547, "percentage": 31.58, "elapsed_time": "22:35:03", "remaining_time": "2 days, 0:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3041, "total_steps": 9627, "loss": 1.7719, "learning_rate": 7.73351849157215e-05, "epoch": 0.31588241404383505, "percentage": 31.59, "elapsed_time": "22:35:29", "remaining_time": "2 days, 0:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3042, "total_steps": 9627, "loss": 1.6538, "learning_rate": 7.732152116872515e-05, "epoch": 0.3159862885634154, "percentage": 31.6, "elapsed_time": "22:35:55", "remaining_time": "2 days, 0:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3043, "total_steps": 9627, "loss": 1.755, "learning_rate": 7.730785451219991e-05, "epoch": 0.31609016308299576, "percentage": 31.61, "elapsed_time": "22:36:21", "remaining_time": "2 days, 0:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3044, "total_steps": 9627, "loss": 1.5637, "learning_rate": 7.729418494760119e-05, "epoch": 0.3161940376025761, "percentage": 31.62, "elapsed_time": "22:36:47", "remaining_time": "2 days, 0:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3045, "total_steps": 9627, "loss": 1.5991, "learning_rate": 7.728051247638468e-05, "epoch": 0.3162979121221564, "percentage": 31.63, "elapsed_time": "22:37:13", "remaining_time": "2 days, 0:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3046, "total_steps": 9627, "loss": 1.7331, "learning_rate": 7.726683710000637e-05, "epoch": 0.3164017866417368, "percentage": 31.64, "elapsed_time": "22:37:39", "remaining_time": "2 days, 0:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3047, "total_steps": 9627, "loss": 1.8179, "learning_rate": 7.72531588199226e-05, "epoch": 0.3165056611613171, "percentage": 31.65, "elapsed_time": "22:38:05", "remaining_time": "2 days, 0:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3048, "total_steps": 9627, "loss": 1.7464, "learning_rate": 7.723947763759e-05, "epoch": 0.3166095356808975, "percentage": 31.66, "elapsed_time": "22:38:31", "remaining_time": "2 days, 0:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3049, "total_steps": 9627, "loss": 1.5823, "learning_rate": 7.722579355446551e-05, "epoch": 0.31671341020047783, "percentage": 31.67, "elapsed_time": "22:38:57", "remaining_time": "2 days, 0:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 9627, "loss": 1.7697, "learning_rate": 7.721210657200637e-05, "epoch": 0.31681728472005816, "percentage": 31.68, "elapsed_time": "22:39:24", "remaining_time": "2 days, 0:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3051, "total_steps": 9627, "loss": 1.6861, "learning_rate": 7.719841669167014e-05, "epoch": 0.31692115923963854, "percentage": 31.69, "elapsed_time": "22:39:50", "remaining_time": "2 days, 0:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3052, "total_steps": 9627, "loss": 1.9079, "learning_rate": 7.71847239149147e-05, "epoch": 0.31702503375921887, "percentage": 31.7, "elapsed_time": "22:40:16", "remaining_time": "2 days, 0:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3053, "total_steps": 9627, "loss": 1.8736, "learning_rate": 7.717102824319822e-05, "epoch": 0.3171289082787992, "percentage": 31.71, "elapsed_time": "22:40:42", "remaining_time": "2 days, 0:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3054, "total_steps": 9627, "loss": 1.7298, "learning_rate": 7.715732967797915e-05, "epoch": 0.3172327827983796, "percentage": 31.72, "elapsed_time": "22:41:07", "remaining_time": "2 days, 0:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3055, "total_steps": 9627, "loss": 1.8096, "learning_rate": 7.714362822071632e-05, "epoch": 0.3173366573179599, "percentage": 31.73, "elapsed_time": "22:41:33", "remaining_time": "2 days, 0:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3056, "total_steps": 9627, "loss": 1.5215, "learning_rate": 7.712992387286882e-05, "epoch": 0.31744053183754023, "percentage": 31.74, "elapsed_time": "22:41:59", "remaining_time": "2 days, 0:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3057, "total_steps": 9627, "loss": 1.6497, "learning_rate": 7.711621663589602e-05, "epoch": 0.3175444063571206, "percentage": 31.75, "elapsed_time": "22:42:26", "remaining_time": "2 days, 0:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3058, "total_steps": 9627, "loss": 1.6053, "learning_rate": 7.71025065112577e-05, "epoch": 0.31764828087670094, "percentage": 31.76, "elapsed_time": "22:42:52", "remaining_time": "2 days, 0:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3059, "total_steps": 9627, "loss": 1.6968, "learning_rate": 7.708879350041383e-05, "epoch": 0.31775215539628127, "percentage": 31.78, "elapsed_time": "22:43:19", "remaining_time": "2 days, 0:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3060, "total_steps": 9627, "loss": 1.6815, "learning_rate": 7.707507760482474e-05, "epoch": 0.31785602991586165, "percentage": 31.79, "elapsed_time": "22:43:44", "remaining_time": "2 days, 0:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3061, "total_steps": 9627, "loss": 1.6113, "learning_rate": 7.706135882595108e-05, "epoch": 0.317959904435442, "percentage": 31.8, "elapsed_time": "22:44:09", "remaining_time": "2 days, 0:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3062, "total_steps": 9627, "loss": 1.9964, "learning_rate": 7.70476371652538e-05, "epoch": 0.31806377895502236, "percentage": 31.81, "elapsed_time": "22:44:37", "remaining_time": "2 days, 0:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3063, "total_steps": 9627, "loss": 1.67, "learning_rate": 7.703391262419413e-05, "epoch": 0.3181676534746027, "percentage": 31.82, "elapsed_time": "22:45:02", "remaining_time": "2 days, 0:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3064, "total_steps": 9627, "loss": 1.7399, "learning_rate": 7.702018520423367e-05, "epoch": 0.318271527994183, "percentage": 31.83, "elapsed_time": "22:45:29", "remaining_time": "2 days, 0:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3065, "total_steps": 9627, "loss": 1.8155, "learning_rate": 7.700645490683421e-05, "epoch": 0.3183754025137634, "percentage": 31.84, "elapsed_time": "22:45:55", "remaining_time": "2 days, 0:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3066, "total_steps": 9627, "loss": 1.7583, "learning_rate": 7.699272173345799e-05, "epoch": 0.3184792770333437, "percentage": 31.85, "elapsed_time": "22:46:21", "remaining_time": "2 days, 0:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3067, "total_steps": 9627, "loss": 1.5891, "learning_rate": 7.697898568556745e-05, "epoch": 0.31858315155292405, "percentage": 31.86, "elapsed_time": "22:46:46", "remaining_time": "2 days, 0:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3068, "total_steps": 9627, "loss": 1.7358, "learning_rate": 7.696524676462538e-05, "epoch": 0.31868702607250443, "percentage": 31.87, "elapsed_time": "22:47:13", "remaining_time": "2 days, 0:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3069, "total_steps": 9627, "loss": 1.7218, "learning_rate": 7.695150497209485e-05, "epoch": 0.31879090059208476, "percentage": 31.88, "elapsed_time": "22:47:39", "remaining_time": "2 days, 0:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3070, "total_steps": 9627, "loss": 1.8209, "learning_rate": 7.69377603094393e-05, "epoch": 0.3188947751116651, "percentage": 31.89, "elapsed_time": "22:48:05", "remaining_time": "2 days, 0:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3071, "total_steps": 9627, "loss": 1.6095, "learning_rate": 7.692401277812236e-05, "epoch": 0.31899864963124547, "percentage": 31.9, "elapsed_time": "22:48:32", "remaining_time": "2 days, 0:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3072, "total_steps": 9627, "loss": 1.5576, "learning_rate": 7.69102623796081e-05, "epoch": 0.3191025241508258, "percentage": 31.91, "elapsed_time": "22:48:57", "remaining_time": "2 days, 0:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3073, "total_steps": 9627, "loss": 1.656, "learning_rate": 7.689650911536081e-05, "epoch": 0.3192063986704061, "percentage": 31.92, "elapsed_time": "22:49:24", "remaining_time": "2 days, 0:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3074, "total_steps": 9627, "loss": 1.7435, "learning_rate": 7.688275298684509e-05, "epoch": 0.3193102731899865, "percentage": 31.93, "elapsed_time": "22:49:50", "remaining_time": "2 days, 0:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3075, "total_steps": 9627, "loss": 1.6421, "learning_rate": 7.686899399552587e-05, "epoch": 0.31941414770956683, "percentage": 31.94, "elapsed_time": "22:50:16", "remaining_time": "2 days, 0:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3076, "total_steps": 9627, "loss": 1.7208, "learning_rate": 7.685523214286839e-05, "epoch": 0.3195180222291472, "percentage": 31.95, "elapsed_time": "22:50:42", "remaining_time": "2 days, 0:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3077, "total_steps": 9627, "loss": 1.7648, "learning_rate": 7.684146743033815e-05, "epoch": 0.31962189674872754, "percentage": 31.96, "elapsed_time": "22:51:08", "remaining_time": "2 days, 0:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3078, "total_steps": 9627, "loss": 1.751, "learning_rate": 7.6827699859401e-05, "epoch": 0.31972577126830787, "percentage": 31.97, "elapsed_time": "22:51:34", "remaining_time": "2 days, 0:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3079, "total_steps": 9627, "loss": 1.7878, "learning_rate": 7.681392943152308e-05, "epoch": 0.31982964578788825, "percentage": 31.98, "elapsed_time": "22:52:01", "remaining_time": "2 days, 0:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3080, "total_steps": 9627, "loss": 1.7752, "learning_rate": 7.680015614817083e-05, "epoch": 0.3199335203074686, "percentage": 31.99, "elapsed_time": "22:52:26", "remaining_time": "2 days, 0:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3081, "total_steps": 9627, "loss": 1.7377, "learning_rate": 7.678638001081102e-05, "epoch": 0.3200373948270489, "percentage": 32.0, "elapsed_time": "22:52:53", "remaining_time": "2 days, 0:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3082, "total_steps": 9627, "loss": 1.7732, "learning_rate": 7.677260102091066e-05, "epoch": 0.3201412693466293, "percentage": 32.01, "elapsed_time": "22:53:19", "remaining_time": "2 days, 0:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3083, "total_steps": 9627, "loss": 1.6768, "learning_rate": 7.675881917993713e-05, "epoch": 0.3202451438662096, "percentage": 32.02, "elapsed_time": "22:53:45", "remaining_time": "2 days, 0:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3084, "total_steps": 9627, "loss": 1.59, "learning_rate": 7.674503448935808e-05, "epoch": 0.32034901838578994, "percentage": 32.03, "elapsed_time": "22:54:11", "remaining_time": "2 days, 0:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3085, "total_steps": 9627, "loss": 1.3873, "learning_rate": 7.673124695064148e-05, "epoch": 0.3204528929053703, "percentage": 32.05, "elapsed_time": "22:54:38", "remaining_time": "2 days, 0:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3086, "total_steps": 9627, "loss": 1.5037, "learning_rate": 7.671745656525559e-05, "epoch": 0.32055676742495065, "percentage": 32.06, "elapsed_time": "22:55:04", "remaining_time": "2 days, 0:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3087, "total_steps": 9627, "loss": 1.6842, "learning_rate": 7.670366333466899e-05, "epoch": 0.32066064194453103, "percentage": 32.07, "elapsed_time": "22:55:30", "remaining_time": "2 days, 0:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3088, "total_steps": 9627, "loss": 1.858, "learning_rate": 7.668986726035054e-05, "epoch": 0.32076451646411136, "percentage": 32.08, "elapsed_time": "22:55:56", "remaining_time": "2 days, 0:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3089, "total_steps": 9627, "loss": 1.9369, "learning_rate": 7.66760683437694e-05, "epoch": 0.3208683909836917, "percentage": 32.09, "elapsed_time": "22:56:22", "remaining_time": "2 days, 0:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3090, "total_steps": 9627, "loss": 1.6107, "learning_rate": 7.666226658639507e-05, "epoch": 0.32097226550327207, "percentage": 32.1, "elapsed_time": "22:56:49", "remaining_time": "2 days, 0:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3091, "total_steps": 9627, "loss": 1.8063, "learning_rate": 7.664846198969733e-05, "epoch": 0.3210761400228524, "percentage": 32.11, "elapsed_time": "22:57:15", "remaining_time": "2 days, 0:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3092, "total_steps": 9627, "loss": 2.2025, "learning_rate": 7.663465455514625e-05, "epoch": 0.3211800145424327, "percentage": 32.12, "elapsed_time": "22:57:41", "remaining_time": "2 days, 0:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3093, "total_steps": 9627, "loss": 1.6021, "learning_rate": 7.662084428421221e-05, "epoch": 0.3212838890620131, "percentage": 32.13, "elapsed_time": "22:58:07", "remaining_time": "2 days, 0:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3094, "total_steps": 9627, "loss": 1.6781, "learning_rate": 7.660703117836591e-05, "epoch": 0.32138776358159343, "percentage": 32.14, "elapsed_time": "22:58:34", "remaining_time": "2 days, 0:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3095, "total_steps": 9627, "loss": 1.8033, "learning_rate": 7.659321523907834e-05, "epoch": 0.32149163810117376, "percentage": 32.15, "elapsed_time": "22:58:59", "remaining_time": "2 days, 0:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3096, "total_steps": 9627, "loss": 1.6971, "learning_rate": 7.657939646782077e-05, "epoch": 0.32159551262075414, "percentage": 32.16, "elapsed_time": "22:59:26", "remaining_time": "2 days, 0:29:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3097, "total_steps": 9627, "loss": 1.7625, "learning_rate": 7.656557486606482e-05, "epoch": 0.32169938714033447, "percentage": 32.17, "elapsed_time": "22:59:52", "remaining_time": "2 days, 0:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3098, "total_steps": 9627, "loss": 1.79, "learning_rate": 7.655175043528235e-05, "epoch": 0.3218032616599148, "percentage": 32.18, "elapsed_time": "23:00:18", "remaining_time": "2 days, 0:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3099, "total_steps": 9627, "loss": 1.7281, "learning_rate": 7.653792317694556e-05, "epoch": 0.3219071361794952, "percentage": 32.19, "elapsed_time": "23:00:44", "remaining_time": "2 days, 0:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 9627, "loss": 1.7644, "learning_rate": 7.652409309252699e-05, "epoch": 0.3220110106990755, "percentage": 32.2, "elapsed_time": "23:01:11", "remaining_time": "2 days, 0:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3101, "total_steps": 9627, "loss": 1.815, "learning_rate": 7.651026018349938e-05, "epoch": 0.3221148852186559, "percentage": 32.21, "elapsed_time": "23:01:37", "remaining_time": "2 days, 0:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3102, "total_steps": 9627, "loss": 1.8004, "learning_rate": 7.649642445133585e-05, "epoch": 0.3222187597382362, "percentage": 32.22, "elapsed_time": "23:02:03", "remaining_time": "2 days, 0:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3103, "total_steps": 9627, "loss": 1.8058, "learning_rate": 7.64825858975098e-05, "epoch": 0.32232263425781654, "percentage": 32.23, "elapsed_time": "23:02:29", "remaining_time": "2 days, 0:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3104, "total_steps": 9627, "loss": 1.7229, "learning_rate": 7.646874452349491e-05, "epoch": 0.3224265087773969, "percentage": 32.24, "elapsed_time": "23:02:56", "remaining_time": "2 days, 0:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3105, "total_steps": 9627, "loss": 1.6437, "learning_rate": 7.64549003307652e-05, "epoch": 0.32253038329697725, "percentage": 32.25, "elapsed_time": "23:03:21", "remaining_time": "2 days, 0:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3106, "total_steps": 9627, "loss": 1.8526, "learning_rate": 7.644105332079497e-05, "epoch": 0.3226342578165576, "percentage": 32.26, "elapsed_time": "23:03:47", "remaining_time": "2 days, 0:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3107, "total_steps": 9627, "loss": 1.8628, "learning_rate": 7.642720349505881e-05, "epoch": 0.32273813233613796, "percentage": 32.27, "elapsed_time": "23:04:13", "remaining_time": "2 days, 0:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3108, "total_steps": 9627, "loss": 1.7873, "learning_rate": 7.641335085503161e-05, "epoch": 0.3228420068557183, "percentage": 32.28, "elapsed_time": "23:04:39", "remaining_time": "2 days, 0:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3109, "total_steps": 9627, "loss": 1.7672, "learning_rate": 7.639949540218858e-05, "epoch": 0.3229458813752986, "percentage": 32.29, "elapsed_time": "23:05:06", "remaining_time": "2 days, 0:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3110, "total_steps": 9627, "loss": 1.7417, "learning_rate": 7.63856371380052e-05, "epoch": 0.323049755894879, "percentage": 32.3, "elapsed_time": "23:05:32", "remaining_time": "2 days, 0:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3111, "total_steps": 9627, "loss": 1.855, "learning_rate": 7.63717760639573e-05, "epoch": 0.3231536304144593, "percentage": 32.32, "elapsed_time": "23:05:59", "remaining_time": "2 days, 0:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3112, "total_steps": 9627, "loss": 1.766, "learning_rate": 7.635791218152094e-05, "epoch": 0.3232575049340397, "percentage": 32.33, "elapsed_time": "23:06:24", "remaining_time": "2 days, 0:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3113, "total_steps": 9627, "loss": 1.6696, "learning_rate": 7.634404549217254e-05, "epoch": 0.32336137945362003, "percentage": 32.34, "elapsed_time": "23:06:51", "remaining_time": "2 days, 0:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3114, "total_steps": 9627, "loss": 1.7205, "learning_rate": 7.633017599738879e-05, "epoch": 0.32346525397320036, "percentage": 32.35, "elapsed_time": "23:07:16", "remaining_time": "2 days, 0:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3115, "total_steps": 9627, "loss": 1.6764, "learning_rate": 7.631630369864668e-05, "epoch": 0.32356912849278074, "percentage": 32.36, "elapsed_time": "23:07:42", "remaining_time": "2 days, 0:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3116, "total_steps": 9627, "loss": 1.633, "learning_rate": 7.63024285974235e-05, "epoch": 0.32367300301236107, "percentage": 32.37, "elapsed_time": "23:08:09", "remaining_time": "2 days, 0:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3117, "total_steps": 9627, "loss": 1.9059, "learning_rate": 7.628855069519685e-05, "epoch": 0.3237768775319414, "percentage": 32.38, "elapsed_time": "23:08:35", "remaining_time": "2 days, 0:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3118, "total_steps": 9627, "loss": 1.6475, "learning_rate": 7.627466999344459e-05, "epoch": 0.3238807520515218, "percentage": 32.39, "elapsed_time": "23:09:02", "remaining_time": "2 days, 0:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3119, "total_steps": 9627, "loss": 1.8901, "learning_rate": 7.626078649364494e-05, "epoch": 0.3239846265711021, "percentage": 32.4, "elapsed_time": "23:09:28", "remaining_time": "2 days, 0:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3120, "total_steps": 9627, "loss": 1.62, "learning_rate": 7.624690019727636e-05, "epoch": 0.32408850109068243, "percentage": 32.41, "elapsed_time": "23:09:53", "remaining_time": "2 days, 0:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3121, "total_steps": 9627, "loss": 1.7613, "learning_rate": 7.623301110581764e-05, "epoch": 0.3241923756102628, "percentage": 32.42, "elapsed_time": "23:10:20", "remaining_time": "2 days, 0:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3122, "total_steps": 9627, "loss": 1.6685, "learning_rate": 7.621911922074787e-05, "epoch": 0.32429625012984314, "percentage": 32.43, "elapsed_time": "23:10:46", "remaining_time": "2 days, 0:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3123, "total_steps": 9627, "loss": 1.8067, "learning_rate": 7.620522454354644e-05, "epoch": 0.32440012464942347, "percentage": 32.44, "elapsed_time": "23:11:13", "remaining_time": "2 days, 0:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3124, "total_steps": 9627, "loss": 1.8046, "learning_rate": 7.619132707569299e-05, "epoch": 0.32450399916900385, "percentage": 32.45, "elapsed_time": "23:11:38", "remaining_time": "2 days, 0:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3125, "total_steps": 9627, "loss": 1.9807, "learning_rate": 7.617742681866749e-05, "epoch": 0.3246078736885842, "percentage": 32.46, "elapsed_time": "23:12:05", "remaining_time": "2 days, 0:16:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3126, "total_steps": 9627, "loss": 1.7041, "learning_rate": 7.616352377395025e-05, "epoch": 0.32471174820816456, "percentage": 32.47, "elapsed_time": "23:12:31", "remaining_time": "2 days, 0:15:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3127, "total_steps": 9627, "loss": 1.7103, "learning_rate": 7.614961794302178e-05, "epoch": 0.3248156227277449, "percentage": 32.48, "elapsed_time": "23:12:57", "remaining_time": "2 days, 0:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3128, "total_steps": 9627, "loss": 1.6377, "learning_rate": 7.6135709327363e-05, "epoch": 0.3249194972473252, "percentage": 32.49, "elapsed_time": "23:13:23", "remaining_time": "2 days, 0:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3129, "total_steps": 9627, "loss": 1.7518, "learning_rate": 7.612179792845504e-05, "epoch": 0.3250233717669056, "percentage": 32.5, "elapsed_time": "23:13:49", "remaining_time": "2 days, 0:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3130, "total_steps": 9627, "loss": 1.6768, "learning_rate": 7.610788374777935e-05, "epoch": 0.3251272462864859, "percentage": 32.51, "elapsed_time": "23:14:16", "remaining_time": "2 days, 0:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3131, "total_steps": 9627, "loss": 1.8424, "learning_rate": 7.609396678681771e-05, "epoch": 0.32523112080606625, "percentage": 32.52, "elapsed_time": "23:14:41", "remaining_time": "2 days, 0:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3132, "total_steps": 9627, "loss": 1.8505, "learning_rate": 7.608004704705212e-05, "epoch": 0.32533499532564664, "percentage": 32.53, "elapsed_time": "23:15:08", "remaining_time": "2 days, 0:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3133, "total_steps": 9627, "loss": 1.6893, "learning_rate": 7.606612452996495e-05, "epoch": 0.32543886984522696, "percentage": 32.54, "elapsed_time": "23:15:34", "remaining_time": "2 days, 0:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3134, "total_steps": 9627, "loss": 1.7895, "learning_rate": 7.605219923703886e-05, "epoch": 0.3255427443648073, "percentage": 32.55, "elapsed_time": "23:16:00", "remaining_time": "2 days, 0:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3135, "total_steps": 9627, "loss": 1.5966, "learning_rate": 7.603827116975677e-05, "epoch": 0.3256466188843877, "percentage": 32.56, "elapsed_time": "23:16:26", "remaining_time": "2 days, 0:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3136, "total_steps": 9627, "loss": 1.7413, "learning_rate": 7.602434032960189e-05, "epoch": 0.325750493403968, "percentage": 32.58, "elapsed_time": "23:16:53", "remaining_time": "2 days, 0:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3137, "total_steps": 9627, "loss": 1.3362, "learning_rate": 7.601040671805779e-05, "epoch": 0.3258543679235483, "percentage": 32.59, "elapsed_time": "23:17:19", "remaining_time": "2 days, 0:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3138, "total_steps": 9627, "loss": 1.6745, "learning_rate": 7.599647033660824e-05, "epoch": 0.3259582424431287, "percentage": 32.6, "elapsed_time": "23:17:45", "remaining_time": "2 days, 0:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3139, "total_steps": 9627, "loss": 1.6381, "learning_rate": 7.598253118673738e-05, "epoch": 0.32606211696270904, "percentage": 32.61, "elapsed_time": "23:18:12", "remaining_time": "2 days, 0:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3140, "total_steps": 9627, "loss": 1.8387, "learning_rate": 7.596858926992962e-05, "epoch": 0.3261659914822894, "percentage": 32.62, "elapsed_time": "23:18:37", "remaining_time": "2 days, 0:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3141, "total_steps": 9627, "loss": 1.6446, "learning_rate": 7.595464458766968e-05, "epoch": 0.32626986600186975, "percentage": 32.63, "elapsed_time": "23:19:04", "remaining_time": "2 days, 0:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3142, "total_steps": 9627, "loss": 1.4691, "learning_rate": 7.594069714144252e-05, "epoch": 0.3263737405214501, "percentage": 32.64, "elapsed_time": "23:19:30", "remaining_time": "2 days, 0:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3143, "total_steps": 9627, "loss": 1.8108, "learning_rate": 7.592674693273348e-05, "epoch": 0.32647761504103046, "percentage": 32.65, "elapsed_time": "23:19:56", "remaining_time": "2 days, 0:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3144, "total_steps": 9627, "loss": 1.7062, "learning_rate": 7.591279396302812e-05, "epoch": 0.3265814895606108, "percentage": 32.66, "elapsed_time": "23:20:23", "remaining_time": "2 days, 0:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3145, "total_steps": 9627, "loss": 1.6658, "learning_rate": 7.589883823381234e-05, "epoch": 0.3266853640801911, "percentage": 32.67, "elapsed_time": "23:20:48", "remaining_time": "2 days, 0:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3146, "total_steps": 9627, "loss": 1.7899, "learning_rate": 7.58848797465723e-05, "epoch": 0.3267892385997715, "percentage": 32.68, "elapsed_time": "23:21:14", "remaining_time": "2 days, 0:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3147, "total_steps": 9627, "loss": 1.7506, "learning_rate": 7.587091850279447e-05, "epoch": 0.3268931131193518, "percentage": 32.69, "elapsed_time": "23:21:41", "remaining_time": "2 days, 0:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3148, "total_steps": 9627, "loss": 1.7103, "learning_rate": 7.585695450396564e-05, "epoch": 0.32699698763893215, "percentage": 32.7, "elapsed_time": "23:22:07", "remaining_time": "2 days, 0:05:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3149, "total_steps": 9627, "loss": 1.5979, "learning_rate": 7.584298775157282e-05, "epoch": 0.32710086215851253, "percentage": 32.71, "elapsed_time": "23:22:32", "remaining_time": "2 days, 0:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 9627, "loss": 1.8509, "learning_rate": 7.58290182471034e-05, "epoch": 0.32720473667809286, "percentage": 32.72, "elapsed_time": "23:22:59", "remaining_time": "2 days, 0:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3151, "total_steps": 9627, "loss": 1.686, "learning_rate": 7.581504599204503e-05, "epoch": 0.32730861119767324, "percentage": 32.73, "elapsed_time": "23:23:25", "remaining_time": "2 days, 0:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3152, "total_steps": 9627, "loss": 1.8448, "learning_rate": 7.58010709878856e-05, "epoch": 0.32741248571725357, "percentage": 32.74, "elapsed_time": "23:23:52", "remaining_time": "2 days, 0:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3153, "total_steps": 9627, "loss": 1.7782, "learning_rate": 7.578709323611338e-05, "epoch": 0.3275163602368339, "percentage": 32.75, "elapsed_time": "23:24:18", "remaining_time": "2 days, 0:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3154, "total_steps": 9627, "loss": 1.7276, "learning_rate": 7.577311273821687e-05, "epoch": 0.3276202347564143, "percentage": 32.76, "elapsed_time": "23:24:43", "remaining_time": "2 days, 0:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3155, "total_steps": 9627, "loss": 1.7094, "learning_rate": 7.575912949568489e-05, "epoch": 0.3277241092759946, "percentage": 32.77, "elapsed_time": "23:25:10", "remaining_time": "2 days, 0:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3156, "total_steps": 9627, "loss": 1.6252, "learning_rate": 7.574514351000657e-05, "epoch": 0.32782798379557493, "percentage": 32.78, "elapsed_time": "23:25:36", "remaining_time": "2 days, 0:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3157, "total_steps": 9627, "loss": 1.7715, "learning_rate": 7.573115478267126e-05, "epoch": 0.3279318583151553, "percentage": 32.79, "elapsed_time": "23:26:02", "remaining_time": "2 days, 0:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3158, "total_steps": 9627, "loss": 1.71, "learning_rate": 7.571716331516869e-05, "epoch": 0.32803573283473564, "percentage": 32.8, "elapsed_time": "23:26:28", "remaining_time": "2 days, 0:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3159, "total_steps": 9627, "loss": 1.6717, "learning_rate": 7.570316910898882e-05, "epoch": 0.32813960735431597, "percentage": 32.81, "elapsed_time": "23:26:53", "remaining_time": "2 days, 0:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3160, "total_steps": 9627, "loss": 1.6144, "learning_rate": 7.568917216562193e-05, "epoch": 0.32824348187389635, "percentage": 32.82, "elapsed_time": "23:27:20", "remaining_time": "2 days, 0:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3161, "total_steps": 9627, "loss": 1.7229, "learning_rate": 7.56751724865586e-05, "epoch": 0.3283473563934767, "percentage": 32.83, "elapsed_time": "23:27:46", "remaining_time": "1 day, 23:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3162, "total_steps": 9627, "loss": 1.6128, "learning_rate": 7.566117007328967e-05, "epoch": 0.328451230913057, "percentage": 32.85, "elapsed_time": "23:28:12", "remaining_time": "1 day, 23:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3163, "total_steps": 9627, "loss": 1.8158, "learning_rate": 7.564716492730628e-05, "epoch": 0.3285551054326374, "percentage": 32.86, "elapsed_time": "23:28:38", "remaining_time": "1 day, 23:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3164, "total_steps": 9627, "loss": 1.5258, "learning_rate": 7.56331570500999e-05, "epoch": 0.3286589799522177, "percentage": 32.87, "elapsed_time": "23:29:04", "remaining_time": "1 day, 23:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3165, "total_steps": 9627, "loss": 1.8395, "learning_rate": 7.561914644316221e-05, "epoch": 0.3287628544717981, "percentage": 32.88, "elapsed_time": "23:29:30", "remaining_time": "1 day, 23:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3166, "total_steps": 9627, "loss": 1.7382, "learning_rate": 7.560513310798529e-05, "epoch": 0.3288667289913784, "percentage": 32.89, "elapsed_time": "23:29:56", "remaining_time": "1 day, 23:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3167, "total_steps": 9627, "loss": 1.7647, "learning_rate": 7.559111704606142e-05, "epoch": 0.32897060351095875, "percentage": 32.9, "elapsed_time": "23:30:22", "remaining_time": "1 day, 23:56:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3168, "total_steps": 9627, "loss": 1.6671, "learning_rate": 7.557709825888319e-05, "epoch": 0.32907447803053913, "percentage": 32.91, "elapsed_time": "23:30:49", "remaining_time": "1 day, 23:56:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3169, "total_steps": 9627, "loss": 1.8564, "learning_rate": 7.556307674794351e-05, "epoch": 0.32917835255011946, "percentage": 32.92, "elapsed_time": "23:31:14", "remaining_time": "1 day, 23:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3170, "total_steps": 9627, "loss": 1.8405, "learning_rate": 7.554905251473557e-05, "epoch": 0.3292822270696998, "percentage": 32.93, "elapsed_time": "23:31:41", "remaining_time": "1 day, 23:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3171, "total_steps": 9627, "loss": 1.6871, "learning_rate": 7.55350255607528e-05, "epoch": 0.32938610158928017, "percentage": 32.94, "elapsed_time": "23:32:07", "remaining_time": "1 day, 23:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3172, "total_steps": 9627, "loss": 1.6192, "learning_rate": 7.5520995887489e-05, "epoch": 0.3294899761088605, "percentage": 32.95, "elapsed_time": "23:32:32", "remaining_time": "1 day, 23:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3173, "total_steps": 9627, "loss": 1.9924, "learning_rate": 7.550696349643822e-05, "epoch": 0.3295938506284408, "percentage": 32.96, "elapsed_time": "23:33:00", "remaining_time": "1 day, 23:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3174, "total_steps": 9627, "loss": 1.7255, "learning_rate": 7.549292838909478e-05, "epoch": 0.3296977251480212, "percentage": 32.97, "elapsed_time": "23:33:25", "remaining_time": "1 day, 23:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3175, "total_steps": 9627, "loss": 1.7508, "learning_rate": 7.547889056695332e-05, "epoch": 0.32980159966760153, "percentage": 32.98, "elapsed_time": "23:33:52", "remaining_time": "1 day, 23:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3176, "total_steps": 9627, "loss": 1.7239, "learning_rate": 7.546485003150876e-05, "epoch": 0.32990547418718186, "percentage": 32.99, "elapsed_time": "23:34:17", "remaining_time": "1 day, 23:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3177, "total_steps": 9627, "loss": 1.6987, "learning_rate": 7.54508067842563e-05, "epoch": 0.33000934870676224, "percentage": 33.0, "elapsed_time": "23:34:44", "remaining_time": "1 day, 23:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3178, "total_steps": 9627, "loss": 1.675, "learning_rate": 7.543676082669146e-05, "epoch": 0.33011322322634257, "percentage": 33.01, "elapsed_time": "23:35:10", "remaining_time": "1 day, 23:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3179, "total_steps": 9627, "loss": 1.6841, "learning_rate": 7.542271216030998e-05, "epoch": 0.33021709774592295, "percentage": 33.02, "elapsed_time": "23:35:36", "remaining_time": "1 day, 23:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3180, "total_steps": 9627, "loss": 1.7604, "learning_rate": 7.540866078660797e-05, "epoch": 0.3303209722655033, "percentage": 33.03, "elapsed_time": "23:36:02", "remaining_time": "1 day, 23:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3181, "total_steps": 9627, "loss": 1.7021, "learning_rate": 7.539460670708178e-05, "epoch": 0.3304248467850836, "percentage": 33.04, "elapsed_time": "23:36:28", "remaining_time": "1 day, 23:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3182, "total_steps": 9627, "loss": 1.885, "learning_rate": 7.538054992322806e-05, "epoch": 0.330528721304664, "percentage": 33.05, "elapsed_time": "23:36:53", "remaining_time": "1 day, 23:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3183, "total_steps": 9627, "loss": 1.3871, "learning_rate": 7.536649043654376e-05, "epoch": 0.3306325958242443, "percentage": 33.06, "elapsed_time": "23:37:21", "remaining_time": "1 day, 23:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3184, "total_steps": 9627, "loss": 1.7323, "learning_rate": 7.535242824852608e-05, "epoch": 0.33073647034382464, "percentage": 33.07, "elapsed_time": "23:37:47", "remaining_time": "1 day, 23:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3185, "total_steps": 9627, "loss": 1.7173, "learning_rate": 7.533836336067257e-05, "epoch": 0.330840344863405, "percentage": 33.08, "elapsed_time": "23:38:13", "remaining_time": "1 day, 23:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3186, "total_steps": 9627, "loss": 1.6793, "learning_rate": 7.5324295774481e-05, "epoch": 0.33094421938298535, "percentage": 33.09, "elapsed_time": "23:38:39", "remaining_time": "1 day, 23:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3187, "total_steps": 9627, "loss": 1.7443, "learning_rate": 7.531022549144946e-05, "epoch": 0.3310480939025657, "percentage": 33.1, "elapsed_time": "23:39:05", "remaining_time": "1 day, 23:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3188, "total_steps": 9627, "loss": 1.675, "learning_rate": 7.529615251307631e-05, "epoch": 0.33115196842214606, "percentage": 33.12, "elapsed_time": "23:39:31", "remaining_time": "1 day, 23:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3189, "total_steps": 9627, "loss": 1.7026, "learning_rate": 7.528207684086027e-05, "epoch": 0.3312558429417264, "percentage": 33.13, "elapsed_time": "23:39:57", "remaining_time": "1 day, 23:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3190, "total_steps": 9627, "loss": 1.6583, "learning_rate": 7.526799847630024e-05, "epoch": 0.33135971746130677, "percentage": 33.14, "elapsed_time": "23:40:23", "remaining_time": "1 day, 23:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3191, "total_steps": 9627, "loss": 1.6339, "learning_rate": 7.525391742089547e-05, "epoch": 0.3314635919808871, "percentage": 33.15, "elapsed_time": "23:40:49", "remaining_time": "1 day, 23:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3192, "total_steps": 9627, "loss": 1.7295, "learning_rate": 7.52398336761455e-05, "epoch": 0.3315674665004674, "percentage": 33.16, "elapsed_time": "23:41:15", "remaining_time": "1 day, 23:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3193, "total_steps": 9627, "loss": 1.8415, "learning_rate": 7.522574724355009e-05, "epoch": 0.3316713410200478, "percentage": 33.17, "elapsed_time": "23:41:42", "remaining_time": "1 day, 23:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3194, "total_steps": 9627, "loss": 1.8444, "learning_rate": 7.52116581246094e-05, "epoch": 0.33177521553962813, "percentage": 33.18, "elapsed_time": "23:42:08", "remaining_time": "1 day, 23:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3195, "total_steps": 9627, "loss": 1.9211, "learning_rate": 7.519756632082376e-05, "epoch": 0.33187909005920846, "percentage": 33.19, "elapsed_time": "23:42:33", "remaining_time": "1 day, 23:43:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3196, "total_steps": 9627, "loss": 1.5216, "learning_rate": 7.518347183369385e-05, "epoch": 0.33198296457878884, "percentage": 33.2, "elapsed_time": "23:43:00", "remaining_time": "1 day, 23:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3197, "total_steps": 9627, "loss": 1.6549, "learning_rate": 7.516937466472065e-05, "epoch": 0.33208683909836917, "percentage": 33.21, "elapsed_time": "23:43:27", "remaining_time": "1 day, 23:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3198, "total_steps": 9627, "loss": 1.6972, "learning_rate": 7.515527481540536e-05, "epoch": 0.3321907136179495, "percentage": 33.22, "elapsed_time": "23:43:52", "remaining_time": "1 day, 23:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3199, "total_steps": 9627, "loss": 1.6622, "learning_rate": 7.514117228724953e-05, "epoch": 0.3322945881375299, "percentage": 33.23, "elapsed_time": "23:44:18", "remaining_time": "1 day, 23:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 9627, "loss": 1.5866, "learning_rate": 7.512706708175496e-05, "epoch": 0.3323984626571102, "percentage": 33.24, "elapsed_time": "23:44:45", "remaining_time": "1 day, 23:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3201, "total_steps": 9627, "loss": 1.7721, "learning_rate": 7.511295920042374e-05, "epoch": 0.33250233717669053, "percentage": 33.25, "elapsed_time": "23:45:11", "remaining_time": "1 day, 23:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3202, "total_steps": 9627, "loss": 1.7278, "learning_rate": 7.509884864475825e-05, "epoch": 0.3326062116962709, "percentage": 33.26, "elapsed_time": "23:45:38", "remaining_time": "1 day, 23:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3203, "total_steps": 9627, "loss": 1.7481, "learning_rate": 7.508473541626115e-05, "epoch": 0.33271008621585124, "percentage": 33.27, "elapsed_time": "23:46:04", "remaining_time": "1 day, 23:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3204, "total_steps": 9627, "loss": 1.7085, "learning_rate": 7.507061951643541e-05, "epoch": 0.3328139607354316, "percentage": 33.28, "elapsed_time": "23:46:29", "remaining_time": "1 day, 23:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3205, "total_steps": 9627, "loss": 1.8142, "learning_rate": 7.505650094678425e-05, "epoch": 0.33291783525501195, "percentage": 33.29, "elapsed_time": "23:46:57", "remaining_time": "1 day, 23:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3206, "total_steps": 9627, "loss": 1.7213, "learning_rate": 7.504237970881118e-05, "epoch": 0.3330217097745923, "percentage": 33.3, "elapsed_time": "23:47:22", "remaining_time": "1 day, 23:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3207, "total_steps": 9627, "loss": 1.637, "learning_rate": 7.502825580402002e-05, "epoch": 0.33312558429417266, "percentage": 33.31, "elapsed_time": "23:47:48", "remaining_time": "1 day, 23:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3208, "total_steps": 9627, "loss": 1.7966, "learning_rate": 7.501412923391483e-05, "epoch": 0.333229458813753, "percentage": 33.32, "elapsed_time": "23:48:15", "remaining_time": "1 day, 23:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3209, "total_steps": 9627, "loss": 1.7097, "learning_rate": 7.500000000000001e-05, "epoch": 0.3333333333333333, "percentage": 33.33, "elapsed_time": "23:48:40", "remaining_time": "1 day, 23:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3210, "total_steps": 9627, "loss": 1.6064, "learning_rate": 7.498586810378019e-05, "epoch": 0.3334372078529137, "percentage": 33.34, "elapsed_time": "23:49:07", "remaining_time": "1 day, 23:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3211, "total_steps": 9627, "loss": 1.8244, "learning_rate": 7.49717335467603e-05, "epoch": 0.333541082372494, "percentage": 33.35, "elapsed_time": "23:49:33", "remaining_time": "1 day, 23:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3212, "total_steps": 9627, "loss": 1.8339, "learning_rate": 7.49575963304456e-05, "epoch": 0.33364495689207435, "percentage": 33.36, "elapsed_time": "23:49:59", "remaining_time": "1 day, 23:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3213, "total_steps": 9627, "loss": 1.6953, "learning_rate": 7.494345645634156e-05, "epoch": 0.33374883141165473, "percentage": 33.37, "elapsed_time": "23:50:25", "remaining_time": "1 day, 23:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3214, "total_steps": 9627, "loss": 1.7246, "learning_rate": 7.492931392595397e-05, "epoch": 0.33385270593123506, "percentage": 33.39, "elapsed_time": "23:50:51", "remaining_time": "1 day, 23:35:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3215, "total_steps": 9627, "loss": 1.6528, "learning_rate": 7.49151687407889e-05, "epoch": 0.3339565804508154, "percentage": 33.4, "elapsed_time": "23:51:18", "remaining_time": "1 day, 23:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3216, "total_steps": 9627, "loss": 1.5913, "learning_rate": 7.49010209023527e-05, "epoch": 0.33406045497039577, "percentage": 33.41, "elapsed_time": "23:51:44", "remaining_time": "1 day, 23:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3217, "total_steps": 9627, "loss": 1.609, "learning_rate": 7.488687041215202e-05, "epoch": 0.3341643294899761, "percentage": 33.42, "elapsed_time": "23:52:10", "remaining_time": "1 day, 23:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3218, "total_steps": 9627, "loss": 1.6473, "learning_rate": 7.487271727169377e-05, "epoch": 0.3342682040095565, "percentage": 33.43, "elapsed_time": "23:52:35", "remaining_time": "1 day, 23:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3219, "total_steps": 9627, "loss": 1.7744, "learning_rate": 7.485856148248513e-05, "epoch": 0.3343720785291368, "percentage": 33.44, "elapsed_time": "23:53:02", "remaining_time": "1 day, 23:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3220, "total_steps": 9627, "loss": 1.8776, "learning_rate": 7.484440304603362e-05, "epoch": 0.33447595304871713, "percentage": 33.45, "elapsed_time": "23:53:28", "remaining_time": "1 day, 23:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3221, "total_steps": 9627, "loss": 1.8293, "learning_rate": 7.483024196384696e-05, "epoch": 0.3345798275682975, "percentage": 33.46, "elapsed_time": "23:53:55", "remaining_time": "1 day, 23:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3222, "total_steps": 9627, "loss": 1.8113, "learning_rate": 7.481607823743321e-05, "epoch": 0.33468370208787784, "percentage": 33.47, "elapsed_time": "23:54:20", "remaining_time": "1 day, 23:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3223, "total_steps": 9627, "loss": 1.6579, "learning_rate": 7.480191186830072e-05, "epoch": 0.33478757660745817, "percentage": 33.48, "elapsed_time": "23:54:47", "remaining_time": "1 day, 23:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3224, "total_steps": 9627, "loss": 1.9302, "learning_rate": 7.478774285795805e-05, "epoch": 0.33489145112703855, "percentage": 33.49, "elapsed_time": "23:55:12", "remaining_time": "1 day, 23:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3225, "total_steps": 9627, "loss": 1.8298, "learning_rate": 7.477357120791415e-05, "epoch": 0.3349953256466189, "percentage": 33.5, "elapsed_time": "23:55:39", "remaining_time": "1 day, 23:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3226, "total_steps": 9627, "loss": 1.673, "learning_rate": 7.475939691967814e-05, "epoch": 0.3350992001661992, "percentage": 33.51, "elapsed_time": "23:56:05", "remaining_time": "1 day, 23:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3227, "total_steps": 9627, "loss": 1.7051, "learning_rate": 7.47452199947595e-05, "epoch": 0.3352030746857796, "percentage": 33.52, "elapsed_time": "23:56:32", "remaining_time": "1 day, 23:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3228, "total_steps": 9627, "loss": 1.6151, "learning_rate": 7.473104043466794e-05, "epoch": 0.3353069492053599, "percentage": 33.53, "elapsed_time": "23:56:57", "remaining_time": "1 day, 23:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3229, "total_steps": 9627, "loss": 1.7629, "learning_rate": 7.471685824091348e-05, "epoch": 0.3354108237249403, "percentage": 33.54, "elapsed_time": "23:57:23", "remaining_time": "1 day, 23:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3230, "total_steps": 9627, "loss": 1.7987, "learning_rate": 7.470267341500642e-05, "epoch": 0.3355146982445206, "percentage": 33.55, "elapsed_time": "23:57:49", "remaining_time": "1 day, 23:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3231, "total_steps": 9627, "loss": 1.5922, "learning_rate": 7.468848595845733e-05, "epoch": 0.33561857276410095, "percentage": 33.56, "elapsed_time": "23:58:15", "remaining_time": "1 day, 23:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3232, "total_steps": 9627, "loss": 1.6534, "learning_rate": 7.467429587277705e-05, "epoch": 0.33572244728368134, "percentage": 33.57, "elapsed_time": "23:58:41", "remaining_time": "1 day, 23:26:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3233, "total_steps": 9627, "loss": 1.7319, "learning_rate": 7.466010315947676e-05, "epoch": 0.33582632180326166, "percentage": 33.58, "elapsed_time": "23:59:07", "remaining_time": "1 day, 23:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3234, "total_steps": 9627, "loss": 1.8126, "learning_rate": 7.464590782006782e-05, "epoch": 0.335930196322842, "percentage": 33.59, "elapsed_time": "23:59:33", "remaining_time": "1 day, 23:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3235, "total_steps": 9627, "loss": 1.7701, "learning_rate": 7.463170985606194e-05, "epoch": 0.33603407084242237, "percentage": 33.6, "elapsed_time": "1 day, 0:00:00", "remaining_time": "1 day, 23:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3236, "total_steps": 9627, "loss": 1.8166, "learning_rate": 7.46175092689711e-05, "epoch": 0.3361379453620027, "percentage": 33.61, "elapsed_time": "1 day, 0:00:25", "remaining_time": "1 day, 23:24:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3237, "total_steps": 9627, "loss": 1.9408, "learning_rate": 7.460330606030754e-05, "epoch": 0.336241819881583, "percentage": 33.62, "elapsed_time": "1 day, 0:00:52", "remaining_time": "1 day, 23:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3238, "total_steps": 9627, "loss": 1.6185, "learning_rate": 7.45891002315838e-05, "epoch": 0.3363456944011634, "percentage": 33.63, "elapsed_time": "1 day, 0:01:18", "remaining_time": "1 day, 23:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3239, "total_steps": 9627, "loss": 1.5973, "learning_rate": 7.457489178431269e-05, "epoch": 0.33644956892074374, "percentage": 33.64, "elapsed_time": "1 day, 0:01:44", "remaining_time": "1 day, 23:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3240, "total_steps": 9627, "loss": 1.5255, "learning_rate": 7.45606807200073e-05, "epoch": 0.33655344344032406, "percentage": 33.66, "elapsed_time": "1 day, 0:02:11", "remaining_time": "1 day, 23:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3241, "total_steps": 9627, "loss": 1.6482, "learning_rate": 7.4546467040181e-05, "epoch": 0.33665731795990445, "percentage": 33.67, "elapsed_time": "1 day, 0:02:37", "remaining_time": "1 day, 23:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3242, "total_steps": 9627, "loss": 1.5935, "learning_rate": 7.453225074634742e-05, "epoch": 0.33676119247948477, "percentage": 33.68, "elapsed_time": "1 day, 0:03:03", "remaining_time": "1 day, 23:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3243, "total_steps": 9627, "loss": 1.8217, "learning_rate": 7.451803184002048e-05, "epoch": 0.33686506699906515, "percentage": 33.69, "elapsed_time": "1 day, 0:03:29", "remaining_time": "1 day, 23:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3244, "total_steps": 9627, "loss": 1.698, "learning_rate": 7.450381032271442e-05, "epoch": 0.3369689415186455, "percentage": 33.7, "elapsed_time": "1 day, 0:03:55", "remaining_time": "1 day, 23:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3245, "total_steps": 9627, "loss": 1.7154, "learning_rate": 7.44895861959437e-05, "epoch": 0.3370728160382258, "percentage": 33.71, "elapsed_time": "1 day, 0:04:21", "remaining_time": "1 day, 23:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3246, "total_steps": 9627, "loss": 1.6902, "learning_rate": 7.447535946122304e-05, "epoch": 0.3371766905578062, "percentage": 33.72, "elapsed_time": "1 day, 0:04:48", "remaining_time": "1 day, 23:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3247, "total_steps": 9627, "loss": 1.6136, "learning_rate": 7.446113012006756e-05, "epoch": 0.3372805650773865, "percentage": 33.73, "elapsed_time": "1 day, 0:05:13", "remaining_time": "1 day, 23:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3248, "total_steps": 9627, "loss": 1.7797, "learning_rate": 7.444689817399251e-05, "epoch": 0.33738443959696685, "percentage": 33.74, "elapsed_time": "1 day, 0:05:41", "remaining_time": "1 day, 23:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3249, "total_steps": 9627, "loss": 1.7013, "learning_rate": 7.443266362451349e-05, "epoch": 0.33748831411654723, "percentage": 33.75, "elapsed_time": "1 day, 0:06:06", "remaining_time": "1 day, 23:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 9627, "loss": 1.7065, "learning_rate": 7.441842647314638e-05, "epoch": 0.33759218863612755, "percentage": 33.76, "elapsed_time": "1 day, 0:06:33", "remaining_time": "1 day, 23:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3251, "total_steps": 9627, "loss": 1.7509, "learning_rate": 7.440418672140733e-05, "epoch": 0.3376960631557079, "percentage": 33.77, "elapsed_time": "1 day, 0:06:59", "remaining_time": "1 day, 23:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3252, "total_steps": 9627, "loss": 1.7629, "learning_rate": 7.438994437081272e-05, "epoch": 0.33779993767528826, "percentage": 33.78, "elapsed_time": "1 day, 0:07:26", "remaining_time": "1 day, 23:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3253, "total_steps": 9627, "loss": 1.8509, "learning_rate": 7.437569942287932e-05, "epoch": 0.3379038121948686, "percentage": 33.79, "elapsed_time": "1 day, 0:07:52", "remaining_time": "1 day, 23:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3254, "total_steps": 9627, "loss": 1.6512, "learning_rate": 7.436145187912406e-05, "epoch": 0.3380076867144489, "percentage": 33.8, "elapsed_time": "1 day, 0:08:18", "remaining_time": "1 day, 23:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3255, "total_steps": 9627, "loss": 1.5277, "learning_rate": 7.43472017410642e-05, "epoch": 0.3381115612340293, "percentage": 33.81, "elapsed_time": "1 day, 0:08:45", "remaining_time": "1 day, 23:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3256, "total_steps": 9627, "loss": 1.5944, "learning_rate": 7.433294901021727e-05, "epoch": 0.33821543575360963, "percentage": 33.82, "elapsed_time": "1 day, 0:09:11", "remaining_time": "1 day, 23:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3257, "total_steps": 9627, "loss": 1.6653, "learning_rate": 7.431869368810106e-05, "epoch": 0.33831931027319, "percentage": 33.83, "elapsed_time": "1 day, 0:09:36", "remaining_time": "1 day, 23:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3258, "total_steps": 9627, "loss": 1.7842, "learning_rate": 7.430443577623369e-05, "epoch": 0.33842318479277034, "percentage": 33.84, "elapsed_time": "1 day, 0:10:04", "remaining_time": "1 day, 23:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3259, "total_steps": 9627, "loss": 1.721, "learning_rate": 7.429017527613347e-05, "epoch": 0.33852705931235066, "percentage": 33.85, "elapsed_time": "1 day, 0:10:29", "remaining_time": "1 day, 23:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3260, "total_steps": 9627, "loss": 1.9518, "learning_rate": 7.427591218931906e-05, "epoch": 0.33863093383193105, "percentage": 33.86, "elapsed_time": "1 day, 0:10:56", "remaining_time": "1 day, 23:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3261, "total_steps": 9627, "loss": 1.5893, "learning_rate": 7.426164651730937e-05, "epoch": 0.3387348083515114, "percentage": 33.87, "elapsed_time": "1 day, 0:11:22", "remaining_time": "1 day, 23:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3262, "total_steps": 9627, "loss": 1.6549, "learning_rate": 7.424737826162358e-05, "epoch": 0.3388386828710917, "percentage": 33.88, "elapsed_time": "1 day, 0:11:48", "remaining_time": "1 day, 23:12:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3263, "total_steps": 9627, "loss": 1.6472, "learning_rate": 7.423310742378113e-05, "epoch": 0.3389425573906721, "percentage": 33.89, "elapsed_time": "1 day, 0:12:14", "remaining_time": "1 day, 23:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3264, "total_steps": 9627, "loss": 1.7416, "learning_rate": 7.421883400530176e-05, "epoch": 0.3390464319102524, "percentage": 33.9, "elapsed_time": "1 day, 0:12:41", "remaining_time": "1 day, 23:11:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3265, "total_steps": 9627, "loss": 1.6492, "learning_rate": 7.42045580077055e-05, "epoch": 0.33915030642983274, "percentage": 33.92, "elapsed_time": "1 day, 0:13:07", "remaining_time": "1 day, 23:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3266, "total_steps": 9627, "loss": 1.7518, "learning_rate": 7.41902794325126e-05, "epoch": 0.3392541809494131, "percentage": 33.93, "elapsed_time": "1 day, 0:13:33", "remaining_time": "1 day, 23:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3267, "total_steps": 9627, "loss": 1.6747, "learning_rate": 7.417599828124363e-05, "epoch": 0.33935805546899345, "percentage": 33.94, "elapsed_time": "1 day, 0:13:59", "remaining_time": "1 day, 23:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3268, "total_steps": 9627, "loss": 1.7727, "learning_rate": 7.416171455541943e-05, "epoch": 0.33946192998857383, "percentage": 33.95, "elapsed_time": "1 day, 0:14:25", "remaining_time": "1 day, 23:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3269, "total_steps": 9627, "loss": 1.6616, "learning_rate": 7.414742825656111e-05, "epoch": 0.33956580450815416, "percentage": 33.96, "elapsed_time": "1 day, 0:14:51", "remaining_time": "1 day, 23:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3270, "total_steps": 9627, "loss": 1.8302, "learning_rate": 7.413313938619003e-05, "epoch": 0.3396696790277345, "percentage": 33.97, "elapsed_time": "1 day, 0:15:17", "remaining_time": "1 day, 23:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3271, "total_steps": 9627, "loss": 1.7629, "learning_rate": 7.411884794582784e-05, "epoch": 0.33977355354731487, "percentage": 33.98, "elapsed_time": "1 day, 0:15:44", "remaining_time": "1 day, 23:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3272, "total_steps": 9627, "loss": 1.6549, "learning_rate": 7.410455393699647e-05, "epoch": 0.3398774280668952, "percentage": 33.99, "elapsed_time": "1 day, 0:16:10", "remaining_time": "1 day, 23:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3273, "total_steps": 9627, "loss": 1.6949, "learning_rate": 7.409025736121816e-05, "epoch": 0.3399813025864755, "percentage": 34.0, "elapsed_time": "1 day, 0:16:36", "remaining_time": "1 day, 23:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3274, "total_steps": 9627, "loss": 1.8114, "learning_rate": 7.407595822001532e-05, "epoch": 0.3400851771060559, "percentage": 34.01, "elapsed_time": "1 day, 0:17:02", "remaining_time": "1 day, 23:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3275, "total_steps": 9627, "loss": 1.6883, "learning_rate": 7.406165651491075e-05, "epoch": 0.34018905162563623, "percentage": 34.02, "elapsed_time": "1 day, 0:17:28", "remaining_time": "1 day, 23:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3276, "total_steps": 9627, "loss": 1.7254, "learning_rate": 7.404735224742745e-05, "epoch": 0.34029292614521656, "percentage": 34.03, "elapsed_time": "1 day, 0:17:53", "remaining_time": "1 day, 23:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3277, "total_steps": 9627, "loss": 1.6418, "learning_rate": 7.40330454190887e-05, "epoch": 0.34039680066479694, "percentage": 34.04, "elapsed_time": "1 day, 0:18:21", "remaining_time": "1 day, 23:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3278, "total_steps": 9627, "loss": 1.8138, "learning_rate": 7.401873603141809e-05, "epoch": 0.34050067518437727, "percentage": 34.05, "elapsed_time": "1 day, 0:18:47", "remaining_time": "1 day, 23:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3279, "total_steps": 9627, "loss": 1.9727, "learning_rate": 7.400442408593944e-05, "epoch": 0.3406045497039576, "percentage": 34.06, "elapsed_time": "1 day, 0:19:13", "remaining_time": "1 day, 23:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3280, "total_steps": 9627, "loss": 1.7511, "learning_rate": 7.399010958417684e-05, "epoch": 0.340708424223538, "percentage": 34.07, "elapsed_time": "1 day, 0:19:39", "remaining_time": "1 day, 23:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3281, "total_steps": 9627, "loss": 1.7119, "learning_rate": 7.397579252765475e-05, "epoch": 0.3408122987431183, "percentage": 34.08, "elapsed_time": "1 day, 0:20:05", "remaining_time": "1 day, 23:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3282, "total_steps": 9627, "loss": 1.7253, "learning_rate": 7.396147291789775e-05, "epoch": 0.3409161732626987, "percentage": 34.09, "elapsed_time": "1 day, 0:20:32", "remaining_time": "1 day, 23:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3283, "total_steps": 9627, "loss": 1.7831, "learning_rate": 7.394715075643078e-05, "epoch": 0.341020047782279, "percentage": 34.1, "elapsed_time": "1 day, 0:20:58", "remaining_time": "1 day, 23:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3284, "total_steps": 9627, "loss": 1.8239, "learning_rate": 7.393282604477907e-05, "epoch": 0.34112392230185934, "percentage": 34.11, "elapsed_time": "1 day, 0:21:24", "remaining_time": "1 day, 23:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3285, "total_steps": 9627, "loss": 1.8158, "learning_rate": 7.391849878446805e-05, "epoch": 0.3412277968214397, "percentage": 34.12, "elapsed_time": "1 day, 0:21:50", "remaining_time": "1 day, 23:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3286, "total_steps": 9627, "loss": 1.6549, "learning_rate": 7.39041689770235e-05, "epoch": 0.34133167134102005, "percentage": 34.13, "elapsed_time": "1 day, 0:22:16", "remaining_time": "1 day, 23:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3287, "total_steps": 9627, "loss": 1.8314, "learning_rate": 7.388983662397139e-05, "epoch": 0.3414355458606004, "percentage": 34.14, "elapsed_time": "1 day, 0:22:43", "remaining_time": "1 day, 23:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3288, "total_steps": 9627, "loss": 1.9213, "learning_rate": 7.387550172683803e-05, "epoch": 0.34153942038018076, "percentage": 34.15, "elapsed_time": "1 day, 0:23:09", "remaining_time": "1 day, 23:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3289, "total_steps": 9627, "loss": 1.7343, "learning_rate": 7.386116428715e-05, "epoch": 0.3416432948997611, "percentage": 34.16, "elapsed_time": "1 day, 0:23:36", "remaining_time": "1 day, 23:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3290, "total_steps": 9627, "loss": 1.6233, "learning_rate": 7.384682430643409e-05, "epoch": 0.3417471694193414, "percentage": 34.17, "elapsed_time": "1 day, 0:24:01", "remaining_time": "1 day, 22:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3291, "total_steps": 9627, "loss": 1.7206, "learning_rate": 7.383248178621739e-05, "epoch": 0.3418510439389218, "percentage": 34.19, "elapsed_time": "1 day, 0:24:28", "remaining_time": "1 day, 22:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3292, "total_steps": 9627, "loss": 1.6387, "learning_rate": 7.381813672802729e-05, "epoch": 0.3419549184585021, "percentage": 34.2, "elapsed_time": "1 day, 0:24:54", "remaining_time": "1 day, 22:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3293, "total_steps": 9627, "loss": 1.7021, "learning_rate": 7.380378913339142e-05, "epoch": 0.34205879297808245, "percentage": 34.21, "elapsed_time": "1 day, 0:25:20", "remaining_time": "1 day, 22:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3294, "total_steps": 9627, "loss": 1.6213, "learning_rate": 7.378943900383766e-05, "epoch": 0.34216266749766283, "percentage": 34.22, "elapsed_time": "1 day, 0:25:45", "remaining_time": "1 day, 22:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3295, "total_steps": 9627, "loss": 1.8177, "learning_rate": 7.377508634089422e-05, "epoch": 0.34226654201724316, "percentage": 34.23, "elapsed_time": "1 day, 0:26:13", "remaining_time": "1 day, 22:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3296, "total_steps": 9627, "loss": 1.7282, "learning_rate": 7.376073114608955e-05, "epoch": 0.34237041653682354, "percentage": 34.24, "elapsed_time": "1 day, 0:26:38", "remaining_time": "1 day, 22:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3297, "total_steps": 9627, "loss": 1.7302, "learning_rate": 7.374637342095236e-05, "epoch": 0.34247429105640387, "percentage": 34.25, "elapsed_time": "1 day, 0:27:05", "remaining_time": "1 day, 22:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3298, "total_steps": 9627, "loss": 1.6312, "learning_rate": 7.373201316701162e-05, "epoch": 0.3425781655759842, "percentage": 34.26, "elapsed_time": "1 day, 0:27:31", "remaining_time": "1 day, 22:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3299, "total_steps": 9627, "loss": 1.6591, "learning_rate": 7.371765038579658e-05, "epoch": 0.3426820400955646, "percentage": 34.27, "elapsed_time": "1 day, 0:27:56", "remaining_time": "1 day, 22:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 9627, "loss": 1.8358, "learning_rate": 7.37032850788368e-05, "epoch": 0.3427859146151449, "percentage": 34.28, "elapsed_time": "1 day, 0:28:23", "remaining_time": "1 day, 22:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3301, "total_steps": 9627, "loss": 1.7225, "learning_rate": 7.368891724766204e-05, "epoch": 0.34288978913472523, "percentage": 34.29, "elapsed_time": "1 day, 0:28:50", "remaining_time": "1 day, 22:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3302, "total_steps": 9627, "loss": 1.5813, "learning_rate": 7.367454689380238e-05, "epoch": 0.3429936636543056, "percentage": 34.3, "elapsed_time": "1 day, 0:29:16", "remaining_time": "1 day, 22:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3303, "total_steps": 9627, "loss": 1.8608, "learning_rate": 7.366017401878813e-05, "epoch": 0.34309753817388594, "percentage": 34.31, "elapsed_time": "1 day, 0:29:42", "remaining_time": "1 day, 22:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3304, "total_steps": 9627, "loss": 1.7135, "learning_rate": 7.364579862414993e-05, "epoch": 0.34320141269346627, "percentage": 34.32, "elapsed_time": "1 day, 0:30:09", "remaining_time": "1 day, 22:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3305, "total_steps": 9627, "loss": 1.8721, "learning_rate": 7.36314207114186e-05, "epoch": 0.34330528721304665, "percentage": 34.33, "elapsed_time": "1 day, 0:30:35", "remaining_time": "1 day, 22:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3306, "total_steps": 9627, "loss": 1.6559, "learning_rate": 7.36170402821253e-05, "epoch": 0.343409161732627, "percentage": 34.34, "elapsed_time": "1 day, 0:31:01", "remaining_time": "1 day, 22:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3307, "total_steps": 9627, "loss": 1.7733, "learning_rate": 7.360265733780142e-05, "epoch": 0.34351303625220736, "percentage": 34.35, "elapsed_time": "1 day, 0:31:26", "remaining_time": "1 day, 22:52:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3308, "total_steps": 9627, "loss": 1.5218, "learning_rate": 7.358827187997867e-05, "epoch": 0.3436169107717877, "percentage": 34.36, "elapsed_time": "1 day, 0:31:52", "remaining_time": "1 day, 22:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3309, "total_steps": 9627, "loss": 1.6683, "learning_rate": 7.357388391018893e-05, "epoch": 0.343720785291368, "percentage": 34.37, "elapsed_time": "1 day, 0:32:19", "remaining_time": "1 day, 22:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3310, "total_steps": 9627, "loss": 1.7642, "learning_rate": 7.355949342996447e-05, "epoch": 0.3438246598109484, "percentage": 34.38, "elapsed_time": "1 day, 0:32:45", "remaining_time": "1 day, 22:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3311, "total_steps": 9627, "loss": 1.7529, "learning_rate": 7.35451004408377e-05, "epoch": 0.3439285343305287, "percentage": 34.39, "elapsed_time": "1 day, 0:33:11", "remaining_time": "1 day, 22:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3312, "total_steps": 9627, "loss": 1.77, "learning_rate": 7.353070494434141e-05, "epoch": 0.34403240885010905, "percentage": 34.4, "elapsed_time": "1 day, 0:33:37", "remaining_time": "1 day, 22:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3313, "total_steps": 9627, "loss": 1.7528, "learning_rate": 7.351630694200857e-05, "epoch": 0.34413628336968943, "percentage": 34.41, "elapsed_time": "1 day, 0:34:02", "remaining_time": "1 day, 22:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3314, "total_steps": 9627, "loss": 1.677, "learning_rate": 7.35019064353725e-05, "epoch": 0.34424015788926976, "percentage": 34.42, "elapsed_time": "1 day, 0:34:29", "remaining_time": "1 day, 22:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3315, "total_steps": 9627, "loss": 1.9235, "learning_rate": 7.348750342596671e-05, "epoch": 0.3443440324088501, "percentage": 34.43, "elapsed_time": "1 day, 0:34:55", "remaining_time": "1 day, 22:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3316, "total_steps": 9627, "loss": 1.6732, "learning_rate": 7.3473097915325e-05, "epoch": 0.34444790692843047, "percentage": 34.44, "elapsed_time": "1 day, 0:35:21", "remaining_time": "1 day, 22:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3317, "total_steps": 9627, "loss": 1.6598, "learning_rate": 7.345868990498146e-05, "epoch": 0.3445517814480108, "percentage": 34.46, "elapsed_time": "1 day, 0:35:48", "remaining_time": "1 day, 22:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3318, "total_steps": 9627, "loss": 1.7695, "learning_rate": 7.344427939647045e-05, "epoch": 0.3446556559675911, "percentage": 34.47, "elapsed_time": "1 day, 0:36:14", "remaining_time": "1 day, 22:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3319, "total_steps": 9627, "loss": 1.6552, "learning_rate": 7.342986639132654e-05, "epoch": 0.3447595304871715, "percentage": 34.48, "elapsed_time": "1 day, 0:36:40", "remaining_time": "1 day, 22:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3320, "total_steps": 9627, "loss": 1.9607, "learning_rate": 7.341545089108464e-05, "epoch": 0.34486340500675183, "percentage": 34.49, "elapsed_time": "1 day, 0:37:06", "remaining_time": "1 day, 22:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3321, "total_steps": 9627, "loss": 1.7933, "learning_rate": 7.340103289727983e-05, "epoch": 0.3449672795263322, "percentage": 34.5, "elapsed_time": "1 day, 0:37:32", "remaining_time": "1 day, 22:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3322, "total_steps": 9627, "loss": 1.8795, "learning_rate": 7.338661241144758e-05, "epoch": 0.34507115404591254, "percentage": 34.51, "elapsed_time": "1 day, 0:37:58", "remaining_time": "1 day, 22:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3323, "total_steps": 9627, "loss": 1.764, "learning_rate": 7.337218943512353e-05, "epoch": 0.34517502856549287, "percentage": 34.52, "elapsed_time": "1 day, 0:38:25", "remaining_time": "1 day, 22:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3324, "total_steps": 9627, "loss": 1.814, "learning_rate": 7.335776396984361e-05, "epoch": 0.34527890308507325, "percentage": 34.53, "elapsed_time": "1 day, 0:38:51", "remaining_time": "1 day, 22:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3325, "total_steps": 9627, "loss": 1.5926, "learning_rate": 7.334333601714403e-05, "epoch": 0.3453827776046536, "percentage": 34.54, "elapsed_time": "1 day, 0:39:17", "remaining_time": "1 day, 22:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3326, "total_steps": 9627, "loss": 1.8246, "learning_rate": 7.332890557856125e-05, "epoch": 0.3454866521242339, "percentage": 34.55, "elapsed_time": "1 day, 0:39:43", "remaining_time": "1 day, 22:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3327, "total_steps": 9627, "loss": 1.5425, "learning_rate": 7.331447265563197e-05, "epoch": 0.3455905266438143, "percentage": 34.56, "elapsed_time": "1 day, 0:40:10", "remaining_time": "1 day, 22:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3328, "total_steps": 9627, "loss": 1.5314, "learning_rate": 7.330003724989324e-05, "epoch": 0.3456944011633946, "percentage": 34.57, "elapsed_time": "1 day, 0:40:36", "remaining_time": "1 day, 22:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3329, "total_steps": 9627, "loss": 1.688, "learning_rate": 7.328559936288228e-05, "epoch": 0.34579827568297494, "percentage": 34.58, "elapsed_time": "1 day, 0:41:03", "remaining_time": "1 day, 22:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3330, "total_steps": 9627, "loss": 1.8245, "learning_rate": 7.327115899613662e-05, "epoch": 0.3459021502025553, "percentage": 34.59, "elapsed_time": "1 day, 0:41:29", "remaining_time": "1 day, 22:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3331, "total_steps": 9627, "loss": 1.4173, "learning_rate": 7.325671615119407e-05, "epoch": 0.34600602472213565, "percentage": 34.6, "elapsed_time": "1 day, 0:41:55", "remaining_time": "1 day, 22:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3332, "total_steps": 9627, "loss": 1.7182, "learning_rate": 7.324227082959264e-05, "epoch": 0.34610989924171603, "percentage": 34.61, "elapsed_time": "1 day, 0:42:22", "remaining_time": "1 day, 22:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3333, "total_steps": 9627, "loss": 1.6838, "learning_rate": 7.322782303287067e-05, "epoch": 0.34621377376129636, "percentage": 34.62, "elapsed_time": "1 day, 0:42:48", "remaining_time": "1 day, 22:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3334, "total_steps": 9627, "loss": 1.8532, "learning_rate": 7.321337276256674e-05, "epoch": 0.3463176482808767, "percentage": 34.63, "elapsed_time": "1 day, 0:43:14", "remaining_time": "1 day, 22:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3335, "total_steps": 9627, "loss": 1.7919, "learning_rate": 7.319892002021966e-05, "epoch": 0.34642152280045707, "percentage": 34.64, "elapsed_time": "1 day, 0:43:40", "remaining_time": "1 day, 22:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3336, "total_steps": 9627, "loss": 1.6985, "learning_rate": 7.318446480736857e-05, "epoch": 0.3465253973200374, "percentage": 34.65, "elapsed_time": "1 day, 0:44:07", "remaining_time": "1 day, 22:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3337, "total_steps": 9627, "loss": 1.9947, "learning_rate": 7.317000712555283e-05, "epoch": 0.3466292718396177, "percentage": 34.66, "elapsed_time": "1 day, 0:44:33", "remaining_time": "1 day, 22:38:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3338, "total_steps": 9627, "loss": 1.7206, "learning_rate": 7.315554697631205e-05, "epoch": 0.3467331463591981, "percentage": 34.67, "elapsed_time": "1 day, 0:45:00", "remaining_time": "1 day, 22:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3339, "total_steps": 9627, "loss": 1.6871, "learning_rate": 7.314108436118614e-05, "epoch": 0.34683702087877843, "percentage": 34.68, "elapsed_time": "1 day, 0:45:26", "remaining_time": "1 day, 22:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3340, "total_steps": 9627, "loss": 1.5859, "learning_rate": 7.312661928171525e-05, "epoch": 0.34694089539835876, "percentage": 34.69, "elapsed_time": "1 day, 0:45:52", "remaining_time": "1 day, 22:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3341, "total_steps": 9627, "loss": 1.5721, "learning_rate": 7.311215173943982e-05, "epoch": 0.34704476991793914, "percentage": 34.7, "elapsed_time": "1 day, 0:46:19", "remaining_time": "1 day, 22:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3342, "total_steps": 9627, "loss": 1.6762, "learning_rate": 7.309768173590049e-05, "epoch": 0.34714864443751947, "percentage": 34.71, "elapsed_time": "1 day, 0:46:45", "remaining_time": "1 day, 22:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3343, "total_steps": 9627, "loss": 1.6709, "learning_rate": 7.308320927263823e-05, "epoch": 0.3472525189570998, "percentage": 34.73, "elapsed_time": "1 day, 0:47:12", "remaining_time": "1 day, 22:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3344, "total_steps": 9627, "loss": 1.7338, "learning_rate": 7.306873435119423e-05, "epoch": 0.3473563934766802, "percentage": 34.74, "elapsed_time": "1 day, 0:47:38", "remaining_time": "1 day, 22:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3345, "total_steps": 9627, "loss": 1.5917, "learning_rate": 7.305425697311e-05, "epoch": 0.3474602679962605, "percentage": 34.75, "elapsed_time": "1 day, 0:48:05", "remaining_time": "1 day, 22:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3346, "total_steps": 9627, "loss": 1.6511, "learning_rate": 7.30397771399272e-05, "epoch": 0.3475641425158409, "percentage": 34.76, "elapsed_time": "1 day, 0:48:32", "remaining_time": "1 day, 22:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3347, "total_steps": 9627, "loss": 1.6948, "learning_rate": 7.302529485318786e-05, "epoch": 0.3476680170354212, "percentage": 34.77, "elapsed_time": "1 day, 0:48:58", "remaining_time": "1 day, 22:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3348, "total_steps": 9627, "loss": 1.6319, "learning_rate": 7.301081011443423e-05, "epoch": 0.34777189155500154, "percentage": 34.78, "elapsed_time": "1 day, 0:49:24", "remaining_time": "1 day, 22:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3349, "total_steps": 9627, "loss": 1.7856, "learning_rate": 7.29963229252088e-05, "epoch": 0.3478757660745819, "percentage": 34.79, "elapsed_time": "1 day, 0:49:52", "remaining_time": "1 day, 22:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 9627, "loss": 1.65, "learning_rate": 7.298183328705436e-05, "epoch": 0.34797964059416225, "percentage": 34.8, "elapsed_time": "1 day, 0:50:18", "remaining_time": "1 day, 22:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3351, "total_steps": 9627, "loss": 1.8236, "learning_rate": 7.296734120151394e-05, "epoch": 0.3480835151137426, "percentage": 34.81, "elapsed_time": "1 day, 0:50:44", "remaining_time": "1 day, 22:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3352, "total_steps": 9627, "loss": 1.5903, "learning_rate": 7.295284667013083e-05, "epoch": 0.34818738963332296, "percentage": 34.82, "elapsed_time": "1 day, 0:51:11", "remaining_time": "1 day, 22:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3353, "total_steps": 9627, "loss": 1.8107, "learning_rate": 7.293834969444861e-05, "epoch": 0.3482912641529033, "percentage": 34.83, "elapsed_time": "1 day, 0:51:37", "remaining_time": "1 day, 22:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3354, "total_steps": 9627, "loss": 1.7677, "learning_rate": 7.292385027601105e-05, "epoch": 0.3483951386724836, "percentage": 34.84, "elapsed_time": "1 day, 0:52:04", "remaining_time": "1 day, 22:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3355, "total_steps": 9627, "loss": 1.6464, "learning_rate": 7.290934841636225e-05, "epoch": 0.348499013192064, "percentage": 34.85, "elapsed_time": "1 day, 0:52:30", "remaining_time": "1 day, 22:30:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3356, "total_steps": 9627, "loss": 1.7565, "learning_rate": 7.289484411704656e-05, "epoch": 0.3486028877116443, "percentage": 34.86, "elapsed_time": "1 day, 0:52:58", "remaining_time": "1 day, 22:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3357, "total_steps": 9627, "loss": 1.5508, "learning_rate": 7.288033737960855e-05, "epoch": 0.34870676223122465, "percentage": 34.87, "elapsed_time": "1 day, 0:53:23", "remaining_time": "1 day, 22:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3358, "total_steps": 9627, "loss": 1.6979, "learning_rate": 7.286582820559308e-05, "epoch": 0.34881063675080504, "percentage": 34.88, "elapsed_time": "1 day, 0:53:51", "remaining_time": "1 day, 22:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3359, "total_steps": 9627, "loss": 1.703, "learning_rate": 7.285131659654527e-05, "epoch": 0.34891451127038536, "percentage": 34.89, "elapsed_time": "1 day, 0:54:17", "remaining_time": "1 day, 22:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3360, "total_steps": 9627, "loss": 1.6348, "learning_rate": 7.283680255401049e-05, "epoch": 0.34901838578996575, "percentage": 34.9, "elapsed_time": "1 day, 0:54:43", "remaining_time": "1 day, 22:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3361, "total_steps": 9627, "loss": 1.7792, "learning_rate": 7.282228607953436e-05, "epoch": 0.3491222603095461, "percentage": 34.91, "elapsed_time": "1 day, 0:55:11", "remaining_time": "1 day, 22:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3362, "total_steps": 9627, "loss": 1.7119, "learning_rate": 7.28077671746628e-05, "epoch": 0.3492261348291264, "percentage": 34.92, "elapsed_time": "1 day, 0:55:37", "remaining_time": "1 day, 22:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3363, "total_steps": 9627, "loss": 1.8279, "learning_rate": 7.279324584094194e-05, "epoch": 0.3493300093487068, "percentage": 34.93, "elapsed_time": "1 day, 0:56:03", "remaining_time": "1 day, 22:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3364, "total_steps": 9627, "loss": 1.6366, "learning_rate": 7.277872207991818e-05, "epoch": 0.3494338838682871, "percentage": 34.94, "elapsed_time": "1 day, 0:56:30", "remaining_time": "1 day, 22:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3365, "total_steps": 9627, "loss": 1.6741, "learning_rate": 7.276419589313821e-05, "epoch": 0.34953775838786744, "percentage": 34.95, "elapsed_time": "1 day, 0:56:57", "remaining_time": "1 day, 22:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3366, "total_steps": 9627, "loss": 1.7447, "learning_rate": 7.274966728214895e-05, "epoch": 0.3496416329074478, "percentage": 34.96, "elapsed_time": "1 day, 0:57:24", "remaining_time": "1 day, 22:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3367, "total_steps": 9627, "loss": 1.9171, "learning_rate": 7.273513624849757e-05, "epoch": 0.34974550742702815, "percentage": 34.97, "elapsed_time": "1 day, 0:57:50", "remaining_time": "1 day, 22:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3368, "total_steps": 9627, "loss": 1.7925, "learning_rate": 7.272060279373152e-05, "epoch": 0.3498493819466085, "percentage": 34.98, "elapsed_time": "1 day, 0:58:16", "remaining_time": "1 day, 22:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3369, "total_steps": 9627, "loss": 1.6959, "learning_rate": 7.27060669193985e-05, "epoch": 0.34995325646618886, "percentage": 35.0, "elapsed_time": "1 day, 0:58:44", "remaining_time": "1 day, 22:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3370, "total_steps": 9627, "loss": 1.7667, "learning_rate": 7.269152862704647e-05, "epoch": 0.3500571309857692, "percentage": 35.01, "elapsed_time": "1 day, 0:59:10", "remaining_time": "1 day, 22:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3371, "total_steps": 9627, "loss": 1.8386, "learning_rate": 7.267698791822363e-05, "epoch": 0.35016100550534957, "percentage": 35.02, "elapsed_time": "1 day, 0:59:38", "remaining_time": "1 day, 22:23:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3372, "total_steps": 9627, "loss": 1.9704, "learning_rate": 7.266244479447847e-05, "epoch": 0.3502648800249299, "percentage": 35.03, "elapsed_time": "1 day, 1:00:04", "remaining_time": "1 day, 22:22:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3373, "total_steps": 9627, "loss": 1.9084, "learning_rate": 7.264789925735974e-05, "epoch": 0.3503687545445102, "percentage": 35.04, "elapsed_time": "1 day, 1:00:30", "remaining_time": "1 day, 22:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3374, "total_steps": 9627, "loss": 1.7802, "learning_rate": 7.263335130841638e-05, "epoch": 0.3504726290640906, "percentage": 35.05, "elapsed_time": "1 day, 1:00:57", "remaining_time": "1 day, 22:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3375, "total_steps": 9627, "loss": 1.6945, "learning_rate": 7.261880094919765e-05, "epoch": 0.35057650358367093, "percentage": 35.06, "elapsed_time": "1 day, 1:01:23", "remaining_time": "1 day, 22:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3376, "total_steps": 9627, "loss": 1.7436, "learning_rate": 7.260424818125305e-05, "epoch": 0.35068037810325126, "percentage": 35.07, "elapsed_time": "1 day, 1:01:51", "remaining_time": "1 day, 22:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3377, "total_steps": 9627, "loss": 1.7358, "learning_rate": 7.258969300613233e-05, "epoch": 0.35078425262283164, "percentage": 35.08, "elapsed_time": "1 day, 1:02:17", "remaining_time": "1 day, 22:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3378, "total_steps": 9627, "loss": 1.8172, "learning_rate": 7.257513542538553e-05, "epoch": 0.35088812714241197, "percentage": 35.09, "elapsed_time": "1 day, 1:02:44", "remaining_time": "1 day, 22:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3379, "total_steps": 9627, "loss": 1.6052, "learning_rate": 7.25605754405629e-05, "epoch": 0.3509920016619923, "percentage": 35.1, "elapsed_time": "1 day, 1:03:11", "remaining_time": "1 day, 22:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3380, "total_steps": 9627, "loss": 1.7486, "learning_rate": 7.254601305321496e-05, "epoch": 0.3510958761815727, "percentage": 35.11, "elapsed_time": "1 day, 1:03:38", "remaining_time": "1 day, 22:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3381, "total_steps": 9627, "loss": 1.6068, "learning_rate": 7.253144826489249e-05, "epoch": 0.351199750701153, "percentage": 35.12, "elapsed_time": "1 day, 1:04:04", "remaining_time": "1 day, 22:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3382, "total_steps": 9627, "loss": 1.6542, "learning_rate": 7.251688107714654e-05, "epoch": 0.35130362522073333, "percentage": 35.13, "elapsed_time": "1 day, 1:04:31", "remaining_time": "1 day, 22:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3383, "total_steps": 9627, "loss": 1.8309, "learning_rate": 7.250231149152838e-05, "epoch": 0.3514074997403137, "percentage": 35.14, "elapsed_time": "1 day, 1:04:57", "remaining_time": "1 day, 22:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3384, "total_steps": 9627, "loss": 1.735, "learning_rate": 7.248773950958958e-05, "epoch": 0.35151137425989404, "percentage": 35.15, "elapsed_time": "1 day, 1:05:25", "remaining_time": "1 day, 22:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3385, "total_steps": 9627, "loss": 1.5545, "learning_rate": 7.247316513288192e-05, "epoch": 0.3516152487794744, "percentage": 35.16, "elapsed_time": "1 day, 1:05:51", "remaining_time": "1 day, 22:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3386, "total_steps": 9627, "loss": 1.748, "learning_rate": 7.245858836295749e-05, "epoch": 0.35171912329905475, "percentage": 35.17, "elapsed_time": "1 day, 1:06:19", "remaining_time": "1 day, 22:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3387, "total_steps": 9627, "loss": 1.703, "learning_rate": 7.244400920136858e-05, "epoch": 0.3518229978186351, "percentage": 35.18, "elapsed_time": "1 day, 1:06:45", "remaining_time": "1 day, 22:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3388, "total_steps": 9627, "loss": 1.6779, "learning_rate": 7.242942764966776e-05, "epoch": 0.35192687233821546, "percentage": 35.19, "elapsed_time": "1 day, 1:07:12", "remaining_time": "1 day, 22:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3389, "total_steps": 9627, "loss": 1.7014, "learning_rate": 7.241484370940784e-05, "epoch": 0.3520307468577958, "percentage": 35.2, "elapsed_time": "1 day, 1:07:40", "remaining_time": "1 day, 22:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3390, "total_steps": 9627, "loss": 1.6532, "learning_rate": 7.240025738214192e-05, "epoch": 0.3521346213773761, "percentage": 35.21, "elapsed_time": "1 day, 1:08:05", "remaining_time": "1 day, 22:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3391, "total_steps": 9627, "loss": 1.9818, "learning_rate": 7.238566866942332e-05, "epoch": 0.3522384958969565, "percentage": 35.22, "elapsed_time": "1 day, 1:08:33", "remaining_time": "1 day, 22:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3392, "total_steps": 9627, "loss": 1.7702, "learning_rate": 7.23710775728056e-05, "epoch": 0.3523423704165368, "percentage": 35.23, "elapsed_time": "1 day, 1:09:00", "remaining_time": "1 day, 22:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3393, "total_steps": 9627, "loss": 1.6614, "learning_rate": 7.235648409384263e-05, "epoch": 0.35244624493611715, "percentage": 35.24, "elapsed_time": "1 day, 1:09:26", "remaining_time": "1 day, 22:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3394, "total_steps": 9627, "loss": 1.6692, "learning_rate": 7.234188823408851e-05, "epoch": 0.35255011945569753, "percentage": 35.26, "elapsed_time": "1 day, 1:09:54", "remaining_time": "1 day, 22:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3395, "total_steps": 9627, "loss": 1.7263, "learning_rate": 7.232728999509754e-05, "epoch": 0.35265399397527786, "percentage": 35.27, "elapsed_time": "1 day, 1:10:20", "remaining_time": "1 day, 22:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3396, "total_steps": 9627, "loss": 1.7052, "learning_rate": 7.231268937842438e-05, "epoch": 0.3527578684948582, "percentage": 35.28, "elapsed_time": "1 day, 1:10:47", "remaining_time": "1 day, 22:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3397, "total_steps": 9627, "loss": 1.659, "learning_rate": 7.229808638562381e-05, "epoch": 0.35286174301443857, "percentage": 35.29, "elapsed_time": "1 day, 1:11:14", "remaining_time": "1 day, 22:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3398, "total_steps": 9627, "loss": 1.5006, "learning_rate": 7.228348101825099e-05, "epoch": 0.3529656175340189, "percentage": 35.3, "elapsed_time": "1 day, 1:11:42", "remaining_time": "1 day, 22:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3399, "total_steps": 9627, "loss": 1.8323, "learning_rate": 7.226887327786125e-05, "epoch": 0.3530694920535993, "percentage": 35.31, "elapsed_time": "1 day, 1:12:09", "remaining_time": "1 day, 22:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 9627, "loss": 1.6357, "learning_rate": 7.22542631660102e-05, "epoch": 0.3531733665731796, "percentage": 35.32, "elapsed_time": "1 day, 1:12:36", "remaining_time": "1 day, 22:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3401, "total_steps": 9627, "loss": 1.7819, "learning_rate": 7.223965068425376e-05, "epoch": 0.35327724109275993, "percentage": 35.33, "elapsed_time": "1 day, 1:13:02", "remaining_time": "1 day, 22:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3402, "total_steps": 9627, "loss": 1.6478, "learning_rate": 7.222503583414795e-05, "epoch": 0.3533811156123403, "percentage": 35.34, "elapsed_time": "1 day, 1:13:30", "remaining_time": "1 day, 22:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3403, "total_steps": 9627, "loss": 1.8901, "learning_rate": 7.22104186172492e-05, "epoch": 0.35348499013192064, "percentage": 35.35, "elapsed_time": "1 day, 1:13:56", "remaining_time": "1 day, 22:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3404, "total_steps": 9627, "loss": 1.7524, "learning_rate": 7.219579903511412e-05, "epoch": 0.35358886465150097, "percentage": 35.36, "elapsed_time": "1 day, 1:14:24", "remaining_time": "1 day, 22:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3405, "total_steps": 9627, "loss": 1.6646, "learning_rate": 7.218117708929957e-05, "epoch": 0.35369273917108135, "percentage": 35.37, "elapsed_time": "1 day, 1:14:50", "remaining_time": "1 day, 22:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3406, "total_steps": 9627, "loss": 1.8199, "learning_rate": 7.216655278136269e-05, "epoch": 0.3537966136906617, "percentage": 35.38, "elapsed_time": "1 day, 1:15:18", "remaining_time": "1 day, 22:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3407, "total_steps": 9627, "loss": 1.5446, "learning_rate": 7.215192611286083e-05, "epoch": 0.353900488210242, "percentage": 35.39, "elapsed_time": "1 day, 1:15:45", "remaining_time": "1 day, 22:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3408, "total_steps": 9627, "loss": 1.4702, "learning_rate": 7.213729708535164e-05, "epoch": 0.3540043627298224, "percentage": 35.4, "elapsed_time": "1 day, 1:16:11", "remaining_time": "1 day, 22:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3409, "total_steps": 9627, "loss": 1.7324, "learning_rate": 7.212266570039299e-05, "epoch": 0.3541082372494027, "percentage": 35.41, "elapsed_time": "1 day, 1:16:39", "remaining_time": "1 day, 22:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3410, "total_steps": 9627, "loss": 1.7712, "learning_rate": 7.2108031959543e-05, "epoch": 0.3542121117689831, "percentage": 35.42, "elapsed_time": "1 day, 1:17:05", "remaining_time": "1 day, 22:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3411, "total_steps": 9627, "loss": 1.5812, "learning_rate": 7.209339586436005e-05, "epoch": 0.3543159862885634, "percentage": 35.43, "elapsed_time": "1 day, 1:17:32", "remaining_time": "1 day, 22:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3412, "total_steps": 9627, "loss": 1.4846, "learning_rate": 7.20787574164028e-05, "epoch": 0.35441986080814375, "percentage": 35.44, "elapsed_time": "1 day, 1:17:59", "remaining_time": "1 day, 22:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3413, "total_steps": 9627, "loss": 1.7985, "learning_rate": 7.206411661723007e-05, "epoch": 0.35452373532772413, "percentage": 35.45, "elapsed_time": "1 day, 1:18:27", "remaining_time": "1 day, 22:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3414, "total_steps": 9627, "loss": 1.7178, "learning_rate": 7.204947346840106e-05, "epoch": 0.35462760984730446, "percentage": 35.46, "elapsed_time": "1 day, 1:18:53", "remaining_time": "1 day, 22:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3415, "total_steps": 9627, "loss": 1.5386, "learning_rate": 7.203482797147512e-05, "epoch": 0.3547314843668848, "percentage": 35.47, "elapsed_time": "1 day, 1:19:21", "remaining_time": "1 day, 22:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3416, "total_steps": 9627, "loss": 1.8462, "learning_rate": 7.202018012801185e-05, "epoch": 0.35483535888646517, "percentage": 35.48, "elapsed_time": "1 day, 1:19:47", "remaining_time": "1 day, 22:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3417, "total_steps": 9627, "loss": 1.6743, "learning_rate": 7.200552993957117e-05, "epoch": 0.3549392334060455, "percentage": 35.49, "elapsed_time": "1 day, 1:20:15", "remaining_time": "1 day, 22:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3418, "total_steps": 9627, "loss": 1.6801, "learning_rate": 7.199087740771321e-05, "epoch": 0.3550431079256258, "percentage": 35.5, "elapsed_time": "1 day, 1:20:42", "remaining_time": "1 day, 22:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3419, "total_steps": 9627, "loss": 1.9052, "learning_rate": 7.197622253399833e-05, "epoch": 0.3551469824452062, "percentage": 35.51, "elapsed_time": "1 day, 1:21:08", "remaining_time": "1 day, 22:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3420, "total_steps": 9627, "loss": 1.6895, "learning_rate": 7.196156531998718e-05, "epoch": 0.35525085696478653, "percentage": 35.53, "elapsed_time": "1 day, 1:21:36", "remaining_time": "1 day, 22:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3421, "total_steps": 9627, "loss": 1.6898, "learning_rate": 7.194690576724064e-05, "epoch": 0.35535473148436686, "percentage": 35.54, "elapsed_time": "1 day, 1:22:03", "remaining_time": "1 day, 22:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3422, "total_steps": 9627, "loss": 1.7735, "learning_rate": 7.19322438773198e-05, "epoch": 0.35545860600394724, "percentage": 35.55, "elapsed_time": "1 day, 1:22:30", "remaining_time": "1 day, 22:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3423, "total_steps": 9627, "loss": 1.7066, "learning_rate": 7.191757965178609e-05, "epoch": 0.35556248052352757, "percentage": 35.56, "elapsed_time": "1 day, 1:22:57", "remaining_time": "1 day, 22:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3424, "total_steps": 9627, "loss": 1.622, "learning_rate": 7.19029130922011e-05, "epoch": 0.35566635504310795, "percentage": 35.57, "elapsed_time": "1 day, 1:23:24", "remaining_time": "1 day, 21:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3425, "total_steps": 9627, "loss": 1.5406, "learning_rate": 7.188824420012671e-05, "epoch": 0.3557702295626883, "percentage": 35.58, "elapsed_time": "1 day, 1:23:52", "remaining_time": "1 day, 21:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3426, "total_steps": 9627, "loss": 1.6681, "learning_rate": 7.187357297712506e-05, "epoch": 0.3558741040822686, "percentage": 35.59, "elapsed_time": "1 day, 1:24:19", "remaining_time": "1 day, 21:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3427, "total_steps": 9627, "loss": 1.7488, "learning_rate": 7.185889942475851e-05, "epoch": 0.355977978601849, "percentage": 35.6, "elapsed_time": "1 day, 1:24:45", "remaining_time": "1 day, 21:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3428, "total_steps": 9627, "loss": 1.6041, "learning_rate": 7.184422354458966e-05, "epoch": 0.3560818531214293, "percentage": 35.61, "elapsed_time": "1 day, 1:25:13", "remaining_time": "1 day, 21:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3429, "total_steps": 9627, "loss": 1.7968, "learning_rate": 7.182954533818142e-05, "epoch": 0.35618572764100964, "percentage": 35.62, "elapsed_time": "1 day, 1:25:39", "remaining_time": "1 day, 21:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3430, "total_steps": 9627, "loss": 1.7446, "learning_rate": 7.181486480709687e-05, "epoch": 0.35628960216059, "percentage": 35.63, "elapsed_time": "1 day, 1:26:07", "remaining_time": "1 day, 21:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3431, "total_steps": 9627, "loss": 1.7684, "learning_rate": 7.180018195289937e-05, "epoch": 0.35639347668017035, "percentage": 35.64, "elapsed_time": "1 day, 1:26:34", "remaining_time": "1 day, 21:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3432, "total_steps": 9627, "loss": 1.7591, "learning_rate": 7.178549677715254e-05, "epoch": 0.3564973511997507, "percentage": 35.65, "elapsed_time": "1 day, 1:27:01", "remaining_time": "1 day, 21:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3433, "total_steps": 9627, "loss": 1.8228, "learning_rate": 7.177080928142024e-05, "epoch": 0.35660122571933106, "percentage": 35.66, "elapsed_time": "1 day, 1:27:28", "remaining_time": "1 day, 21:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3434, "total_steps": 9627, "loss": 1.7026, "learning_rate": 7.175611946726657e-05, "epoch": 0.3567051002389114, "percentage": 35.67, "elapsed_time": "1 day, 1:27:55", "remaining_time": "1 day, 21:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3435, "total_steps": 9627, "loss": 1.4263, "learning_rate": 7.174142733625589e-05, "epoch": 0.3568089747584917, "percentage": 35.68, "elapsed_time": "1 day, 1:28:23", "remaining_time": "1 day, 21:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3436, "total_steps": 9627, "loss": 1.6076, "learning_rate": 7.172673288995277e-05, "epoch": 0.3569128492780721, "percentage": 35.69, "elapsed_time": "1 day, 1:28:49", "remaining_time": "1 day, 21:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3437, "total_steps": 9627, "loss": 1.7049, "learning_rate": 7.171203612992209e-05, "epoch": 0.3570167237976524, "percentage": 35.7, "elapsed_time": "1 day, 1:29:17", "remaining_time": "1 day, 21:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3438, "total_steps": 9627, "loss": 1.5924, "learning_rate": 7.169733705772891e-05, "epoch": 0.3571205983172328, "percentage": 35.71, "elapsed_time": "1 day, 1:29:44", "remaining_time": "1 day, 21:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3439, "total_steps": 9627, "loss": 1.8338, "learning_rate": 7.168263567493859e-05, "epoch": 0.35722447283681313, "percentage": 35.72, "elapsed_time": "1 day, 1:30:12", "remaining_time": "1 day, 21:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3440, "total_steps": 9627, "loss": 1.8652, "learning_rate": 7.16679319831167e-05, "epoch": 0.35732834735639346, "percentage": 35.73, "elapsed_time": "1 day, 1:30:39", "remaining_time": "1 day, 21:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3441, "total_steps": 9627, "loss": 1.8941, "learning_rate": 7.165322598382905e-05, "epoch": 0.35743222187597384, "percentage": 35.74, "elapsed_time": "1 day, 1:31:06", "remaining_time": "1 day, 21:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3442, "total_steps": 9627, "loss": 1.8183, "learning_rate": 7.163851767864176e-05, "epoch": 0.35753609639555417, "percentage": 35.75, "elapsed_time": "1 day, 1:31:33", "remaining_time": "1 day, 21:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3443, "total_steps": 9627, "loss": 1.7119, "learning_rate": 7.162380706912112e-05, "epoch": 0.3576399709151345, "percentage": 35.76, "elapsed_time": "1 day, 1:31:59", "remaining_time": "1 day, 21:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3444, "total_steps": 9627, "loss": 1.5949, "learning_rate": 7.16090941568337e-05, "epoch": 0.3577438454347149, "percentage": 35.77, "elapsed_time": "1 day, 1:32:27", "remaining_time": "1 day, 21:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3445, "total_steps": 9627, "loss": 1.5768, "learning_rate": 7.159437894334629e-05, "epoch": 0.3578477199542952, "percentage": 35.78, "elapsed_time": "1 day, 1:32:54", "remaining_time": "1 day, 21:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3446, "total_steps": 9627, "loss": 1.7067, "learning_rate": 7.157966143022599e-05, "epoch": 0.35795159447387553, "percentage": 35.8, "elapsed_time": "1 day, 1:33:21", "remaining_time": "1 day, 21:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3447, "total_steps": 9627, "loss": 1.6634, "learning_rate": 7.156494161904005e-05, "epoch": 0.3580554689934559, "percentage": 35.81, "elapsed_time": "1 day, 1:33:48", "remaining_time": "1 day, 21:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3448, "total_steps": 9627, "loss": 1.6025, "learning_rate": 7.155021951135605e-05, "epoch": 0.35815934351303624, "percentage": 35.82, "elapsed_time": "1 day, 1:34:14", "remaining_time": "1 day, 21:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3449, "total_steps": 9627, "loss": 1.709, "learning_rate": 7.153549510874178e-05, "epoch": 0.3582632180326166, "percentage": 35.83, "elapsed_time": "1 day, 1:34:42", "remaining_time": "1 day, 21:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3450, "total_steps": 9627, "loss": 1.6638, "learning_rate": 7.152076841276527e-05, "epoch": 0.35836709255219695, "percentage": 35.84, "elapsed_time": "1 day, 1:35:09", "remaining_time": "1 day, 21:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3451, "total_steps": 9627, "loss": 1.7261, "learning_rate": 7.150603942499478e-05, "epoch": 0.3584709670717773, "percentage": 35.85, "elapsed_time": "1 day, 1:35:37", "remaining_time": "1 day, 21:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3452, "total_steps": 9627, "loss": 1.7373, "learning_rate": 7.149130814699884e-05, "epoch": 0.35857484159135766, "percentage": 35.86, "elapsed_time": "1 day, 1:36:03", "remaining_time": "1 day, 21:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3453, "total_steps": 9627, "loss": 1.6811, "learning_rate": 7.147657458034622e-05, "epoch": 0.358678716110938, "percentage": 35.87, "elapsed_time": "1 day, 1:36:32", "remaining_time": "1 day, 21:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3454, "total_steps": 9627, "loss": 1.6032, "learning_rate": 7.146183872660595e-05, "epoch": 0.3587825906305183, "percentage": 35.88, "elapsed_time": "1 day, 1:36:58", "remaining_time": "1 day, 21:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3455, "total_steps": 9627, "loss": 1.5488, "learning_rate": 7.144710058734724e-05, "epoch": 0.3588864651500987, "percentage": 35.89, "elapsed_time": "1 day, 1:37:25", "remaining_time": "1 day, 21:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3456, "total_steps": 9627, "loss": 1.6905, "learning_rate": 7.143236016413963e-05, "epoch": 0.358990339669679, "percentage": 35.9, "elapsed_time": "1 day, 1:37:53", "remaining_time": "1 day, 21:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3457, "total_steps": 9627, "loss": 1.7514, "learning_rate": 7.141761745855284e-05, "epoch": 0.35909421418925935, "percentage": 35.91, "elapsed_time": "1 day, 1:38:19", "remaining_time": "1 day, 21:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3458, "total_steps": 9627, "loss": 1.3697, "learning_rate": 7.140287247215685e-05, "epoch": 0.35919808870883974, "percentage": 35.92, "elapsed_time": "1 day, 1:38:47", "remaining_time": "1 day, 21:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3459, "total_steps": 9627, "loss": 1.6055, "learning_rate": 7.13881252065219e-05, "epoch": 0.35930196322842006, "percentage": 35.93, "elapsed_time": "1 day, 1:39:15", "remaining_time": "1 day, 21:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3460, "total_steps": 9627, "loss": 1.7294, "learning_rate": 7.137337566321844e-05, "epoch": 0.3594058377480004, "percentage": 35.94, "elapsed_time": "1 day, 1:39:42", "remaining_time": "1 day, 21:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3461, "total_steps": 9627, "loss": 1.8147, "learning_rate": 7.135862384381717e-05, "epoch": 0.35950971226758077, "percentage": 35.95, "elapsed_time": "1 day, 1:40:08", "remaining_time": "1 day, 21:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3462, "total_steps": 9627, "loss": 1.5631, "learning_rate": 7.134386974988909e-05, "epoch": 0.3596135867871611, "percentage": 35.96, "elapsed_time": "1 day, 1:40:36", "remaining_time": "1 day, 21:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3463, "total_steps": 9627, "loss": 1.8052, "learning_rate": 7.132911338300537e-05, "epoch": 0.3597174613067415, "percentage": 35.97, "elapsed_time": "1 day, 1:41:02", "remaining_time": "1 day, 21:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3464, "total_steps": 9627, "loss": 1.8405, "learning_rate": 7.131435474473744e-05, "epoch": 0.3598213358263218, "percentage": 35.98, "elapsed_time": "1 day, 1:41:29", "remaining_time": "1 day, 21:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3465, "total_steps": 9627, "loss": 1.6957, "learning_rate": 7.1299593836657e-05, "epoch": 0.35992521034590214, "percentage": 35.99, "elapsed_time": "1 day, 1:41:58", "remaining_time": "1 day, 21:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3466, "total_steps": 9627, "loss": 1.6149, "learning_rate": 7.128483066033594e-05, "epoch": 0.3600290848654825, "percentage": 36.0, "elapsed_time": "1 day, 1:42:25", "remaining_time": "1 day, 21:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3467, "total_steps": 9627, "loss": 1.7836, "learning_rate": 7.127006521734646e-05, "epoch": 0.36013295938506285, "percentage": 36.01, "elapsed_time": "1 day, 1:42:52", "remaining_time": "1 day, 21:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3468, "total_steps": 9627, "loss": 1.7712, "learning_rate": 7.125529750926094e-05, "epoch": 0.36023683390464317, "percentage": 36.02, "elapsed_time": "1 day, 1:43:19", "remaining_time": "1 day, 21:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3469, "total_steps": 9627, "loss": 1.7435, "learning_rate": 7.124052753765202e-05, "epoch": 0.36034070842422355, "percentage": 36.03, "elapsed_time": "1 day, 1:43:46", "remaining_time": "1 day, 21:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3470, "total_steps": 9627, "loss": 1.4758, "learning_rate": 7.122575530409262e-05, "epoch": 0.3604445829438039, "percentage": 36.04, "elapsed_time": "1 day, 1:44:13", "remaining_time": "1 day, 21:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3471, "total_steps": 9627, "loss": 1.6, "learning_rate": 7.121098081015586e-05, "epoch": 0.3605484574633842, "percentage": 36.05, "elapsed_time": "1 day, 1:44:41", "remaining_time": "1 day, 21:39:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3472, "total_steps": 9627, "loss": 1.845, "learning_rate": 7.119620405741506e-05, "epoch": 0.3606523319829646, "percentage": 36.07, "elapsed_time": "1 day, 1:45:08", "remaining_time": "1 day, 21:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3473, "total_steps": 9627, "loss": 1.7532, "learning_rate": 7.118142504744389e-05, "epoch": 0.3607562065025449, "percentage": 36.08, "elapsed_time": "1 day, 1:45:36", "remaining_time": "1 day, 21:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3474, "total_steps": 9627, "loss": 1.7787, "learning_rate": 7.116664378181616e-05, "epoch": 0.36086008102212525, "percentage": 36.09, "elapsed_time": "1 day, 1:46:03", "remaining_time": "1 day, 21:38:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3475, "total_steps": 9627, "loss": 1.7785, "learning_rate": 7.115186026210597e-05, "epoch": 0.36096395554170563, "percentage": 36.1, "elapsed_time": "1 day, 1:46:30", "remaining_time": "1 day, 21:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3476, "total_steps": 9627, "loss": 1.6208, "learning_rate": 7.113707448988767e-05, "epoch": 0.36106783006128595, "percentage": 36.11, "elapsed_time": "1 day, 1:46:57", "remaining_time": "1 day, 21:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3477, "total_steps": 9627, "loss": 1.66, "learning_rate": 7.11222864667358e-05, "epoch": 0.36117170458086634, "percentage": 36.12, "elapsed_time": "1 day, 1:47:26", "remaining_time": "1 day, 21:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3478, "total_steps": 9627, "loss": 1.6975, "learning_rate": 7.110749619422519e-05, "epoch": 0.36127557910044666, "percentage": 36.13, "elapsed_time": "1 day, 1:47:52", "remaining_time": "1 day, 21:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3479, "total_steps": 9627, "loss": 1.7015, "learning_rate": 7.109270367393088e-05, "epoch": 0.361379453620027, "percentage": 36.14, "elapsed_time": "1 day, 1:48:20", "remaining_time": "1 day, 21:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3480, "total_steps": 9627, "loss": 1.7778, "learning_rate": 7.107790890742815e-05, "epoch": 0.3614833281396074, "percentage": 36.15, "elapsed_time": "1 day, 1:48:46", "remaining_time": "1 day, 21:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3481, "total_steps": 9627, "loss": 1.8917, "learning_rate": 7.106311189629253e-05, "epoch": 0.3615872026591877, "percentage": 36.16, "elapsed_time": "1 day, 1:49:15", "remaining_time": "1 day, 21:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3482, "total_steps": 9627, "loss": 1.6972, "learning_rate": 7.104831264209982e-05, "epoch": 0.36169107717876803, "percentage": 36.17, "elapsed_time": "1 day, 1:49:41", "remaining_time": "1 day, 21:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3483, "total_steps": 9627, "loss": 1.5879, "learning_rate": 7.103351114642596e-05, "epoch": 0.3617949516983484, "percentage": 36.18, "elapsed_time": "1 day, 1:50:10", "remaining_time": "1 day, 21:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3484, "total_steps": 9627, "loss": 1.7124, "learning_rate": 7.101870741084726e-05, "epoch": 0.36189882621792874, "percentage": 36.19, "elapsed_time": "1 day, 1:50:37", "remaining_time": "1 day, 21:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3485, "total_steps": 9627, "loss": 1.681, "learning_rate": 7.100390143694016e-05, "epoch": 0.36200270073750906, "percentage": 36.2, "elapsed_time": "1 day, 1:51:05", "remaining_time": "1 day, 21:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3486, "total_steps": 9627, "loss": 1.703, "learning_rate": 7.098909322628138e-05, "epoch": 0.36210657525708945, "percentage": 36.21, "elapsed_time": "1 day, 1:51:31", "remaining_time": "1 day, 21:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3487, "total_steps": 9627, "loss": 1.7333, "learning_rate": 7.097428278044792e-05, "epoch": 0.3622104497766698, "percentage": 36.22, "elapsed_time": "1 day, 1:52:00", "remaining_time": "1 day, 21:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3488, "total_steps": 9627, "loss": 1.713, "learning_rate": 7.095947010101693e-05, "epoch": 0.36231432429625016, "percentage": 36.23, "elapsed_time": "1 day, 1:52:26", "remaining_time": "1 day, 21:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3489, "total_steps": 9627, "loss": 1.7749, "learning_rate": 7.094465518956588e-05, "epoch": 0.3624181988158305, "percentage": 36.24, "elapsed_time": "1 day, 1:52:54", "remaining_time": "1 day, 21:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3490, "total_steps": 9627, "loss": 1.6216, "learning_rate": 7.092983804767242e-05, "epoch": 0.3625220733354108, "percentage": 36.25, "elapsed_time": "1 day, 1:53:21", "remaining_time": "1 day, 21:31:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3491, "total_steps": 9627, "loss": 1.6914, "learning_rate": 7.091501867691446e-05, "epoch": 0.3626259478549912, "percentage": 36.26, "elapsed_time": "1 day, 1:53:49", "remaining_time": "1 day, 21:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3492, "total_steps": 9627, "loss": 1.4819, "learning_rate": 7.090019707887017e-05, "epoch": 0.3627298223745715, "percentage": 36.27, "elapsed_time": "1 day, 1:54:16", "remaining_time": "1 day, 21:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3493, "total_steps": 9627, "loss": 1.6425, "learning_rate": 7.08853732551179e-05, "epoch": 0.36283369689415185, "percentage": 36.28, "elapsed_time": "1 day, 1:54:42", "remaining_time": "1 day, 21:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3494, "total_steps": 9627, "loss": 1.6724, "learning_rate": 7.087054720723629e-05, "epoch": 0.36293757141373223, "percentage": 36.29, "elapsed_time": "1 day, 1:55:11", "remaining_time": "1 day, 21:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3495, "total_steps": 9627, "loss": 1.7549, "learning_rate": 7.085571893680421e-05, "epoch": 0.36304144593331256, "percentage": 36.3, "elapsed_time": "1 day, 1:55:37", "remaining_time": "1 day, 21:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3496, "total_steps": 9627, "loss": 1.7959, "learning_rate": 7.084088844540074e-05, "epoch": 0.3631453204528929, "percentage": 36.31, "elapsed_time": "1 day, 1:56:06", "remaining_time": "1 day, 21:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3497, "total_steps": 9627, "loss": 1.907, "learning_rate": 7.08260557346052e-05, "epoch": 0.36324919497247327, "percentage": 36.32, "elapsed_time": "1 day, 1:56:32", "remaining_time": "1 day, 21:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3498, "total_steps": 9627, "loss": 1.7573, "learning_rate": 7.081122080599721e-05, "epoch": 0.3633530694920536, "percentage": 36.34, "elapsed_time": "1 day, 1:57:00", "remaining_time": "1 day, 21:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3499, "total_steps": 9627, "loss": 1.8399, "learning_rate": 7.079638366115653e-05, "epoch": 0.3634569440116339, "percentage": 36.35, "elapsed_time": "1 day, 1:57:28", "remaining_time": "1 day, 21:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 9627, "loss": 1.5973, "learning_rate": 7.078154430166319e-05, "epoch": 0.3635608185312143, "percentage": 36.36, "elapsed_time": "1 day, 1:57:55", "remaining_time": "1 day, 21:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3501, "total_steps": 9627, "loss": 1.8829, "learning_rate": 7.07667027290975e-05, "epoch": 0.36366469305079463, "percentage": 36.37, "elapsed_time": "1 day, 1:58:22", "remaining_time": "1 day, 21:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3502, "total_steps": 9627, "loss": 1.9544, "learning_rate": 7.075185894503993e-05, "epoch": 0.363768567570375, "percentage": 36.38, "elapsed_time": "1 day, 1:58:51", "remaining_time": "1 day, 21:26:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3503, "total_steps": 9627, "loss": 1.7017, "learning_rate": 7.073701295107128e-05, "epoch": 0.36387244208995534, "percentage": 36.39, "elapsed_time": "1 day, 1:59:17", "remaining_time": "1 day, 21:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3504, "total_steps": 9627, "loss": 1.5732, "learning_rate": 7.072216474877249e-05, "epoch": 0.36397631660953567, "percentage": 36.4, "elapsed_time": "1 day, 1:59:46", "remaining_time": "1 day, 21:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3505, "total_steps": 9627, "loss": 1.5651, "learning_rate": 7.070731433972481e-05, "epoch": 0.36408019112911605, "percentage": 36.41, "elapsed_time": "1 day, 2:00:14", "remaining_time": "1 day, 21:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3506, "total_steps": 9627, "loss": 1.5276, "learning_rate": 7.069246172550967e-05, "epoch": 0.3641840656486964, "percentage": 36.42, "elapsed_time": "1 day, 2:00:41", "remaining_time": "1 day, 21:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3507, "total_steps": 9627, "loss": 1.4874, "learning_rate": 7.067760690770876e-05, "epoch": 0.3642879401682767, "percentage": 36.43, "elapsed_time": "1 day, 2:01:08", "remaining_time": "1 day, 21:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3508, "total_steps": 9627, "loss": 1.6168, "learning_rate": 7.066274988790399e-05, "epoch": 0.3643918146878571, "percentage": 36.44, "elapsed_time": "1 day, 2:01:36", "remaining_time": "1 day, 21:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3509, "total_steps": 9627, "loss": 1.8023, "learning_rate": 7.064789066767755e-05, "epoch": 0.3644956892074374, "percentage": 36.45, "elapsed_time": "1 day, 2:02:03", "remaining_time": "1 day, 21:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3510, "total_steps": 9627, "loss": 1.718, "learning_rate": 7.063302924861182e-05, "epoch": 0.36459956372701774, "percentage": 36.46, "elapsed_time": "1 day, 2:02:31", "remaining_time": "1 day, 21:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3511, "total_steps": 9627, "loss": 1.6952, "learning_rate": 7.06181656322894e-05, "epoch": 0.3647034382465981, "percentage": 36.47, "elapsed_time": "1 day, 2:02:58", "remaining_time": "1 day, 21:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3512, "total_steps": 9627, "loss": 1.5578, "learning_rate": 7.060329982029317e-05, "epoch": 0.36480731276617845, "percentage": 36.48, "elapsed_time": "1 day, 2:03:26", "remaining_time": "1 day, 21:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3513, "total_steps": 9627, "loss": 1.7363, "learning_rate": 7.058843181420624e-05, "epoch": 0.3649111872857588, "percentage": 36.49, "elapsed_time": "1 day, 2:03:53", "remaining_time": "1 day, 21:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3514, "total_steps": 9627, "loss": 1.5816, "learning_rate": 7.05735616156119e-05, "epoch": 0.36501506180533916, "percentage": 36.5, "elapsed_time": "1 day, 2:04:21", "remaining_time": "1 day, 21:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3515, "total_steps": 9627, "loss": 1.8035, "learning_rate": 7.055868922609374e-05, "epoch": 0.3651189363249195, "percentage": 36.51, "elapsed_time": "1 day, 2:04:48", "remaining_time": "1 day, 21:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3516, "total_steps": 9627, "loss": 2.132, "learning_rate": 7.054381464723554e-05, "epoch": 0.36522281084449987, "percentage": 36.52, "elapsed_time": "1 day, 2:05:17", "remaining_time": "1 day, 21:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3517, "total_steps": 9627, "loss": 1.7564, "learning_rate": 7.052893788062131e-05, "epoch": 0.3653266853640802, "percentage": 36.53, "elapsed_time": "1 day, 2:05:44", "remaining_time": "1 day, 21:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3518, "total_steps": 9627, "loss": 1.6212, "learning_rate": 7.051405892783536e-05, "epoch": 0.3654305598836605, "percentage": 36.54, "elapsed_time": "1 day, 2:06:12", "remaining_time": "1 day, 21:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3519, "total_steps": 9627, "loss": 1.6613, "learning_rate": 7.049917779046213e-05, "epoch": 0.3655344344032409, "percentage": 36.55, "elapsed_time": "1 day, 2:06:39", "remaining_time": "1 day, 21:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3520, "total_steps": 9627, "loss": 1.7108, "learning_rate": 7.048429447008636e-05, "epoch": 0.36563830892282123, "percentage": 36.56, "elapsed_time": "1 day, 2:07:07", "remaining_time": "1 day, 21:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3521, "total_steps": 9627, "loss": 1.722, "learning_rate": 7.046940896829302e-05, "epoch": 0.36574218344240156, "percentage": 36.57, "elapsed_time": "1 day, 2:07:35", "remaining_time": "1 day, 21:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3522, "total_steps": 9627, "loss": 1.7693, "learning_rate": 7.04545212866673e-05, "epoch": 0.36584605796198194, "percentage": 36.58, "elapsed_time": "1 day, 2:08:02", "remaining_time": "1 day, 21:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3523, "total_steps": 9627, "loss": 1.8372, "learning_rate": 7.043963142679459e-05, "epoch": 0.36594993248156227, "percentage": 36.59, "elapsed_time": "1 day, 2:08:30", "remaining_time": "1 day, 21:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3524, "total_steps": 9627, "loss": 1.9524, "learning_rate": 7.04247393902606e-05, "epoch": 0.3660538070011426, "percentage": 36.61, "elapsed_time": "1 day, 2:08:58", "remaining_time": "1 day, 21:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3525, "total_steps": 9627, "loss": 1.7887, "learning_rate": 7.040984517865116e-05, "epoch": 0.366157681520723, "percentage": 36.62, "elapsed_time": "1 day, 2:09:26", "remaining_time": "1 day, 21:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3526, "total_steps": 9627, "loss": 1.7503, "learning_rate": 7.039494879355242e-05, "epoch": 0.3662615560403033, "percentage": 36.63, "elapsed_time": "1 day, 2:09:53", "remaining_time": "1 day, 21:16:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3527, "total_steps": 9627, "loss": 1.6939, "learning_rate": 7.038005023655072e-05, "epoch": 0.3663654305598837, "percentage": 36.64, "elapsed_time": "1 day, 2:10:20", "remaining_time": "1 day, 21:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3528, "total_steps": 9627, "loss": 1.7095, "learning_rate": 7.036514950923264e-05, "epoch": 0.366469305079464, "percentage": 36.65, "elapsed_time": "1 day, 2:10:48", "remaining_time": "1 day, 21:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3529, "total_steps": 9627, "loss": 1.6409, "learning_rate": 7.0350246613185e-05, "epoch": 0.36657317959904434, "percentage": 36.66, "elapsed_time": "1 day, 2:11:16", "remaining_time": "1 day, 21:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3530, "total_steps": 9627, "loss": 1.781, "learning_rate": 7.033534154999481e-05, "epoch": 0.3666770541186247, "percentage": 36.67, "elapsed_time": "1 day, 2:11:44", "remaining_time": "1 day, 21:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3531, "total_steps": 9627, "loss": 1.7551, "learning_rate": 7.032043432124939e-05, "epoch": 0.36678092863820505, "percentage": 36.68, "elapsed_time": "1 day, 2:12:12", "remaining_time": "1 day, 21:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3532, "total_steps": 9627, "loss": 1.4163, "learning_rate": 7.030552492853621e-05, "epoch": 0.3668848031577854, "percentage": 36.69, "elapsed_time": "1 day, 2:12:39", "remaining_time": "1 day, 21:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3533, "total_steps": 9627, "loss": 1.8067, "learning_rate": 7.029061337344303e-05, "epoch": 0.36698867767736576, "percentage": 36.7, "elapsed_time": "1 day, 2:13:07", "remaining_time": "1 day, 21:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3534, "total_steps": 9627, "loss": 1.819, "learning_rate": 7.027569965755777e-05, "epoch": 0.3670925521969461, "percentage": 36.71, "elapsed_time": "1 day, 2:13:33", "remaining_time": "1 day, 21:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3535, "total_steps": 9627, "loss": 1.6656, "learning_rate": 7.026078378246868e-05, "epoch": 0.3671964267165264, "percentage": 36.72, "elapsed_time": "1 day, 2:14:02", "remaining_time": "1 day, 21:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3536, "total_steps": 9627, "loss": 1.7219, "learning_rate": 7.024586574976414e-05, "epoch": 0.3673003012361068, "percentage": 36.73, "elapsed_time": "1 day, 2:14:29", "remaining_time": "1 day, 21:12:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3537, "total_steps": 9627, "loss": 1.6209, "learning_rate": 7.023094556103283e-05, "epoch": 0.3674041757556871, "percentage": 36.74, "elapsed_time": "1 day, 2:14:57", "remaining_time": "1 day, 21:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3538, "total_steps": 9627, "loss": 1.7411, "learning_rate": 7.021602321786362e-05, "epoch": 0.36750805027526745, "percentage": 36.75, "elapsed_time": "1 day, 2:15:25", "remaining_time": "1 day, 21:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3539, "total_steps": 9627, "loss": 1.6651, "learning_rate": 7.020109872184563e-05, "epoch": 0.36761192479484783, "percentage": 36.76, "elapsed_time": "1 day, 2:15:53", "remaining_time": "1 day, 21:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3540, "total_steps": 9627, "loss": 1.7601, "learning_rate": 7.018617207456821e-05, "epoch": 0.36771579931442816, "percentage": 36.77, "elapsed_time": "1 day, 2:16:20", "remaining_time": "1 day, 21:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3541, "total_steps": 9627, "loss": 1.6426, "learning_rate": 7.01712432776209e-05, "epoch": 0.36781967383400854, "percentage": 36.78, "elapsed_time": "1 day, 2:16:48", "remaining_time": "1 day, 21:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3542, "total_steps": 9627, "loss": 1.4646, "learning_rate": 7.015631233259354e-05, "epoch": 0.36792354835358887, "percentage": 36.79, "elapsed_time": "1 day, 2:17:16", "remaining_time": "1 day, 21:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3543, "total_steps": 9627, "loss": 1.7999, "learning_rate": 7.014137924107614e-05, "epoch": 0.3680274228731692, "percentage": 36.8, "elapsed_time": "1 day, 2:17:43", "remaining_time": "1 day, 21:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3544, "total_steps": 9627, "loss": 1.8085, "learning_rate": 7.012644400465895e-05, "epoch": 0.3681312973927496, "percentage": 36.81, "elapsed_time": "1 day, 2:18:11", "remaining_time": "1 day, 21:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3545, "total_steps": 9627, "loss": 1.851, "learning_rate": 7.011150662493248e-05, "epoch": 0.3682351719123299, "percentage": 36.82, "elapsed_time": "1 day, 2:18:38", "remaining_time": "1 day, 21:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3546, "total_steps": 9627, "loss": 2.0409, "learning_rate": 7.009656710348742e-05, "epoch": 0.36833904643191023, "percentage": 36.83, "elapsed_time": "1 day, 2:19:06", "remaining_time": "1 day, 21:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3547, "total_steps": 9627, "loss": 1.7269, "learning_rate": 7.008162544191474e-05, "epoch": 0.3684429209514906, "percentage": 36.84, "elapsed_time": "1 day, 2:19:34", "remaining_time": "1 day, 21:07:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3548, "total_steps": 9627, "loss": 1.8257, "learning_rate": 7.006668164180557e-05, "epoch": 0.36854679547107094, "percentage": 36.85, "elapsed_time": "1 day, 2:20:01", "remaining_time": "1 day, 21:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3549, "total_steps": 9627, "loss": 1.8499, "learning_rate": 7.005173570475135e-05, "epoch": 0.36865066999065127, "percentage": 36.87, "elapsed_time": "1 day, 2:20:28", "remaining_time": "1 day, 21:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3550, "total_steps": 9627, "loss": 1.8105, "learning_rate": 7.003678763234367e-05, "epoch": 0.36875454451023165, "percentage": 36.88, "elapsed_time": "1 day, 2:20:57", "remaining_time": "1 day, 21:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3551, "total_steps": 9627, "loss": 1.7043, "learning_rate": 7.002183742617441e-05, "epoch": 0.368858419029812, "percentage": 36.89, "elapsed_time": "1 day, 2:21:24", "remaining_time": "1 day, 21:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3552, "total_steps": 9627, "loss": 1.7842, "learning_rate": 7.000688508783564e-05, "epoch": 0.36896229354939236, "percentage": 36.9, "elapsed_time": "1 day, 2:21:52", "remaining_time": "1 day, 21:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3553, "total_steps": 9627, "loss": 1.5356, "learning_rate": 6.999193061891967e-05, "epoch": 0.3690661680689727, "percentage": 36.91, "elapsed_time": "1 day, 2:22:21", "remaining_time": "1 day, 21:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3554, "total_steps": 9627, "loss": 1.8425, "learning_rate": 6.997697402101904e-05, "epoch": 0.369170042588553, "percentage": 36.92, "elapsed_time": "1 day, 2:22:48", "remaining_time": "1 day, 21:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3555, "total_steps": 9627, "loss": 1.7272, "learning_rate": 6.996201529572648e-05, "epoch": 0.3692739171081334, "percentage": 36.93, "elapsed_time": "1 day, 2:23:16", "remaining_time": "1 day, 21:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3556, "total_steps": 9627, "loss": 1.661, "learning_rate": 6.994705444463501e-05, "epoch": 0.3693777916277137, "percentage": 36.94, "elapsed_time": "1 day, 2:23:44", "remaining_time": "1 day, 21:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3557, "total_steps": 9627, "loss": 1.5626, "learning_rate": 6.993209146933784e-05, "epoch": 0.36948166614729405, "percentage": 36.95, "elapsed_time": "1 day, 2:24:10", "remaining_time": "1 day, 21:03:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3558, "total_steps": 9627, "loss": 1.8327, "learning_rate": 6.991712637142839e-05, "epoch": 0.36958554066687443, "percentage": 36.96, "elapsed_time": "1 day, 2:24:39", "remaining_time": "1 day, 21:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3559, "total_steps": 9627, "loss": 1.6256, "learning_rate": 6.990215915250035e-05, "epoch": 0.36968941518645476, "percentage": 36.97, "elapsed_time": "1 day, 2:25:06", "remaining_time": "1 day, 21:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3560, "total_steps": 9627, "loss": 1.8755, "learning_rate": 6.988718981414761e-05, "epoch": 0.3697932897060351, "percentage": 36.98, "elapsed_time": "1 day, 2:25:34", "remaining_time": "1 day, 21:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3561, "total_steps": 9627, "loss": 1.8136, "learning_rate": 6.987221835796429e-05, "epoch": 0.36989716422561547, "percentage": 36.99, "elapsed_time": "1 day, 2:26:02", "remaining_time": "1 day, 21:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3562, "total_steps": 9627, "loss": 1.66, "learning_rate": 6.98572447855447e-05, "epoch": 0.3700010387451958, "percentage": 37.0, "elapsed_time": "1 day, 2:26:30", "remaining_time": "1 day, 21:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3563, "total_steps": 9627, "loss": 1.6159, "learning_rate": 6.984226909848346e-05, "epoch": 0.3701049132647761, "percentage": 37.01, "elapsed_time": "1 day, 2:26:58", "remaining_time": "1 day, 21:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3564, "total_steps": 9627, "loss": 1.888, "learning_rate": 6.982729129837531e-05, "epoch": 0.3702087877843565, "percentage": 37.02, "elapsed_time": "1 day, 2:27:26", "remaining_time": "1 day, 21:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3565, "total_steps": 9627, "loss": 1.7992, "learning_rate": 6.981231138681531e-05, "epoch": 0.37031266230393683, "percentage": 37.03, "elapsed_time": "1 day, 2:27:54", "remaining_time": "1 day, 21:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3566, "total_steps": 9627, "loss": 1.7709, "learning_rate": 6.979732936539868e-05, "epoch": 0.3704165368235172, "percentage": 37.04, "elapsed_time": "1 day, 2:28:21", "remaining_time": "1 day, 20:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3567, "total_steps": 9627, "loss": 1.765, "learning_rate": 6.97823452357209e-05, "epoch": 0.37052041134309754, "percentage": 37.05, "elapsed_time": "1 day, 2:28:50", "remaining_time": "1 day, 20:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3568, "total_steps": 9627, "loss": 1.7137, "learning_rate": 6.976735899937767e-05, "epoch": 0.37062428586267787, "percentage": 37.06, "elapsed_time": "1 day, 2:29:17", "remaining_time": "1 day, 20:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3569, "total_steps": 9627, "loss": 1.7768, "learning_rate": 6.97523706579649e-05, "epoch": 0.37072816038225825, "percentage": 37.07, "elapsed_time": "1 day, 2:29:45", "remaining_time": "1 day, 20:58:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3570, "total_steps": 9627, "loss": 1.4456, "learning_rate": 6.973738021307871e-05, "epoch": 0.3708320349018386, "percentage": 37.08, "elapsed_time": "1 day, 2:30:12", "remaining_time": "1 day, 20:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3571, "total_steps": 9627, "loss": 1.6854, "learning_rate": 6.97223876663155e-05, "epoch": 0.3709359094214189, "percentage": 37.09, "elapsed_time": "1 day, 2:30:41", "remaining_time": "1 day, 20:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3572, "total_steps": 9627, "loss": 1.7468, "learning_rate": 6.970739301927183e-05, "epoch": 0.3710397839409993, "percentage": 37.1, "elapsed_time": "1 day, 2:31:08", "remaining_time": "1 day, 20:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3573, "total_steps": 9627, "loss": 1.6043, "learning_rate": 6.969239627354453e-05, "epoch": 0.3711436584605796, "percentage": 37.11, "elapsed_time": "1 day, 2:31:37", "remaining_time": "1 day, 20:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3574, "total_steps": 9627, "loss": 1.7144, "learning_rate": 6.967739743073065e-05, "epoch": 0.37124753298015994, "percentage": 37.12, "elapsed_time": "1 day, 2:32:03", "remaining_time": "1 day, 20:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3575, "total_steps": 9627, "loss": 1.8287, "learning_rate": 6.966239649242743e-05, "epoch": 0.3713514074997403, "percentage": 37.14, "elapsed_time": "1 day, 2:32:33", "remaining_time": "1 day, 20:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3576, "total_steps": 9627, "loss": 1.8377, "learning_rate": 6.964739346023235e-05, "epoch": 0.37145528201932065, "percentage": 37.15, "elapsed_time": "1 day, 2:33:01", "remaining_time": "1 day, 20:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3577, "total_steps": 9627, "loss": 1.7471, "learning_rate": 6.963238833574312e-05, "epoch": 0.371559156538901, "percentage": 37.16, "elapsed_time": "1 day, 2:33:29", "remaining_time": "1 day, 20:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3578, "total_steps": 9627, "loss": 1.4237, "learning_rate": 6.961738112055767e-05, "epoch": 0.37166303105848136, "percentage": 37.17, "elapsed_time": "1 day, 2:33:56", "remaining_time": "1 day, 20:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3579, "total_steps": 9627, "loss": 1.7035, "learning_rate": 6.960237181627416e-05, "epoch": 0.3717669055780617, "percentage": 37.18, "elapsed_time": "1 day, 2:34:25", "remaining_time": "1 day, 20:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3580, "total_steps": 9627, "loss": 1.8277, "learning_rate": 6.958736042449095e-05, "epoch": 0.3718707800976421, "percentage": 37.19, "elapsed_time": "1 day, 2:34:53", "remaining_time": "1 day, 20:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3581, "total_steps": 9627, "loss": 1.7919, "learning_rate": 6.957234694680663e-05, "epoch": 0.3719746546172224, "percentage": 37.2, "elapsed_time": "1 day, 2:35:21", "remaining_time": "1 day, 20:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3582, "total_steps": 9627, "loss": 1.795, "learning_rate": 6.955733138482006e-05, "epoch": 0.3720785291368027, "percentage": 37.21, "elapsed_time": "1 day, 2:35:49", "remaining_time": "1 day, 20:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3583, "total_steps": 9627, "loss": 1.7831, "learning_rate": 6.954231374013022e-05, "epoch": 0.3721824036563831, "percentage": 37.22, "elapsed_time": "1 day, 2:36:17", "remaining_time": "1 day, 20:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3584, "total_steps": 9627, "loss": 1.4946, "learning_rate": 6.952729401433642e-05, "epoch": 0.37228627817596344, "percentage": 37.23, "elapsed_time": "1 day, 2:36:45", "remaining_time": "1 day, 20:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3585, "total_steps": 9627, "loss": 1.7404, "learning_rate": 6.951227220903813e-05, "epoch": 0.37239015269554376, "percentage": 37.24, "elapsed_time": "1 day, 2:37:14", "remaining_time": "1 day, 20:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3586, "total_steps": 9627, "loss": 1.6906, "learning_rate": 6.949724832583504e-05, "epoch": 0.37249402721512415, "percentage": 37.25, "elapsed_time": "1 day, 2:37:40", "remaining_time": "1 day, 20:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3587, "total_steps": 9627, "loss": 1.7632, "learning_rate": 6.948222236632709e-05, "epoch": 0.3725979017347045, "percentage": 37.26, "elapsed_time": "1 day, 2:38:09", "remaining_time": "1 day, 20:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3588, "total_steps": 9627, "loss": 1.6058, "learning_rate": 6.946719433211442e-05, "epoch": 0.3727017762542848, "percentage": 37.27, "elapsed_time": "1 day, 2:38:37", "remaining_time": "1 day, 20:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3589, "total_steps": 9627, "loss": 1.7819, "learning_rate": 6.945216422479741e-05, "epoch": 0.3728056507738652, "percentage": 37.28, "elapsed_time": "1 day, 2:39:05", "remaining_time": "1 day, 20:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3590, "total_steps": 9627, "loss": 1.8151, "learning_rate": 6.943713204597664e-05, "epoch": 0.3729095252934455, "percentage": 37.29, "elapsed_time": "1 day, 2:39:34", "remaining_time": "1 day, 20:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3591, "total_steps": 9627, "loss": 1.775, "learning_rate": 6.942209779725292e-05, "epoch": 0.3730133998130259, "percentage": 37.3, "elapsed_time": "1 day, 2:40:01", "remaining_time": "1 day, 20:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3592, "total_steps": 9627, "loss": 1.6656, "learning_rate": 6.94070614802273e-05, "epoch": 0.3731172743326062, "percentage": 37.31, "elapsed_time": "1 day, 2:40:30", "remaining_time": "1 day, 20:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3593, "total_steps": 9627, "loss": 1.7774, "learning_rate": 6.9392023096501e-05, "epoch": 0.37322114885218655, "percentage": 37.32, "elapsed_time": "1 day, 2:40:57", "remaining_time": "1 day, 20:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3594, "total_steps": 9627, "loss": 1.8816, "learning_rate": 6.937698264767549e-05, "epoch": 0.37332502337176693, "percentage": 37.33, "elapsed_time": "1 day, 2:41:26", "remaining_time": "1 day, 20:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3595, "total_steps": 9627, "loss": 1.7163, "learning_rate": 6.93619401353525e-05, "epoch": 0.37342889789134726, "percentage": 37.34, "elapsed_time": "1 day, 2:41:54", "remaining_time": "1 day, 20:47:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3596, "total_steps": 9627, "loss": 1.7318, "learning_rate": 6.934689556113391e-05, "epoch": 0.3735327724109276, "percentage": 37.35, "elapsed_time": "1 day, 2:42:21", "remaining_time": "1 day, 20:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3597, "total_steps": 9627, "loss": 1.8164, "learning_rate": 6.933184892662185e-05, "epoch": 0.37363664693050797, "percentage": 37.36, "elapsed_time": "1 day, 2:42:51", "remaining_time": "1 day, 20:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3598, "total_steps": 9627, "loss": 1.7503, "learning_rate": 6.931680023341867e-05, "epoch": 0.3737405214500883, "percentage": 37.37, "elapsed_time": "1 day, 2:43:18", "remaining_time": "1 day, 20:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3599, "total_steps": 9627, "loss": 1.6838, "learning_rate": 6.930174948312696e-05, "epoch": 0.3738443959696686, "percentage": 37.38, "elapsed_time": "1 day, 2:43:47", "remaining_time": "1 day, 20:46:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3600, "total_steps": 9627, "loss": 1.743, "learning_rate": 6.928669667734945e-05, "epoch": 0.373948270489249, "percentage": 37.39, "elapsed_time": "1 day, 2:44:15", "remaining_time": "1 day, 20:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3601, "total_steps": 9627, "loss": 1.868, "learning_rate": 6.927164181768921e-05, "epoch": 0.37405214500882933, "percentage": 37.41, "elapsed_time": "1 day, 2:44:42", "remaining_time": "1 day, 20:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3602, "total_steps": 9627, "loss": 1.8172, "learning_rate": 6.925658490574945e-05, "epoch": 0.37415601952840966, "percentage": 37.42, "elapsed_time": "1 day, 2:45:11", "remaining_time": "1 day, 20:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3603, "total_steps": 9627, "loss": 1.671, "learning_rate": 6.92415259431336e-05, "epoch": 0.37425989404799004, "percentage": 37.43, "elapsed_time": "1 day, 2:45:39", "remaining_time": "1 day, 20:44:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3604, "total_steps": 9627, "loss": 1.6493, "learning_rate": 6.922646493144532e-05, "epoch": 0.37436376856757037, "percentage": 37.44, "elapsed_time": "1 day, 2:46:07", "remaining_time": "1 day, 20:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3605, "total_steps": 9627, "loss": 1.6539, "learning_rate": 6.92114018722885e-05, "epoch": 0.37446764308715075, "percentage": 37.45, "elapsed_time": "1 day, 2:46:36", "remaining_time": "1 day, 20:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3606, "total_steps": 9627, "loss": 1.5816, "learning_rate": 6.919633676726722e-05, "epoch": 0.3745715176067311, "percentage": 37.46, "elapsed_time": "1 day, 2:47:04", "remaining_time": "1 day, 20:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3607, "total_steps": 9627, "loss": 1.7291, "learning_rate": 6.918126961798583e-05, "epoch": 0.3746753921263114, "percentage": 37.47, "elapsed_time": "1 day, 2:47:32", "remaining_time": "1 day, 20:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3608, "total_steps": 9627, "loss": 1.7515, "learning_rate": 6.916620042604883e-05, "epoch": 0.3747792666458918, "percentage": 37.48, "elapsed_time": "1 day, 2:48:00", "remaining_time": "1 day, 20:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3609, "total_steps": 9627, "loss": 1.6408, "learning_rate": 6.915112919306101e-05, "epoch": 0.3748831411654721, "percentage": 37.49, "elapsed_time": "1 day, 2:48:28", "remaining_time": "1 day, 20:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3610, "total_steps": 9627, "loss": 1.7996, "learning_rate": 6.913605592062731e-05, "epoch": 0.37498701568505244, "percentage": 37.5, "elapsed_time": "1 day, 2:48:57", "remaining_time": "1 day, 20:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3611, "total_steps": 9627, "loss": 1.6188, "learning_rate": 6.91209806103529e-05, "epoch": 0.3750908902046328, "percentage": 37.51, "elapsed_time": "1 day, 2:49:25", "remaining_time": "1 day, 20:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3612, "total_steps": 9627, "loss": 1.8074, "learning_rate": 6.910590326384323e-05, "epoch": 0.37519476472421315, "percentage": 37.52, "elapsed_time": "1 day, 2:49:54", "remaining_time": "1 day, 20:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3613, "total_steps": 9627, "loss": 1.6607, "learning_rate": 6.909082388270389e-05, "epoch": 0.3752986392437935, "percentage": 37.53, "elapsed_time": "1 day, 2:50:22", "remaining_time": "1 day, 20:40:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3614, "total_steps": 9627, "loss": 1.7711, "learning_rate": 6.90757424685407e-05, "epoch": 0.37540251376337386, "percentage": 37.54, "elapsed_time": "1 day, 2:50:50", "remaining_time": "1 day, 20:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3615, "total_steps": 9627, "loss": 1.8252, "learning_rate": 6.906065902295975e-05, "epoch": 0.3755063882829542, "percentage": 37.55, "elapsed_time": "1 day, 2:51:19", "remaining_time": "1 day, 20:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3616, "total_steps": 9627, "loss": 1.7832, "learning_rate": 6.904557354756728e-05, "epoch": 0.3756102628025345, "percentage": 37.56, "elapsed_time": "1 day, 2:51:46", "remaining_time": "1 day, 20:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3617, "total_steps": 9627, "loss": 1.6776, "learning_rate": 6.903048604396981e-05, "epoch": 0.3757141373221149, "percentage": 37.57, "elapsed_time": "1 day, 2:52:14", "remaining_time": "1 day, 20:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3618, "total_steps": 9627, "loss": 1.7664, "learning_rate": 6.9015396513774e-05, "epoch": 0.3758180118416952, "percentage": 37.58, "elapsed_time": "1 day, 2:52:44", "remaining_time": "1 day, 20:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3619, "total_steps": 9627, "loss": 1.5807, "learning_rate": 6.900030495858681e-05, "epoch": 0.3759218863612756, "percentage": 37.59, "elapsed_time": "1 day, 2:53:11", "remaining_time": "1 day, 20:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3620, "total_steps": 9627, "loss": 1.8023, "learning_rate": 6.898521138001533e-05, "epoch": 0.37602576088085593, "percentage": 37.6, "elapsed_time": "1 day, 2:53:40", "remaining_time": "1 day, 20:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3621, "total_steps": 9627, "loss": 1.7831, "learning_rate": 6.897011577966693e-05, "epoch": 0.37612963540043626, "percentage": 37.61, "elapsed_time": "1 day, 2:54:08", "remaining_time": "1 day, 20:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3622, "total_steps": 9627, "loss": 1.7742, "learning_rate": 6.895501815914917e-05, "epoch": 0.37623350992001664, "percentage": 37.62, "elapsed_time": "1 day, 2:54:36", "remaining_time": "1 day, 20:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3623, "total_steps": 9627, "loss": 1.6418, "learning_rate": 6.893991852006983e-05, "epoch": 0.37633738443959697, "percentage": 37.63, "elapsed_time": "1 day, 2:55:05", "remaining_time": "1 day, 20:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3624, "total_steps": 9627, "loss": 1.6307, "learning_rate": 6.892481686403694e-05, "epoch": 0.3764412589591773, "percentage": 37.64, "elapsed_time": "1 day, 2:55:33", "remaining_time": "1 day, 20:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3625, "total_steps": 9627, "loss": 1.6734, "learning_rate": 6.890971319265863e-05, "epoch": 0.3765451334787577, "percentage": 37.65, "elapsed_time": "1 day, 2:56:01", "remaining_time": "1 day, 20:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3626, "total_steps": 9627, "loss": 1.6584, "learning_rate": 6.889460750754337e-05, "epoch": 0.376649007998338, "percentage": 37.66, "elapsed_time": "1 day, 2:56:30", "remaining_time": "1 day, 20:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3627, "total_steps": 9627, "loss": 1.9331, "learning_rate": 6.887949981029981e-05, "epoch": 0.37675288251791833, "percentage": 37.68, "elapsed_time": "1 day, 2:56:58", "remaining_time": "1 day, 20:34:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3628, "total_steps": 9627, "loss": 1.8305, "learning_rate": 6.886439010253678e-05, "epoch": 0.3768567570374987, "percentage": 37.69, "elapsed_time": "1 day, 2:57:27", "remaining_time": "1 day, 20:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3629, "total_steps": 9627, "loss": 1.675, "learning_rate": 6.884927838586336e-05, "epoch": 0.37696063155707904, "percentage": 37.7, "elapsed_time": "1 day, 2:57:54", "remaining_time": "1 day, 20:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3630, "total_steps": 9627, "loss": 1.6902, "learning_rate": 6.88341646618888e-05, "epoch": 0.3770645060766594, "percentage": 37.71, "elapsed_time": "1 day, 2:58:24", "remaining_time": "1 day, 20:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3631, "total_steps": 9627, "loss": 1.593, "learning_rate": 6.881904893222265e-05, "epoch": 0.37716838059623975, "percentage": 37.72, "elapsed_time": "1 day, 2:58:51", "remaining_time": "1 day, 20:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3632, "total_steps": 9627, "loss": 1.5337, "learning_rate": 6.880393119847456e-05, "epoch": 0.3772722551158201, "percentage": 37.73, "elapsed_time": "1 day, 2:59:20", "remaining_time": "1 day, 20:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3633, "total_steps": 9627, "loss": 1.7957, "learning_rate": 6.878881146225447e-05, "epoch": 0.37737612963540046, "percentage": 37.74, "elapsed_time": "1 day, 2:59:49", "remaining_time": "1 day, 20:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3634, "total_steps": 9627, "loss": 1.783, "learning_rate": 6.877368972517252e-05, "epoch": 0.3774800041549808, "percentage": 37.75, "elapsed_time": "1 day, 3:00:16", "remaining_time": "1 day, 20:32:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3635, "total_steps": 9627, "loss": 1.756, "learning_rate": 6.875856598883907e-05, "epoch": 0.3775838786745611, "percentage": 37.76, "elapsed_time": "1 day, 3:00:45", "remaining_time": "1 day, 20:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3636, "total_steps": 9627, "loss": 1.7357, "learning_rate": 6.874344025486464e-05, "epoch": 0.3776877531941415, "percentage": 37.77, "elapsed_time": "1 day, 3:01:13", "remaining_time": "1 day, 20:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3637, "total_steps": 9627, "loss": 1.9177, "learning_rate": 6.872831252486005e-05, "epoch": 0.3777916277137218, "percentage": 37.78, "elapsed_time": "1 day, 3:01:42", "remaining_time": "1 day, 20:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3638, "total_steps": 9627, "loss": 1.6861, "learning_rate": 6.871318280043626e-05, "epoch": 0.37789550223330215, "percentage": 37.79, "elapsed_time": "1 day, 3:02:11", "remaining_time": "1 day, 20:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3639, "total_steps": 9627, "loss": 1.7634, "learning_rate": 6.869805108320446e-05, "epoch": 0.37799937675288253, "percentage": 37.8, "elapsed_time": "1 day, 3:02:39", "remaining_time": "1 day, 20:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3640, "total_steps": 9627, "loss": 1.616, "learning_rate": 6.868291737477608e-05, "epoch": 0.37810325127246286, "percentage": 37.81, "elapsed_time": "1 day, 3:03:07", "remaining_time": "1 day, 20:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3641, "total_steps": 9627, "loss": 1.6158, "learning_rate": 6.866778167676272e-05, "epoch": 0.3782071257920432, "percentage": 37.82, "elapsed_time": "1 day, 3:03:35", "remaining_time": "1 day, 20:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3642, "total_steps": 9627, "loss": 1.657, "learning_rate": 6.865264399077623e-05, "epoch": 0.37831100031162357, "percentage": 37.83, "elapsed_time": "1 day, 3:04:04", "remaining_time": "1 day, 20:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3643, "total_steps": 9627, "loss": 1.536, "learning_rate": 6.863750431842865e-05, "epoch": 0.3784148748312039, "percentage": 37.84, "elapsed_time": "1 day, 3:04:33", "remaining_time": "1 day, 20:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3644, "total_steps": 9627, "loss": 1.8389, "learning_rate": 6.862236266133225e-05, "epoch": 0.3785187493507843, "percentage": 37.85, "elapsed_time": "1 day, 3:05:00", "remaining_time": "1 day, 20:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3645, "total_steps": 9627, "loss": 1.6854, "learning_rate": 6.860721902109948e-05, "epoch": 0.3786226238703646, "percentage": 37.86, "elapsed_time": "1 day, 3:05:29", "remaining_time": "1 day, 20:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3646, "total_steps": 9627, "loss": 1.8258, "learning_rate": 6.859207339934302e-05, "epoch": 0.37872649838994493, "percentage": 37.87, "elapsed_time": "1 day, 3:05:57", "remaining_time": "1 day, 20:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3647, "total_steps": 9627, "loss": 1.7949, "learning_rate": 6.857692579767576e-05, "epoch": 0.3788303729095253, "percentage": 37.88, "elapsed_time": "1 day, 3:06:26", "remaining_time": "1 day, 20:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3648, "total_steps": 9627, "loss": 1.6723, "learning_rate": 6.856177621771083e-05, "epoch": 0.37893424742910564, "percentage": 37.89, "elapsed_time": "1 day, 3:06:53", "remaining_time": "1 day, 20:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3649, "total_steps": 9627, "loss": 1.7018, "learning_rate": 6.854662466106151e-05, "epoch": 0.37903812194868597, "percentage": 37.9, "elapsed_time": "1 day, 3:07:22", "remaining_time": "1 day, 20:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3650, "total_steps": 9627, "loss": 1.7914, "learning_rate": 6.853147112934132e-05, "epoch": 0.37914199646826635, "percentage": 37.91, "elapsed_time": "1 day, 3:07:51", "remaining_time": "1 day, 20:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3651, "total_steps": 9627, "loss": 1.7757, "learning_rate": 6.851631562416402e-05, "epoch": 0.3792458709878467, "percentage": 37.92, "elapsed_time": "1 day, 3:08:19", "remaining_time": "1 day, 20:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3652, "total_steps": 9627, "loss": 1.5974, "learning_rate": 6.850115814714355e-05, "epoch": 0.379349745507427, "percentage": 37.93, "elapsed_time": "1 day, 3:08:47", "remaining_time": "1 day, 20:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3653, "total_steps": 9627, "loss": 1.8257, "learning_rate": 6.848599869989403e-05, "epoch": 0.3794536200270074, "percentage": 37.95, "elapsed_time": "1 day, 3:09:16", "remaining_time": "1 day, 20:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3654, "total_steps": 9627, "loss": 1.5854, "learning_rate": 6.847083728402986e-05, "epoch": 0.3795574945465877, "percentage": 37.96, "elapsed_time": "1 day, 3:09:43", "remaining_time": "1 day, 20:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3655, "total_steps": 9627, "loss": 1.8799, "learning_rate": 6.845567390116558e-05, "epoch": 0.37966136906616804, "percentage": 37.97, "elapsed_time": "1 day, 3:10:12", "remaining_time": "1 day, 20:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3656, "total_steps": 9627, "loss": 1.9001, "learning_rate": 6.8440508552916e-05, "epoch": 0.3797652435857484, "percentage": 37.98, "elapsed_time": "1 day, 3:10:40", "remaining_time": "1 day, 20:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3657, "total_steps": 9627, "loss": 1.5654, "learning_rate": 6.84253412408961e-05, "epoch": 0.37986911810532875, "percentage": 37.99, "elapsed_time": "1 day, 3:11:09", "remaining_time": "1 day, 20:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3658, "total_steps": 9627, "loss": 1.5015, "learning_rate": 6.841017196672109e-05, "epoch": 0.37997299262490913, "percentage": 38.0, "elapsed_time": "1 day, 3:11:37", "remaining_time": "1 day, 20:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3659, "total_steps": 9627, "loss": 1.7024, "learning_rate": 6.839500073200636e-05, "epoch": 0.38007686714448946, "percentage": 38.01, "elapsed_time": "1 day, 3:12:07", "remaining_time": "1 day, 20:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3660, "total_steps": 9627, "loss": 1.7241, "learning_rate": 6.837982753836755e-05, "epoch": 0.3801807416640698, "percentage": 38.02, "elapsed_time": "1 day, 3:12:33", "remaining_time": "1 day, 20:21:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3661, "total_steps": 9627, "loss": 1.6898, "learning_rate": 6.836465238742045e-05, "epoch": 0.38028461618365017, "percentage": 38.03, "elapsed_time": "1 day, 3:13:03", "remaining_time": "1 day, 20:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3662, "total_steps": 9627, "loss": 1.8323, "learning_rate": 6.834947528078114e-05, "epoch": 0.3803884907032305, "percentage": 38.04, "elapsed_time": "1 day, 3:13:31", "remaining_time": "1 day, 20:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3663, "total_steps": 9627, "loss": 1.7061, "learning_rate": 6.833429622006584e-05, "epoch": 0.3804923652228108, "percentage": 38.05, "elapsed_time": "1 day, 3:14:01", "remaining_time": "1 day, 20:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3664, "total_steps": 9627, "loss": 1.8332, "learning_rate": 6.8319115206891e-05, "epoch": 0.3805962397423912, "percentage": 38.06, "elapsed_time": "1 day, 3:14:29", "remaining_time": "1 day, 20:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3665, "total_steps": 9627, "loss": 1.6706, "learning_rate": 6.83039322428733e-05, "epoch": 0.38070011426197153, "percentage": 38.07, "elapsed_time": "1 day, 3:14:57", "remaining_time": "1 day, 20:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3666, "total_steps": 9627, "loss": 1.4825, "learning_rate": 6.828874732962958e-05, "epoch": 0.38080398878155186, "percentage": 38.08, "elapsed_time": "1 day, 3:15:25", "remaining_time": "1 day, 20:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3667, "total_steps": 9627, "loss": 1.6615, "learning_rate": 6.827356046877693e-05, "epoch": 0.38090786330113224, "percentage": 38.09, "elapsed_time": "1 day, 3:15:54", "remaining_time": "1 day, 20:18:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3668, "total_steps": 9627, "loss": 1.5442, "learning_rate": 6.825837166193263e-05, "epoch": 0.38101173782071257, "percentage": 38.1, "elapsed_time": "1 day, 3:16:23", "remaining_time": "1 day, 20:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3669, "total_steps": 9627, "loss": 1.6057, "learning_rate": 6.824318091071416e-05, "epoch": 0.38111561234029295, "percentage": 38.11, "elapsed_time": "1 day, 3:16:51", "remaining_time": "1 day, 20:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3670, "total_steps": 9627, "loss": 1.7737, "learning_rate": 6.822798821673923e-05, "epoch": 0.3812194868598733, "percentage": 38.12, "elapsed_time": "1 day, 3:17:19", "remaining_time": "1 day, 20:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3671, "total_steps": 9627, "loss": 1.506, "learning_rate": 6.821279358162575e-05, "epoch": 0.3813233613794536, "percentage": 38.13, "elapsed_time": "1 day, 3:17:48", "remaining_time": "1 day, 20:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3672, "total_steps": 9627, "loss": 1.7086, "learning_rate": 6.819759700699181e-05, "epoch": 0.381427235899034, "percentage": 38.14, "elapsed_time": "1 day, 3:18:17", "remaining_time": "1 day, 20:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3673, "total_steps": 9627, "loss": 1.8619, "learning_rate": 6.818239849445574e-05, "epoch": 0.3815311104186143, "percentage": 38.15, "elapsed_time": "1 day, 3:18:45", "remaining_time": "1 day, 20:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3674, "total_steps": 9627, "loss": 1.7338, "learning_rate": 6.816719804563606e-05, "epoch": 0.38163498493819464, "percentage": 38.16, "elapsed_time": "1 day, 3:19:14", "remaining_time": "1 day, 20:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3675, "total_steps": 9627, "loss": 1.5691, "learning_rate": 6.815199566215149e-05, "epoch": 0.381738859457775, "percentage": 38.17, "elapsed_time": "1 day, 3:19:43", "remaining_time": "1 day, 20:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3676, "total_steps": 9627, "loss": 1.8749, "learning_rate": 6.813679134562098e-05, "epoch": 0.38184273397735535, "percentage": 38.18, "elapsed_time": "1 day, 3:20:11", "remaining_time": "1 day, 20:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3677, "total_steps": 9627, "loss": 1.6885, "learning_rate": 6.812158509766366e-05, "epoch": 0.3819466084969357, "percentage": 38.19, "elapsed_time": "1 day, 3:20:39", "remaining_time": "1 day, 20:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3678, "total_steps": 9627, "loss": 1.7689, "learning_rate": 6.810637691989887e-05, "epoch": 0.38205048301651606, "percentage": 38.21, "elapsed_time": "1 day, 3:21:08", "remaining_time": "1 day, 20:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3679, "total_steps": 9627, "loss": 1.6354, "learning_rate": 6.809116681394618e-05, "epoch": 0.3821543575360964, "percentage": 38.22, "elapsed_time": "1 day, 3:21:37", "remaining_time": "1 day, 20:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3680, "total_steps": 9627, "loss": 1.6749, "learning_rate": 6.807595478142536e-05, "epoch": 0.3822582320556767, "percentage": 38.23, "elapsed_time": "1 day, 3:22:06", "remaining_time": "1 day, 20:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3681, "total_steps": 9627, "loss": 1.7558, "learning_rate": 6.806074082395633e-05, "epoch": 0.3823621065752571, "percentage": 38.24, "elapsed_time": "1 day, 3:22:34", "remaining_time": "1 day, 20:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3682, "total_steps": 9627, "loss": 1.6639, "learning_rate": 6.80455249431593e-05, "epoch": 0.3824659810948374, "percentage": 38.25, "elapsed_time": "1 day, 3:23:03", "remaining_time": "1 day, 20:12:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3683, "total_steps": 9627, "loss": 1.6497, "learning_rate": 6.803030714065461e-05, "epoch": 0.3825698556144178, "percentage": 38.26, "elapsed_time": "1 day, 3:23:30", "remaining_time": "1 day, 20:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3684, "total_steps": 9627, "loss": 1.86, "learning_rate": 6.801508741806285e-05, "epoch": 0.38267373013399814, "percentage": 38.27, "elapsed_time": "1 day, 3:24:00", "remaining_time": "1 day, 20:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3685, "total_steps": 9627, "loss": 1.7865, "learning_rate": 6.799986577700481e-05, "epoch": 0.38277760465357846, "percentage": 38.28, "elapsed_time": "1 day, 3:24:28", "remaining_time": "1 day, 20:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3686, "total_steps": 9627, "loss": 1.7091, "learning_rate": 6.798464221910147e-05, "epoch": 0.38288147917315885, "percentage": 38.29, "elapsed_time": "1 day, 3:24:57", "remaining_time": "1 day, 20:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3687, "total_steps": 9627, "loss": 1.7886, "learning_rate": 6.796941674597402e-05, "epoch": 0.38298535369273917, "percentage": 38.3, "elapsed_time": "1 day, 3:25:25", "remaining_time": "1 day, 20:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3688, "total_steps": 9627, "loss": 1.8681, "learning_rate": 6.795418935924384e-05, "epoch": 0.3830892282123195, "percentage": 38.31, "elapsed_time": "1 day, 3:25:55", "remaining_time": "1 day, 20:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3689, "total_steps": 9627, "loss": 1.8301, "learning_rate": 6.793896006053255e-05, "epoch": 0.3831931027318999, "percentage": 38.32, "elapsed_time": "1 day, 3:26:22", "remaining_time": "1 day, 20:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3690, "total_steps": 9627, "loss": 1.6537, "learning_rate": 6.792372885146195e-05, "epoch": 0.3832969772514802, "percentage": 38.33, "elapsed_time": "1 day, 3:26:50", "remaining_time": "1 day, 20:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3691, "total_steps": 9627, "loss": 1.5565, "learning_rate": 6.790849573365404e-05, "epoch": 0.38340085177106054, "percentage": 38.34, "elapsed_time": "1 day, 3:27:20", "remaining_time": "1 day, 20:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3692, "total_steps": 9627, "loss": 1.8307, "learning_rate": 6.7893260708731e-05, "epoch": 0.3835047262906409, "percentage": 38.35, "elapsed_time": "1 day, 3:27:48", "remaining_time": "1 day, 20:08:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3693, "total_steps": 9627, "loss": 1.6495, "learning_rate": 6.78780237783153e-05, "epoch": 0.38360860081022125, "percentage": 38.36, "elapsed_time": "1 day, 3:28:17", "remaining_time": "1 day, 20:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3694, "total_steps": 9627, "loss": 1.8522, "learning_rate": 6.786278494402952e-05, "epoch": 0.38371247532980157, "percentage": 38.37, "elapsed_time": "1 day, 3:28:45", "remaining_time": "1 day, 20:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3695, "total_steps": 9627, "loss": 1.7361, "learning_rate": 6.784754420749645e-05, "epoch": 0.38381634984938195, "percentage": 38.38, "elapsed_time": "1 day, 3:29:13", "remaining_time": "1 day, 20:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3696, "total_steps": 9627, "loss": 1.7802, "learning_rate": 6.783230157033915e-05, "epoch": 0.3839202243689623, "percentage": 38.39, "elapsed_time": "1 day, 3:29:43", "remaining_time": "1 day, 20:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3697, "total_steps": 9627, "loss": 1.7411, "learning_rate": 6.781705703418084e-05, "epoch": 0.38402409888854266, "percentage": 38.4, "elapsed_time": "1 day, 3:30:11", "remaining_time": "1 day, 20:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3698, "total_steps": 9627, "loss": 1.4685, "learning_rate": 6.780181060064493e-05, "epoch": 0.384127973408123, "percentage": 38.41, "elapsed_time": "1 day, 3:30:40", "remaining_time": "1 day, 20:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3699, "total_steps": 9627, "loss": 1.4894, "learning_rate": 6.778656227135505e-05, "epoch": 0.3842318479277033, "percentage": 38.42, "elapsed_time": "1 day, 3:31:08", "remaining_time": "1 day, 20:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3700, "total_steps": 9627, "loss": 1.5972, "learning_rate": 6.777131204793502e-05, "epoch": 0.3843357224472837, "percentage": 38.43, "elapsed_time": "1 day, 3:31:37", "remaining_time": "1 day, 20:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3701, "total_steps": 9627, "loss": 1.474, "learning_rate": 6.775605993200889e-05, "epoch": 0.38443959696686403, "percentage": 38.44, "elapsed_time": "1 day, 3:32:06", "remaining_time": "1 day, 20:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3702, "total_steps": 9627, "loss": 1.8876, "learning_rate": 6.774080592520088e-05, "epoch": 0.38454347148644435, "percentage": 38.45, "elapsed_time": "1 day, 3:32:34", "remaining_time": "1 day, 20:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3703, "total_steps": 9627, "loss": 1.8743, "learning_rate": 6.77255500291354e-05, "epoch": 0.38464734600602474, "percentage": 38.46, "elapsed_time": "1 day, 3:33:03", "remaining_time": "1 day, 20:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3704, "total_steps": 9627, "loss": 1.9229, "learning_rate": 6.771029224543713e-05, "epoch": 0.38475122052560506, "percentage": 38.48, "elapsed_time": "1 day, 3:33:31", "remaining_time": "1 day, 20:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3705, "total_steps": 9627, "loss": 1.5463, "learning_rate": 6.769503257573089e-05, "epoch": 0.3848550950451854, "percentage": 38.49, "elapsed_time": "1 day, 3:34:00", "remaining_time": "1 day, 20:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3706, "total_steps": 9627, "loss": 1.724, "learning_rate": 6.767977102164167e-05, "epoch": 0.3849589695647658, "percentage": 38.5, "elapsed_time": "1 day, 3:34:29", "remaining_time": "1 day, 20:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3707, "total_steps": 9627, "loss": 1.965, "learning_rate": 6.766450758479479e-05, "epoch": 0.3850628440843461, "percentage": 38.51, "elapsed_time": "1 day, 3:34:58", "remaining_time": "1 day, 20:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3708, "total_steps": 9627, "loss": 1.6066, "learning_rate": 6.76492422668156e-05, "epoch": 0.3851667186039265, "percentage": 38.52, "elapsed_time": "1 day, 3:35:27", "remaining_time": "1 day, 20:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3709, "total_steps": 9627, "loss": 1.8164, "learning_rate": 6.76339750693298e-05, "epoch": 0.3852705931235068, "percentage": 38.53, "elapsed_time": "1 day, 3:35:55", "remaining_time": "1 day, 20:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3710, "total_steps": 9627, "loss": 1.6843, "learning_rate": 6.76187059939632e-05, "epoch": 0.38537446764308714, "percentage": 38.54, "elapsed_time": "1 day, 3:36:24", "remaining_time": "1 day, 20:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3711, "total_steps": 9627, "loss": 1.5059, "learning_rate": 6.760343504234184e-05, "epoch": 0.3854783421626675, "percentage": 38.55, "elapsed_time": "1 day, 3:36:52", "remaining_time": "1 day, 20:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3712, "total_steps": 9627, "loss": 1.8893, "learning_rate": 6.758816221609196e-05, "epoch": 0.38558221668224785, "percentage": 38.56, "elapsed_time": "1 day, 3:37:21", "remaining_time": "1 day, 20:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3713, "total_steps": 9627, "loss": 1.7954, "learning_rate": 6.757288751684e-05, "epoch": 0.3856860912018282, "percentage": 38.57, "elapsed_time": "1 day, 3:37:49", "remaining_time": "1 day, 20:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3714, "total_steps": 9627, "loss": 1.8645, "learning_rate": 6.75576109462126e-05, "epoch": 0.38578996572140856, "percentage": 38.58, "elapsed_time": "1 day, 3:38:18", "remaining_time": "1 day, 20:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3715, "total_steps": 9627, "loss": 1.8103, "learning_rate": 6.75423325058366e-05, "epoch": 0.3858938402409889, "percentage": 38.59, "elapsed_time": "1 day, 3:38:46", "remaining_time": "1 day, 19:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3716, "total_steps": 9627, "loss": 1.6896, "learning_rate": 6.7527052197339e-05, "epoch": 0.3859977147605692, "percentage": 38.6, "elapsed_time": "1 day, 3:39:15", "remaining_time": "1 day, 19:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3717, "total_steps": 9627, "loss": 1.9697, "learning_rate": 6.751177002234706e-05, "epoch": 0.3861015892801496, "percentage": 38.61, "elapsed_time": "1 day, 3:39:43", "remaining_time": "1 day, 19:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3718, "total_steps": 9627, "loss": 1.9304, "learning_rate": 6.749648598248821e-05, "epoch": 0.3862054637997299, "percentage": 38.62, "elapsed_time": "1 day, 3:40:10", "remaining_time": "1 day, 19:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3719, "total_steps": 9627, "loss": 1.6306, "learning_rate": 6.74812000793901e-05, "epoch": 0.38630933831931025, "percentage": 38.63, "elapsed_time": "1 day, 3:40:39", "remaining_time": "1 day, 19:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3720, "total_steps": 9627, "loss": 1.6424, "learning_rate": 6.74659123146805e-05, "epoch": 0.38641321283889063, "percentage": 38.64, "elapsed_time": "1 day, 3:41:09", "remaining_time": "1 day, 19:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3721, "total_steps": 9627, "loss": 1.4823, "learning_rate": 6.745062268998752e-05, "epoch": 0.38651708735847096, "percentage": 38.65, "elapsed_time": "1 day, 3:41:37", "remaining_time": "1 day, 19:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3722, "total_steps": 9627, "loss": 1.6857, "learning_rate": 6.743533120693932e-05, "epoch": 0.38662096187805134, "percentage": 38.66, "elapsed_time": "1 day, 3:42:05", "remaining_time": "1 day, 19:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3723, "total_steps": 9627, "loss": 1.7333, "learning_rate": 6.742003786716435e-05, "epoch": 0.38672483639763167, "percentage": 38.67, "elapsed_time": "1 day, 3:42:33", "remaining_time": "1 day, 19:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3724, "total_steps": 9627, "loss": 1.7304, "learning_rate": 6.740474267229123e-05, "epoch": 0.386828710917212, "percentage": 38.68, "elapsed_time": "1 day, 3:43:02", "remaining_time": "1 day, 19:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3725, "total_steps": 9627, "loss": 1.6984, "learning_rate": 6.738944562394878e-05, "epoch": 0.3869325854367924, "percentage": 38.69, "elapsed_time": "1 day, 3:43:31", "remaining_time": "1 day, 19:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3726, "total_steps": 9627, "loss": 1.6048, "learning_rate": 6.737414672376601e-05, "epoch": 0.3870364599563727, "percentage": 38.7, "elapsed_time": "1 day, 3:43:59", "remaining_time": "1 day, 19:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3727, "total_steps": 9627, "loss": 1.8856, "learning_rate": 6.735884597337214e-05, "epoch": 0.38714033447595303, "percentage": 38.71, "elapsed_time": "1 day, 3:44:27", "remaining_time": "1 day, 19:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3728, "total_steps": 9627, "loss": 1.6613, "learning_rate": 6.73435433743966e-05, "epoch": 0.3872442089955334, "percentage": 38.72, "elapsed_time": "1 day, 3:44:55", "remaining_time": "1 day, 19:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3729, "total_steps": 9627, "loss": 1.6385, "learning_rate": 6.732823892846895e-05, "epoch": 0.38734808351511374, "percentage": 38.73, "elapsed_time": "1 day, 3:45:24", "remaining_time": "1 day, 19:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3730, "total_steps": 9627, "loss": 1.6883, "learning_rate": 6.731293263721902e-05, "epoch": 0.38745195803469407, "percentage": 38.75, "elapsed_time": "1 day, 3:45:52", "remaining_time": "1 day, 19:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3731, "total_steps": 9627, "loss": 1.677, "learning_rate": 6.72976245022768e-05, "epoch": 0.38755583255427445, "percentage": 38.76, "elapsed_time": "1 day, 3:46:21", "remaining_time": "1 day, 19:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3732, "total_steps": 9627, "loss": 1.8645, "learning_rate": 6.728231452527251e-05, "epoch": 0.3876597070738548, "percentage": 38.77, "elapsed_time": "1 day, 3:46:50", "remaining_time": "1 day, 19:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3733, "total_steps": 9627, "loss": 1.7683, "learning_rate": 6.726700270783655e-05, "epoch": 0.3877635815934351, "percentage": 38.78, "elapsed_time": "1 day, 3:47:18", "remaining_time": "1 day, 19:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3734, "total_steps": 9627, "loss": 1.821, "learning_rate": 6.725168905159945e-05, "epoch": 0.3878674561130155, "percentage": 38.79, "elapsed_time": "1 day, 3:47:47", "remaining_time": "1 day, 19:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3735, "total_steps": 9627, "loss": 1.7861, "learning_rate": 6.723637355819206e-05, "epoch": 0.3879713306325958, "percentage": 38.8, "elapsed_time": "1 day, 3:48:15", "remaining_time": "1 day, 19:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3736, "total_steps": 9627, "loss": 1.7543, "learning_rate": 6.722105622924533e-05, "epoch": 0.3880752051521762, "percentage": 38.81, "elapsed_time": "1 day, 3:48:44", "remaining_time": "1 day, 19:51:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3737, "total_steps": 9627, "loss": 1.7804, "learning_rate": 6.720573706639044e-05, "epoch": 0.3881790796717565, "percentage": 38.82, "elapsed_time": "1 day, 3:49:13", "remaining_time": "1 day, 19:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3738, "total_steps": 9627, "loss": 1.5168, "learning_rate": 6.719041607125877e-05, "epoch": 0.38828295419133685, "percentage": 38.83, "elapsed_time": "1 day, 3:49:41", "remaining_time": "1 day, 19:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3739, "total_steps": 9627, "loss": 1.801, "learning_rate": 6.717509324548187e-05, "epoch": 0.38838682871091723, "percentage": 38.84, "elapsed_time": "1 day, 3:50:10", "remaining_time": "1 day, 19:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3740, "total_steps": 9627, "loss": 1.6002, "learning_rate": 6.715976859069151e-05, "epoch": 0.38849070323049756, "percentage": 38.85, "elapsed_time": "1 day, 3:50:38", "remaining_time": "1 day, 19:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3741, "total_steps": 9627, "loss": 1.5895, "learning_rate": 6.714444210851964e-05, "epoch": 0.3885945777500779, "percentage": 38.86, "elapsed_time": "1 day, 3:51:06", "remaining_time": "1 day, 19:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3742, "total_steps": 9627, "loss": 1.8872, "learning_rate": 6.712911380059845e-05, "epoch": 0.38869845226965827, "percentage": 38.87, "elapsed_time": "1 day, 3:51:35", "remaining_time": "1 day, 19:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3743, "total_steps": 9627, "loss": 1.7437, "learning_rate": 6.711378366856023e-05, "epoch": 0.3888023267892386, "percentage": 38.88, "elapsed_time": "1 day, 3:52:03", "remaining_time": "1 day, 19:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3744, "total_steps": 9627, "loss": 1.7002, "learning_rate": 6.709845171403754e-05, "epoch": 0.3889062013088189, "percentage": 38.89, "elapsed_time": "1 day, 3:52:31", "remaining_time": "1 day, 19:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3745, "total_steps": 9627, "loss": 1.7328, "learning_rate": 6.70831179386631e-05, "epoch": 0.3890100758283993, "percentage": 38.9, "elapsed_time": "1 day, 3:53:00", "remaining_time": "1 day, 19:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3746, "total_steps": 9627, "loss": 1.7358, "learning_rate": 6.706778234406987e-05, "epoch": 0.38911395034797963, "percentage": 38.91, "elapsed_time": "1 day, 3:53:28", "remaining_time": "1 day, 19:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3747, "total_steps": 9627, "loss": 1.7627, "learning_rate": 6.705244493189094e-05, "epoch": 0.38921782486756, "percentage": 38.92, "elapsed_time": "1 day, 3:53:55", "remaining_time": "1 day, 19:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3748, "total_steps": 9627, "loss": 1.6005, "learning_rate": 6.703710570375966e-05, "epoch": 0.38932169938714034, "percentage": 38.93, "elapsed_time": "1 day, 3:54:24", "remaining_time": "1 day, 19:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3749, "total_steps": 9627, "loss": 1.6763, "learning_rate": 6.702176466130953e-05, "epoch": 0.38942557390672067, "percentage": 38.94, "elapsed_time": "1 day, 3:54:53", "remaining_time": "1 day, 19:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3750, "total_steps": 9627, "loss": 1.8209, "learning_rate": 6.70064218061742e-05, "epoch": 0.38952944842630105, "percentage": 38.95, "elapsed_time": "1 day, 3:55:21", "remaining_time": "1 day, 19:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3751, "total_steps": 9627, "loss": 1.4882, "learning_rate": 6.699107713998762e-05, "epoch": 0.3896333229458814, "percentage": 38.96, "elapsed_time": "1 day, 3:55:49", "remaining_time": "1 day, 19:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3752, "total_steps": 9627, "loss": 1.713, "learning_rate": 6.697573066438387e-05, "epoch": 0.3897371974654617, "percentage": 38.97, "elapsed_time": "1 day, 3:56:17", "remaining_time": "1 day, 19:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3753, "total_steps": 9627, "loss": 1.9039, "learning_rate": 6.69603823809972e-05, "epoch": 0.3898410719850421, "percentage": 38.98, "elapsed_time": "1 day, 3:56:46", "remaining_time": "1 day, 19:44:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3754, "total_steps": 9627, "loss": 1.7179, "learning_rate": 6.694503229146212e-05, "epoch": 0.3899449465046224, "percentage": 38.99, "elapsed_time": "1 day, 3:57:14", "remaining_time": "1 day, 19:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3755, "total_steps": 9627, "loss": 1.5286, "learning_rate": 6.692968039741328e-05, "epoch": 0.39004882102420274, "percentage": 39.0, "elapsed_time": "1 day, 3:57:42", "remaining_time": "1 day, 19:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3756, "total_steps": 9627, "loss": 1.6235, "learning_rate": 6.691432670048552e-05, "epoch": 0.3901526955437831, "percentage": 39.02, "elapsed_time": "1 day, 3:58:12", "remaining_time": "1 day, 19:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3757, "total_steps": 9627, "loss": 1.6554, "learning_rate": 6.689897120231389e-05, "epoch": 0.39025657006336345, "percentage": 39.03, "elapsed_time": "1 day, 3:58:39", "remaining_time": "1 day, 19:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3758, "total_steps": 9627, "loss": 1.7059, "learning_rate": 6.688361390453368e-05, "epoch": 0.3903604445829438, "percentage": 39.04, "elapsed_time": "1 day, 3:59:08", "remaining_time": "1 day, 19:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3759, "total_steps": 9627, "loss": 1.5193, "learning_rate": 6.686825480878026e-05, "epoch": 0.39046431910252416, "percentage": 39.05, "elapsed_time": "1 day, 3:59:36", "remaining_time": "1 day, 19:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3760, "total_steps": 9627, "loss": 1.7383, "learning_rate": 6.685289391668929e-05, "epoch": 0.3905681936221045, "percentage": 39.06, "elapsed_time": "1 day, 4:00:03", "remaining_time": "1 day, 19:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3761, "total_steps": 9627, "loss": 1.6945, "learning_rate": 6.683753122989656e-05, "epoch": 0.39067206814168487, "percentage": 39.07, "elapsed_time": "1 day, 4:00:33", "remaining_time": "1 day, 19:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3762, "total_steps": 9627, "loss": 1.5765, "learning_rate": 6.682216675003811e-05, "epoch": 0.3907759426612652, "percentage": 39.08, "elapsed_time": "1 day, 4:01:01", "remaining_time": "1 day, 19:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3763, "total_steps": 9627, "loss": 1.7523, "learning_rate": 6.680680047875014e-05, "epoch": 0.3908798171808455, "percentage": 39.09, "elapsed_time": "1 day, 4:01:30", "remaining_time": "1 day, 19:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3764, "total_steps": 9627, "loss": 1.7129, "learning_rate": 6.679143241766898e-05, "epoch": 0.3909836917004259, "percentage": 39.1, "elapsed_time": "1 day, 4:01:58", "remaining_time": "1 day, 19:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3765, "total_steps": 9627, "loss": 1.7823, "learning_rate": 6.677606256843126e-05, "epoch": 0.39108756622000623, "percentage": 39.11, "elapsed_time": "1 day, 4:02:26", "remaining_time": "1 day, 19:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3766, "total_steps": 9627, "loss": 1.7184, "learning_rate": 6.676069093267374e-05, "epoch": 0.39119144073958656, "percentage": 39.12, "elapsed_time": "1 day, 4:02:55", "remaining_time": "1 day, 19:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3767, "total_steps": 9627, "loss": 1.921, "learning_rate": 6.674531751203335e-05, "epoch": 0.39129531525916694, "percentage": 39.13, "elapsed_time": "1 day, 4:03:23", "remaining_time": "1 day, 19:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3768, "total_steps": 9627, "loss": 1.6948, "learning_rate": 6.672994230814729e-05, "epoch": 0.39139918977874727, "percentage": 39.14, "elapsed_time": "1 day, 4:03:51", "remaining_time": "1 day, 19:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3769, "total_steps": 9627, "loss": 1.6143, "learning_rate": 6.671456532265285e-05, "epoch": 0.3915030642983276, "percentage": 39.15, "elapsed_time": "1 day, 4:04:20", "remaining_time": "1 day, 19:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3770, "total_steps": 9627, "loss": 1.6526, "learning_rate": 6.669918655718759e-05, "epoch": 0.391606938817908, "percentage": 39.16, "elapsed_time": "1 day, 4:04:48", "remaining_time": "1 day, 19:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3771, "total_steps": 9627, "loss": 1.8916, "learning_rate": 6.668380601338924e-05, "epoch": 0.3917108133374883, "percentage": 39.17, "elapsed_time": "1 day, 4:05:17", "remaining_time": "1 day, 19:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3772, "total_steps": 9627, "loss": 1.803, "learning_rate": 6.666842369289566e-05, "epoch": 0.3918146878570687, "percentage": 39.18, "elapsed_time": "1 day, 4:05:45", "remaining_time": "1 day, 19:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3773, "total_steps": 9627, "loss": 1.7646, "learning_rate": 6.665303959734499e-05, "epoch": 0.391918562376649, "percentage": 39.19, "elapsed_time": "1 day, 4:06:13", "remaining_time": "1 day, 19:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3774, "total_steps": 9627, "loss": 1.8358, "learning_rate": 6.66376537283755e-05, "epoch": 0.39202243689622934, "percentage": 39.2, "elapsed_time": "1 day, 4:06:42", "remaining_time": "1 day, 19:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3775, "total_steps": 9627, "loss": 1.7087, "learning_rate": 6.662226608762566e-05, "epoch": 0.3921263114158097, "percentage": 39.21, "elapsed_time": "1 day, 4:07:10", "remaining_time": "1 day, 19:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3776, "total_steps": 9627, "loss": 1.81, "learning_rate": 6.660687667673416e-05, "epoch": 0.39223018593539005, "percentage": 39.22, "elapsed_time": "1 day, 4:07:38", "remaining_time": "1 day, 19:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3777, "total_steps": 9627, "loss": 1.6589, "learning_rate": 6.659148549733983e-05, "epoch": 0.3923340604549704, "percentage": 39.23, "elapsed_time": "1 day, 4:08:07", "remaining_time": "1 day, 19:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3778, "total_steps": 9627, "loss": 1.653, "learning_rate": 6.657609255108169e-05, "epoch": 0.39243793497455076, "percentage": 39.24, "elapsed_time": "1 day, 4:08:34", "remaining_time": "1 day, 19:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3779, "total_steps": 9627, "loss": 1.7404, "learning_rate": 6.656069783959901e-05, "epoch": 0.3925418094941311, "percentage": 39.25, "elapsed_time": "1 day, 4:09:04", "remaining_time": "1 day, 19:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3780, "total_steps": 9627, "loss": 2.1317, "learning_rate": 6.654530136453118e-05, "epoch": 0.3926456840137114, "percentage": 39.26, "elapsed_time": "1 day, 4:09:32", "remaining_time": "1 day, 19:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3781, "total_steps": 9627, "loss": 1.864, "learning_rate": 6.652990312751781e-05, "epoch": 0.3927495585332918, "percentage": 39.27, "elapsed_time": "1 day, 4:10:01", "remaining_time": "1 day, 19:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3782, "total_steps": 9627, "loss": 1.7456, "learning_rate": 6.65145031301987e-05, "epoch": 0.3928534330528721, "percentage": 39.29, "elapsed_time": "1 day, 4:10:29", "remaining_time": "1 day, 19:32:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3783, "total_steps": 9627, "loss": 1.7215, "learning_rate": 6.649910137421383e-05, "epoch": 0.39295730757245245, "percentage": 39.3, "elapsed_time": "1 day, 4:10:58", "remaining_time": "1 day, 19:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3784, "total_steps": 9627, "loss": 1.8767, "learning_rate": 6.648369786120336e-05, "epoch": 0.39306118209203283, "percentage": 39.31, "elapsed_time": "1 day, 4:11:26", "remaining_time": "1 day, 19:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3785, "total_steps": 9627, "loss": 1.7678, "learning_rate": 6.646829259280765e-05, "epoch": 0.39316505661161316, "percentage": 39.32, "elapsed_time": "1 day, 4:11:55", "remaining_time": "1 day, 19:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3786, "total_steps": 9627, "loss": 1.6417, "learning_rate": 6.645288557066722e-05, "epoch": 0.39326893113119354, "percentage": 39.33, "elapsed_time": "1 day, 4:12:23", "remaining_time": "1 day, 19:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3787, "total_steps": 9627, "loss": 1.7405, "learning_rate": 6.643747679642282e-05, "epoch": 0.39337280565077387, "percentage": 39.34, "elapsed_time": "1 day, 4:12:52", "remaining_time": "1 day, 19:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3788, "total_steps": 9627, "loss": 1.7114, "learning_rate": 6.642206627171536e-05, "epoch": 0.3934766801703542, "percentage": 39.35, "elapsed_time": "1 day, 4:13:20", "remaining_time": "1 day, 19:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3789, "total_steps": 9627, "loss": 1.433, "learning_rate": 6.640665399818594e-05, "epoch": 0.3935805546899346, "percentage": 39.36, "elapsed_time": "1 day, 4:13:49", "remaining_time": "1 day, 19:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3790, "total_steps": 9627, "loss": 1.6693, "learning_rate": 6.639123997747585e-05, "epoch": 0.3936844292095149, "percentage": 39.37, "elapsed_time": "1 day, 4:14:17", "remaining_time": "1 day, 19:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3791, "total_steps": 9627, "loss": 1.7434, "learning_rate": 6.637582421122657e-05, "epoch": 0.39378830372909523, "percentage": 39.38, "elapsed_time": "1 day, 4:14:45", "remaining_time": "1 day, 19:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3792, "total_steps": 9627, "loss": 1.6637, "learning_rate": 6.636040670107972e-05, "epoch": 0.3938921782486756, "percentage": 39.39, "elapsed_time": "1 day, 4:15:13", "remaining_time": "1 day, 19:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3793, "total_steps": 9627, "loss": 1.9512, "learning_rate": 6.63449874486772e-05, "epoch": 0.39399605276825594, "percentage": 39.4, "elapsed_time": "1 day, 4:15:43", "remaining_time": "1 day, 19:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3794, "total_steps": 9627, "loss": 1.5369, "learning_rate": 6.632956645566099e-05, "epoch": 0.39409992728783627, "percentage": 39.41, "elapsed_time": "1 day, 4:16:11", "remaining_time": "1 day, 19:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3795, "total_steps": 9627, "loss": 1.7759, "learning_rate": 6.631414372367333e-05, "epoch": 0.39420380180741665, "percentage": 39.42, "elapsed_time": "1 day, 4:16:40", "remaining_time": "1 day, 19:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3796, "total_steps": 9627, "loss": 1.8498, "learning_rate": 6.629871925435663e-05, "epoch": 0.394307676326997, "percentage": 39.43, "elapsed_time": "1 day, 4:17:08", "remaining_time": "1 day, 19:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3797, "total_steps": 9627, "loss": 1.7042, "learning_rate": 6.628329304935346e-05, "epoch": 0.3944115508465773, "percentage": 39.44, "elapsed_time": "1 day, 4:17:36", "remaining_time": "1 day, 19:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3798, "total_steps": 9627, "loss": 1.6208, "learning_rate": 6.62678651103066e-05, "epoch": 0.3945154253661577, "percentage": 39.45, "elapsed_time": "1 day, 4:18:05", "remaining_time": "1 day, 19:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3799, "total_steps": 9627, "loss": 1.8095, "learning_rate": 6.625243543885899e-05, "epoch": 0.394619299885738, "percentage": 39.46, "elapsed_time": "1 day, 4:18:33", "remaining_time": "1 day, 19:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3800, "total_steps": 9627, "loss": 1.821, "learning_rate": 6.623700403665378e-05, "epoch": 0.3947231744053184, "percentage": 39.47, "elapsed_time": "1 day, 4:19:02", "remaining_time": "1 day, 19:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3801, "total_steps": 9627, "loss": 1.9329, "learning_rate": 6.622157090533431e-05, "epoch": 0.3948270489248987, "percentage": 39.48, "elapsed_time": "1 day, 4:19:31", "remaining_time": "1 day, 19:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3802, "total_steps": 9627, "loss": 1.641, "learning_rate": 6.620613604654405e-05, "epoch": 0.39493092344447905, "percentage": 39.49, "elapsed_time": "1 day, 4:19:59", "remaining_time": "1 day, 19:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3803, "total_steps": 9627, "loss": 1.8927, "learning_rate": 6.619069946192672e-05, "epoch": 0.39503479796405944, "percentage": 39.5, "elapsed_time": "1 day, 4:20:28", "remaining_time": "1 day, 19:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3804, "total_steps": 9627, "loss": 1.7063, "learning_rate": 6.61752611531262e-05, "epoch": 0.39513867248363976, "percentage": 39.51, "elapsed_time": "1 day, 4:20:57", "remaining_time": "1 day, 19:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3805, "total_steps": 9627, "loss": 1.6576, "learning_rate": 6.615982112178653e-05, "epoch": 0.3952425470032201, "percentage": 39.52, "elapsed_time": "1 day, 4:21:25", "remaining_time": "1 day, 19:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3806, "total_steps": 9627, "loss": 1.7814, "learning_rate": 6.614437936955196e-05, "epoch": 0.3953464215228005, "percentage": 39.53, "elapsed_time": "1 day, 4:21:53", "remaining_time": "1 day, 19:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3807, "total_steps": 9627, "loss": 1.7102, "learning_rate": 6.612893589806693e-05, "epoch": 0.3954502960423808, "percentage": 39.55, "elapsed_time": "1 day, 4:22:23", "remaining_time": "1 day, 19:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3808, "total_steps": 9627, "loss": 1.6924, "learning_rate": 6.611349070897604e-05, "epoch": 0.3955541705619611, "percentage": 39.56, "elapsed_time": "1 day, 4:22:50", "remaining_time": "1 day, 19:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3809, "total_steps": 9627, "loss": 1.5255, "learning_rate": 6.609804380392406e-05, "epoch": 0.3956580450815415, "percentage": 39.57, "elapsed_time": "1 day, 4:23:18", "remaining_time": "1 day, 19:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3810, "total_steps": 9627, "loss": 1.734, "learning_rate": 6.6082595184556e-05, "epoch": 0.39576191960112184, "percentage": 39.58, "elapsed_time": "1 day, 4:23:48", "remaining_time": "1 day, 19:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3811, "total_steps": 9627, "loss": 1.7854, "learning_rate": 6.606714485251699e-05, "epoch": 0.3958657941207022, "percentage": 39.59, "elapsed_time": "1 day, 4:24:16", "remaining_time": "1 day, 19:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3812, "total_steps": 9627, "loss": 1.7713, "learning_rate": 6.605169280945238e-05, "epoch": 0.39596966864028255, "percentage": 39.6, "elapsed_time": "1 day, 4:24:45", "remaining_time": "1 day, 19:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3813, "total_steps": 9627, "loss": 1.5804, "learning_rate": 6.603623905700771e-05, "epoch": 0.3960735431598629, "percentage": 39.61, "elapsed_time": "1 day, 4:25:13", "remaining_time": "1 day, 19:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3814, "total_steps": 9627, "loss": 1.7562, "learning_rate": 6.602078359682865e-05, "epoch": 0.39617741767944326, "percentage": 39.62, "elapsed_time": "1 day, 4:25:42", "remaining_time": "1 day, 19:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3815, "total_steps": 9627, "loss": 1.6313, "learning_rate": 6.600532643056112e-05, "epoch": 0.3962812921990236, "percentage": 39.63, "elapsed_time": "1 day, 4:26:10", "remaining_time": "1 day, 19:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3816, "total_steps": 9627, "loss": 1.7867, "learning_rate": 6.598986755985116e-05, "epoch": 0.3963851667186039, "percentage": 39.64, "elapsed_time": "1 day, 4:26:39", "remaining_time": "1 day, 19:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3817, "total_steps": 9627, "loss": 1.5696, "learning_rate": 6.597440698634503e-05, "epoch": 0.3964890412381843, "percentage": 39.65, "elapsed_time": "1 day, 4:27:07", "remaining_time": "1 day, 19:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3818, "total_steps": 9627, "loss": 1.688, "learning_rate": 6.595894471168917e-05, "epoch": 0.3965929157577646, "percentage": 39.66, "elapsed_time": "1 day, 4:27:36", "remaining_time": "1 day, 19:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3819, "total_steps": 9627, "loss": 1.7786, "learning_rate": 6.594348073753019e-05, "epoch": 0.39669679027734495, "percentage": 39.67, "elapsed_time": "1 day, 4:28:04", "remaining_time": "1 day, 19:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3820, "total_steps": 9627, "loss": 1.5053, "learning_rate": 6.592801506551486e-05, "epoch": 0.39680066479692533, "percentage": 39.68, "elapsed_time": "1 day, 4:28:34", "remaining_time": "1 day, 19:17:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3821, "total_steps": 9627, "loss": 1.7091, "learning_rate": 6.591254769729018e-05, "epoch": 0.39690453931650566, "percentage": 39.69, "elapsed_time": "1 day, 4:29:01", "remaining_time": "1 day, 19:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3822, "total_steps": 9627, "loss": 1.6866, "learning_rate": 6.589707863450327e-05, "epoch": 0.397008413836086, "percentage": 39.7, "elapsed_time": "1 day, 4:29:30", "remaining_time": "1 day, 19:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3823, "total_steps": 9627, "loss": 1.703, "learning_rate": 6.588160787880151e-05, "epoch": 0.39711228835566637, "percentage": 39.71, "elapsed_time": "1 day, 4:29:58", "remaining_time": "1 day, 19:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3824, "total_steps": 9627, "loss": 1.6685, "learning_rate": 6.586613543183237e-05, "epoch": 0.3972161628752467, "percentage": 39.72, "elapsed_time": "1 day, 4:30:28", "remaining_time": "1 day, 19:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3825, "total_steps": 9627, "loss": 1.6512, "learning_rate": 6.58506612952436e-05, "epoch": 0.3973200373948271, "percentage": 39.73, "elapsed_time": "1 day, 4:30:56", "remaining_time": "1 day, 19:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3826, "total_steps": 9627, "loss": 1.7624, "learning_rate": 6.583518547068302e-05, "epoch": 0.3974239119144074, "percentage": 39.74, "elapsed_time": "1 day, 4:31:25", "remaining_time": "1 day, 19:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3827, "total_steps": 9627, "loss": 1.4234, "learning_rate": 6.581970795979871e-05, "epoch": 0.39752778643398773, "percentage": 39.75, "elapsed_time": "1 day, 4:31:54", "remaining_time": "1 day, 19:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3828, "total_steps": 9627, "loss": 1.7441, "learning_rate": 6.580422876423891e-05, "epoch": 0.3976316609535681, "percentage": 39.76, "elapsed_time": "1 day, 4:32:21", "remaining_time": "1 day, 19:14:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3829, "total_steps": 9627, "loss": 1.6835, "learning_rate": 6.578874788565201e-05, "epoch": 0.39773553547314844, "percentage": 39.77, "elapsed_time": "1 day, 4:32:50", "remaining_time": "1 day, 19:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3830, "total_steps": 9627, "loss": 1.5985, "learning_rate": 6.577326532568663e-05, "epoch": 0.39783940999272877, "percentage": 39.78, "elapsed_time": "1 day, 4:33:20", "remaining_time": "1 day, 19:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3831, "total_steps": 9627, "loss": 1.734, "learning_rate": 6.575778108599151e-05, "epoch": 0.39794328451230915, "percentage": 39.79, "elapsed_time": "1 day, 4:33:47", "remaining_time": "1 day, 19:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3832, "total_steps": 9627, "loss": 1.6279, "learning_rate": 6.574229516821564e-05, "epoch": 0.3980471590318895, "percentage": 39.8, "elapsed_time": "1 day, 4:34:16", "remaining_time": "1 day, 19:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3833, "total_steps": 9627, "loss": 1.7271, "learning_rate": 6.572680757400813e-05, "epoch": 0.3981510335514698, "percentage": 39.82, "elapsed_time": "1 day, 4:34:45", "remaining_time": "1 day, 19:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3834, "total_steps": 9627, "loss": 1.8058, "learning_rate": 6.571131830501827e-05, "epoch": 0.3982549080710502, "percentage": 39.83, "elapsed_time": "1 day, 4:35:13", "remaining_time": "1 day, 19:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3835, "total_steps": 9627, "loss": 1.6509, "learning_rate": 6.569582736289556e-05, "epoch": 0.3983587825906305, "percentage": 39.84, "elapsed_time": "1 day, 4:35:42", "remaining_time": "1 day, 19:11:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3836, "total_steps": 9627, "loss": 1.5513, "learning_rate": 6.56803347492897e-05, "epoch": 0.39846265711021084, "percentage": 39.85, "elapsed_time": "1 day, 4:36:10", "remaining_time": "1 day, 19:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3837, "total_steps": 9627, "loss": 1.5777, "learning_rate": 6.566484046585047e-05, "epoch": 0.3985665316297912, "percentage": 39.86, "elapsed_time": "1 day, 4:36:39", "remaining_time": "1 day, 19:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3838, "total_steps": 9627, "loss": 1.8612, "learning_rate": 6.564934451422793e-05, "epoch": 0.39867040614937155, "percentage": 39.87, "elapsed_time": "1 day, 4:37:08", "remaining_time": "1 day, 19:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3839, "total_steps": 9627, "loss": 1.7228, "learning_rate": 6.563384689607227e-05, "epoch": 0.39877428066895193, "percentage": 39.88, "elapsed_time": "1 day, 4:37:37", "remaining_time": "1 day, 19:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3840, "total_steps": 9627, "loss": 1.7733, "learning_rate": 6.561834761303386e-05, "epoch": 0.39887815518853226, "percentage": 39.89, "elapsed_time": "1 day, 4:38:05", "remaining_time": "1 day, 19:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3841, "total_steps": 9627, "loss": 1.8526, "learning_rate": 6.560284666676327e-05, "epoch": 0.3989820297081126, "percentage": 39.9, "elapsed_time": "1 day, 4:38:33", "remaining_time": "1 day, 19:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3842, "total_steps": 9627, "loss": 1.4567, "learning_rate": 6.558734405891121e-05, "epoch": 0.39908590422769297, "percentage": 39.91, "elapsed_time": "1 day, 4:39:03", "remaining_time": "1 day, 19:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3843, "total_steps": 9627, "loss": 1.8229, "learning_rate": 6.557183979112859e-05, "epoch": 0.3991897787472733, "percentage": 39.92, "elapsed_time": "1 day, 4:39:30", "remaining_time": "1 day, 19:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3844, "total_steps": 9627, "loss": 1.7953, "learning_rate": 6.55563338650665e-05, "epoch": 0.3992936532668536, "percentage": 39.93, "elapsed_time": "1 day, 4:40:00", "remaining_time": "1 day, 19:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3845, "total_steps": 9627, "loss": 1.4815, "learning_rate": 6.554082628237619e-05, "epoch": 0.399397527786434, "percentage": 39.94, "elapsed_time": "1 day, 4:40:29", "remaining_time": "1 day, 19:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3846, "total_steps": 9627, "loss": 1.9411, "learning_rate": 6.552531704470911e-05, "epoch": 0.39950140230601433, "percentage": 39.95, "elapsed_time": "1 day, 4:40:57", "remaining_time": "1 day, 19:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3847, "total_steps": 9627, "loss": 1.6889, "learning_rate": 6.550980615371687e-05, "epoch": 0.39960527682559466, "percentage": 39.96, "elapsed_time": "1 day, 4:41:26", "remaining_time": "1 day, 19:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3848, "total_steps": 9627, "loss": 1.6639, "learning_rate": 6.549429361105126e-05, "epoch": 0.39970915134517504, "percentage": 39.97, "elapsed_time": "1 day, 4:41:54", "remaining_time": "1 day, 19:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3849, "total_steps": 9627, "loss": 1.7107, "learning_rate": 6.547877941836424e-05, "epoch": 0.39981302586475537, "percentage": 39.98, "elapsed_time": "1 day, 4:42:24", "remaining_time": "1 day, 19:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3850, "total_steps": 9627, "loss": 1.7377, "learning_rate": 6.546326357730794e-05, "epoch": 0.39991690038433575, "percentage": 39.99, "elapsed_time": "1 day, 4:42:52", "remaining_time": "1 day, 19:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3851, "total_steps": 9627, "loss": 1.8146, "learning_rate": 6.544774608953468e-05, "epoch": 0.4000207749039161, "percentage": 40.0, "elapsed_time": "1 day, 4:43:21", "remaining_time": "1 day, 19:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3852, "total_steps": 9627, "loss": 1.6474, "learning_rate": 6.543222695669697e-05, "epoch": 0.4001246494234964, "percentage": 40.01, "elapsed_time": "1 day, 4:43:49", "remaining_time": "1 day, 19:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3853, "total_steps": 9627, "loss": 1.8214, "learning_rate": 6.541670618044748e-05, "epoch": 0.4002285239430768, "percentage": 40.02, "elapsed_time": "1 day, 4:44:19", "remaining_time": "1 day, 19:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3854, "total_steps": 9627, "loss": 1.7134, "learning_rate": 6.540118376243903e-05, "epoch": 0.4003323984626571, "percentage": 40.03, "elapsed_time": "1 day, 4:44:47", "remaining_time": "1 day, 19:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3855, "total_steps": 9627, "loss": 1.974, "learning_rate": 6.538565970432463e-05, "epoch": 0.40043627298223744, "percentage": 40.04, "elapsed_time": "1 day, 4:45:16", "remaining_time": "1 day, 19:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3856, "total_steps": 9627, "loss": 1.5895, "learning_rate": 6.537013400775748e-05, "epoch": 0.4005401475018178, "percentage": 40.05, "elapsed_time": "1 day, 4:45:43", "remaining_time": "1 day, 19:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3857, "total_steps": 9627, "loss": 1.6404, "learning_rate": 6.535460667439097e-05, "epoch": 0.40064402202139815, "percentage": 40.06, "elapsed_time": "1 day, 4:46:13", "remaining_time": "1 day, 19:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3858, "total_steps": 9627, "loss": 1.8849, "learning_rate": 6.53390777058786e-05, "epoch": 0.4007478965409785, "percentage": 40.07, "elapsed_time": "1 day, 4:46:40", "remaining_time": "1 day, 19:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3859, "total_steps": 9627, "loss": 1.7472, "learning_rate": 6.532354710387411e-05, "epoch": 0.40085177106055886, "percentage": 40.09, "elapsed_time": "1 day, 4:47:10", "remaining_time": "1 day, 19:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3860, "total_steps": 9627, "loss": 1.601, "learning_rate": 6.530801487003139e-05, "epoch": 0.4009556455801392, "percentage": 40.1, "elapsed_time": "1 day, 4:47:38", "remaining_time": "1 day, 19:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3861, "total_steps": 9627, "loss": 1.7275, "learning_rate": 6.529248100600449e-05, "epoch": 0.4010595200997195, "percentage": 40.11, "elapsed_time": "1 day, 4:48:07", "remaining_time": "1 day, 19:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3862, "total_steps": 9627, "loss": 1.6634, "learning_rate": 6.527694551344765e-05, "epoch": 0.4011633946192999, "percentage": 40.12, "elapsed_time": "1 day, 4:48:35", "remaining_time": "1 day, 19:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3863, "total_steps": 9627, "loss": 1.6647, "learning_rate": 6.526140839401527e-05, "epoch": 0.4012672691388802, "percentage": 40.13, "elapsed_time": "1 day, 4:49:03", "remaining_time": "1 day, 18:59:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3864, "total_steps": 9627, "loss": 1.8112, "learning_rate": 6.524586964936194e-05, "epoch": 0.4013711436584606, "percentage": 40.14, "elapsed_time": "1 day, 4:49:33", "remaining_time": "1 day, 18:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3865, "total_steps": 9627, "loss": 1.7179, "learning_rate": 6.523032928114242e-05, "epoch": 0.40147501817804093, "percentage": 40.15, "elapsed_time": "1 day, 4:50:01", "remaining_time": "1 day, 18:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3866, "total_steps": 9627, "loss": 1.4234, "learning_rate": 6.521478729101164e-05, "epoch": 0.40157889269762126, "percentage": 40.16, "elapsed_time": "1 day, 4:50:31", "remaining_time": "1 day, 18:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3867, "total_steps": 9627, "loss": 1.7079, "learning_rate": 6.519924368062468e-05, "epoch": 0.40168276721720164, "percentage": 40.17, "elapsed_time": "1 day, 4:50:58", "remaining_time": "1 day, 18:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3868, "total_steps": 9627, "loss": 1.6538, "learning_rate": 6.518369845163683e-05, "epoch": 0.40178664173678197, "percentage": 40.18, "elapsed_time": "1 day, 4:51:28", "remaining_time": "1 day, 18:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3869, "total_steps": 9627, "loss": 1.7034, "learning_rate": 6.516815160570355e-05, "epoch": 0.4018905162563623, "percentage": 40.19, "elapsed_time": "1 day, 4:51:56", "remaining_time": "1 day, 18:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3870, "total_steps": 9627, "loss": 1.5712, "learning_rate": 6.515260314448041e-05, "epoch": 0.4019943907759427, "percentage": 40.2, "elapsed_time": "1 day, 4:52:26", "remaining_time": "1 day, 18:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3871, "total_steps": 9627, "loss": 1.6909, "learning_rate": 6.513705306962325e-05, "epoch": 0.402098265295523, "percentage": 40.21, "elapsed_time": "1 day, 4:52:54", "remaining_time": "1 day, 18:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3872, "total_steps": 9627, "loss": 1.5812, "learning_rate": 6.5121501382788e-05, "epoch": 0.40220213981510333, "percentage": 40.22, "elapsed_time": "1 day, 4:53:22", "remaining_time": "1 day, 18:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3873, "total_steps": 9627, "loss": 1.6611, "learning_rate": 6.51059480856308e-05, "epoch": 0.4023060143346837, "percentage": 40.23, "elapsed_time": "1 day, 4:53:51", "remaining_time": "1 day, 18:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3874, "total_steps": 9627, "loss": 1.5964, "learning_rate": 6.509039317980798e-05, "epoch": 0.40240988885426404, "percentage": 40.24, "elapsed_time": "1 day, 4:54:19", "remaining_time": "1 day, 18:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3875, "total_steps": 9627, "loss": 1.6734, "learning_rate": 6.5074836666976e-05, "epoch": 0.40251376337384437, "percentage": 40.25, "elapsed_time": "1 day, 4:54:49", "remaining_time": "1 day, 18:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3876, "total_steps": 9627, "loss": 1.5993, "learning_rate": 6.505927854879148e-05, "epoch": 0.40261763789342475, "percentage": 40.26, "elapsed_time": "1 day, 4:55:16", "remaining_time": "1 day, 18:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3877, "total_steps": 9627, "loss": 1.6791, "learning_rate": 6.504371882691126e-05, "epoch": 0.4027215124130051, "percentage": 40.27, "elapsed_time": "1 day, 4:55:46", "remaining_time": "1 day, 18:54:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3878, "total_steps": 9627, "loss": 1.7729, "learning_rate": 6.502815750299235e-05, "epoch": 0.40282538693258546, "percentage": 40.28, "elapsed_time": "1 day, 4:56:14", "remaining_time": "1 day, 18:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3879, "total_steps": 9627, "loss": 1.7063, "learning_rate": 6.501259457869187e-05, "epoch": 0.4029292614521658, "percentage": 40.29, "elapsed_time": "1 day, 4:56:43", "remaining_time": "1 day, 18:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3880, "total_steps": 9627, "loss": 1.546, "learning_rate": 6.49970300556672e-05, "epoch": 0.4030331359717461, "percentage": 40.3, "elapsed_time": "1 day, 4:57:11", "remaining_time": "1 day, 18:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3881, "total_steps": 9627, "loss": 1.7616, "learning_rate": 6.498146393557578e-05, "epoch": 0.4031370104913265, "percentage": 40.31, "elapsed_time": "1 day, 4:57:39", "remaining_time": "1 day, 18:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3882, "total_steps": 9627, "loss": 1.7472, "learning_rate": 6.496589622007532e-05, "epoch": 0.4032408850109068, "percentage": 40.32, "elapsed_time": "1 day, 4:58:09", "remaining_time": "1 day, 18:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3883, "total_steps": 9627, "loss": 1.5378, "learning_rate": 6.495032691082367e-05, "epoch": 0.40334475953048715, "percentage": 40.33, "elapsed_time": "1 day, 4:58:37", "remaining_time": "1 day, 18:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3884, "total_steps": 9627, "loss": 1.6228, "learning_rate": 6.493475600947879e-05, "epoch": 0.40344863405006753, "percentage": 40.34, "elapsed_time": "1 day, 4:59:05", "remaining_time": "1 day, 18:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3885, "total_steps": 9627, "loss": 1.8077, "learning_rate": 6.491918351769891e-05, "epoch": 0.40355250856964786, "percentage": 40.36, "elapsed_time": "1 day, 4:59:34", "remaining_time": "1 day, 18:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3886, "total_steps": 9627, "loss": 1.8393, "learning_rate": 6.490360943714235e-05, "epoch": 0.4036563830892282, "percentage": 40.37, "elapsed_time": "1 day, 5:00:02", "remaining_time": "1 day, 18:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3887, "total_steps": 9627, "loss": 1.9139, "learning_rate": 6.488803376946764e-05, "epoch": 0.40376025760880857, "percentage": 40.38, "elapsed_time": "1 day, 5:00:30", "remaining_time": "1 day, 18:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3888, "total_steps": 9627, "loss": 1.7191, "learning_rate": 6.48724565163335e-05, "epoch": 0.4038641321283889, "percentage": 40.39, "elapsed_time": "1 day, 5:01:00", "remaining_time": "1 day, 18:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3889, "total_steps": 9627, "loss": 1.6855, "learning_rate": 6.48568776793987e-05, "epoch": 0.4039680066479693, "percentage": 40.4, "elapsed_time": "1 day, 5:01:28", "remaining_time": "1 day, 18:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3890, "total_steps": 9627, "loss": 1.7529, "learning_rate": 6.484129726032233e-05, "epoch": 0.4040718811675496, "percentage": 40.41, "elapsed_time": "1 day, 5:01:57", "remaining_time": "1 day, 18:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3891, "total_steps": 9627, "loss": 1.5992, "learning_rate": 6.482571526076357e-05, "epoch": 0.40417575568712993, "percentage": 40.42, "elapsed_time": "1 day, 5:02:25", "remaining_time": "1 day, 18:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3892, "total_steps": 9627, "loss": 1.7882, "learning_rate": 6.481013168238178e-05, "epoch": 0.4042796302067103, "percentage": 40.43, "elapsed_time": "1 day, 5:02:55", "remaining_time": "1 day, 18:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3893, "total_steps": 9627, "loss": 1.9548, "learning_rate": 6.479454652683649e-05, "epoch": 0.40438350472629064, "percentage": 40.44, "elapsed_time": "1 day, 5:03:23", "remaining_time": "1 day, 18:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3894, "total_steps": 9627, "loss": 1.5784, "learning_rate": 6.47789597957874e-05, "epoch": 0.40448737924587097, "percentage": 40.45, "elapsed_time": "1 day, 5:03:51", "remaining_time": "1 day, 18:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3895, "total_steps": 9627, "loss": 1.9224, "learning_rate": 6.476337149089438e-05, "epoch": 0.40459125376545135, "percentage": 40.46, "elapsed_time": "1 day, 5:04:19", "remaining_time": "1 day, 18:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3896, "total_steps": 9627, "loss": 1.4597, "learning_rate": 6.474778161381743e-05, "epoch": 0.4046951282850317, "percentage": 40.47, "elapsed_time": "1 day, 5:04:49", "remaining_time": "1 day, 18:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3897, "total_steps": 9627, "loss": 1.9036, "learning_rate": 6.47321901662168e-05, "epoch": 0.404799002804612, "percentage": 40.48, "elapsed_time": "1 day, 5:05:18", "remaining_time": "1 day, 18:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3898, "total_steps": 9627, "loss": 1.802, "learning_rate": 6.471659714975282e-05, "epoch": 0.4049028773241924, "percentage": 40.49, "elapsed_time": "1 day, 5:05:46", "remaining_time": "1 day, 18:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3899, "total_steps": 9627, "loss": 1.7556, "learning_rate": 6.470100256608603e-05, "epoch": 0.4050067518437727, "percentage": 40.5, "elapsed_time": "1 day, 5:06:15", "remaining_time": "1 day, 18:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3900, "total_steps": 9627, "loss": 1.6419, "learning_rate": 6.468540641687716e-05, "epoch": 0.40511062636335304, "percentage": 40.51, "elapsed_time": "1 day, 5:06:43", "remaining_time": "1 day, 18:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3901, "total_steps": 9627, "loss": 1.7802, "learning_rate": 6.466980870378704e-05, "epoch": 0.4052145008829334, "percentage": 40.52, "elapsed_time": "1 day, 5:07:12", "remaining_time": "1 day, 18:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3902, "total_steps": 9627, "loss": 1.9368, "learning_rate": 6.465420942847673e-05, "epoch": 0.40531837540251375, "percentage": 40.53, "elapsed_time": "1 day, 5:07:40", "remaining_time": "1 day, 18:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3903, "total_steps": 9627, "loss": 1.8801, "learning_rate": 6.463860859260742e-05, "epoch": 0.40542224992209414, "percentage": 40.54, "elapsed_time": "1 day, 5:08:10", "remaining_time": "1 day, 18:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3904, "total_steps": 9627, "loss": 1.8356, "learning_rate": 6.462300619784048e-05, "epoch": 0.40552612444167446, "percentage": 40.55, "elapsed_time": "1 day, 5:08:39", "remaining_time": "1 day, 18:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3905, "total_steps": 9627, "loss": 1.5941, "learning_rate": 6.460740224583746e-05, "epoch": 0.4056299989612548, "percentage": 40.56, "elapsed_time": "1 day, 5:09:07", "remaining_time": "1 day, 18:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3906, "total_steps": 9627, "loss": 1.8269, "learning_rate": 6.459179673826001e-05, "epoch": 0.40573387348083517, "percentage": 40.57, "elapsed_time": "1 day, 5:09:36", "remaining_time": "1 day, 18:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3907, "total_steps": 9627, "loss": 1.7104, "learning_rate": 6.457618967677004e-05, "epoch": 0.4058377480004155, "percentage": 40.58, "elapsed_time": "1 day, 5:10:04", "remaining_time": "1 day, 18:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3908, "total_steps": 9627, "loss": 2.0598, "learning_rate": 6.456058106302958e-05, "epoch": 0.4059416225199958, "percentage": 40.59, "elapsed_time": "1 day, 5:10:34", "remaining_time": "1 day, 18:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3909, "total_steps": 9627, "loss": 1.8005, "learning_rate": 6.454497089870082e-05, "epoch": 0.4060454970395762, "percentage": 40.6, "elapsed_time": "1 day, 5:11:03", "remaining_time": "1 day, 18:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3910, "total_steps": 9627, "loss": 1.5732, "learning_rate": 6.45293591854461e-05, "epoch": 0.40614937155915654, "percentage": 40.61, "elapsed_time": "1 day, 5:11:30", "remaining_time": "1 day, 18:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3911, "total_steps": 9627, "loss": 1.8357, "learning_rate": 6.451374592492796e-05, "epoch": 0.40625324607873686, "percentage": 40.63, "elapsed_time": "1 day, 5:12:00", "remaining_time": "1 day, 18:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3912, "total_steps": 9627, "loss": 1.851, "learning_rate": 6.449813111880909e-05, "epoch": 0.40635712059831725, "percentage": 40.64, "elapsed_time": "1 day, 5:12:27", "remaining_time": "1 day, 18:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3913, "total_steps": 9627, "loss": 1.4937, "learning_rate": 6.448251476875235e-05, "epoch": 0.40646099511789757, "percentage": 40.65, "elapsed_time": "1 day, 5:12:56", "remaining_time": "1 day, 18:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3914, "total_steps": 9627, "loss": 1.6035, "learning_rate": 6.446689687642076e-05, "epoch": 0.4065648696374779, "percentage": 40.66, "elapsed_time": "1 day, 5:13:26", "remaining_time": "1 day, 18:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3915, "total_steps": 9627, "loss": 1.5591, "learning_rate": 6.445127744347748e-05, "epoch": 0.4066687441570583, "percentage": 40.67, "elapsed_time": "1 day, 5:13:54", "remaining_time": "1 day, 18:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3916, "total_steps": 9627, "loss": 1.5891, "learning_rate": 6.443565647158589e-05, "epoch": 0.4067726186766386, "percentage": 40.68, "elapsed_time": "1 day, 5:14:23", "remaining_time": "1 day, 18:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3917, "total_steps": 9627, "loss": 1.8029, "learning_rate": 6.442003396240949e-05, "epoch": 0.406876493196219, "percentage": 40.69, "elapsed_time": "1 day, 5:14:51", "remaining_time": "1 day, 18:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3918, "total_steps": 9627, "loss": 1.8338, "learning_rate": 6.440440991761195e-05, "epoch": 0.4069803677157993, "percentage": 40.7, "elapsed_time": "1 day, 5:15:20", "remaining_time": "1 day, 18:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3919, "total_steps": 9627, "loss": 1.5756, "learning_rate": 6.438878433885711e-05, "epoch": 0.40708424223537965, "percentage": 40.71, "elapsed_time": "1 day, 5:15:49", "remaining_time": "1 day, 18:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3920, "total_steps": 9627, "loss": 1.6578, "learning_rate": 6.437315722780898e-05, "epoch": 0.40718811675496003, "percentage": 40.72, "elapsed_time": "1 day, 5:16:17", "remaining_time": "1 day, 18:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3921, "total_steps": 9627, "loss": 1.7394, "learning_rate": 6.435752858613171e-05, "epoch": 0.40729199127454035, "percentage": 40.73, "elapsed_time": "1 day, 5:16:46", "remaining_time": "1 day, 18:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3922, "total_steps": 9627, "loss": 1.7368, "learning_rate": 6.434189841548965e-05, "epoch": 0.4073958657941207, "percentage": 40.74, "elapsed_time": "1 day, 5:17:14", "remaining_time": "1 day, 18:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3923, "total_steps": 9627, "loss": 1.6122, "learning_rate": 6.432626671754729e-05, "epoch": 0.40749974031370106, "percentage": 40.75, "elapsed_time": "1 day, 5:17:44", "remaining_time": "1 day, 18:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3924, "total_steps": 9627, "loss": 1.5676, "learning_rate": 6.431063349396926e-05, "epoch": 0.4076036148332814, "percentage": 40.76, "elapsed_time": "1 day, 5:18:13", "remaining_time": "1 day, 18:35:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3925, "total_steps": 9627, "loss": 1.5929, "learning_rate": 6.429499874642038e-05, "epoch": 0.4077074893528617, "percentage": 40.77, "elapsed_time": "1 day, 5:18:41", "remaining_time": "1 day, 18:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3926, "total_steps": 9627, "loss": 1.4869, "learning_rate": 6.427936247656565e-05, "epoch": 0.4078113638724421, "percentage": 40.78, "elapsed_time": "1 day, 5:19:09", "remaining_time": "1 day, 18:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3927, "total_steps": 9627, "loss": 1.6425, "learning_rate": 6.42637246860702e-05, "epoch": 0.40791523839202243, "percentage": 40.79, "elapsed_time": "1 day, 5:19:39", "remaining_time": "1 day, 18:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3928, "total_steps": 9627, "loss": 1.7858, "learning_rate": 6.424808537659932e-05, "epoch": 0.4080191129116028, "percentage": 40.8, "elapsed_time": "1 day, 5:20:07", "remaining_time": "1 day, 18:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3929, "total_steps": 9627, "loss": 1.7072, "learning_rate": 6.423244454981851e-05, "epoch": 0.40812298743118314, "percentage": 40.81, "elapsed_time": "1 day, 5:20:36", "remaining_time": "1 day, 18:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3930, "total_steps": 9627, "loss": 1.792, "learning_rate": 6.421680220739336e-05, "epoch": 0.40822686195076346, "percentage": 40.82, "elapsed_time": "1 day, 5:21:04", "remaining_time": "1 day, 18:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3931, "total_steps": 9627, "loss": 1.9283, "learning_rate": 6.420115835098967e-05, "epoch": 0.40833073647034385, "percentage": 40.83, "elapsed_time": "1 day, 5:21:33", "remaining_time": "1 day, 18:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3932, "total_steps": 9627, "loss": 1.6607, "learning_rate": 6.418551298227338e-05, "epoch": 0.4084346109899242, "percentage": 40.84, "elapsed_time": "1 day, 5:22:02", "remaining_time": "1 day, 18:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3933, "total_steps": 9627, "loss": 1.7383, "learning_rate": 6.416986610291064e-05, "epoch": 0.4085384855095045, "percentage": 40.85, "elapsed_time": "1 day, 5:22:31", "remaining_time": "1 day, 18:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3934, "total_steps": 9627, "loss": 1.5812, "learning_rate": 6.415421771456766e-05, "epoch": 0.4086423600290849, "percentage": 40.86, "elapsed_time": "1 day, 5:22:58", "remaining_time": "1 day, 18:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3935, "total_steps": 9627, "loss": 1.7514, "learning_rate": 6.41385678189109e-05, "epoch": 0.4087462345486652, "percentage": 40.87, "elapsed_time": "1 day, 5:23:28", "remaining_time": "1 day, 18:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3936, "total_steps": 9627, "loss": 1.6141, "learning_rate": 6.412291641760697e-05, "epoch": 0.40885010906824554, "percentage": 40.89, "elapsed_time": "1 day, 5:23:56", "remaining_time": "1 day, 18:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3937, "total_steps": 9627, "loss": 1.6868, "learning_rate": 6.410726351232259e-05, "epoch": 0.4089539835878259, "percentage": 40.9, "elapsed_time": "1 day, 5:24:25", "remaining_time": "1 day, 18:30:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3938, "total_steps": 9627, "loss": 1.7051, "learning_rate": 6.409160910472469e-05, "epoch": 0.40905785810740625, "percentage": 40.91, "elapsed_time": "1 day, 5:24:54", "remaining_time": "1 day, 18:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3939, "total_steps": 9627, "loss": 1.7432, "learning_rate": 6.407595319648034e-05, "epoch": 0.4091617326269866, "percentage": 40.92, "elapsed_time": "1 day, 5:25:22", "remaining_time": "1 day, 18:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3940, "total_steps": 9627, "loss": 1.6319, "learning_rate": 6.406029578925677e-05, "epoch": 0.40926560714656696, "percentage": 40.93, "elapsed_time": "1 day, 5:25:52", "remaining_time": "1 day, 18:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3941, "total_steps": 9627, "loss": 1.6741, "learning_rate": 6.404463688472138e-05, "epoch": 0.4093694816661473, "percentage": 40.94, "elapsed_time": "1 day, 5:26:19", "remaining_time": "1 day, 18:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3942, "total_steps": 9627, "loss": 1.6135, "learning_rate": 6.402897648454171e-05, "epoch": 0.40947335618572767, "percentage": 40.95, "elapsed_time": "1 day, 5:26:49", "remaining_time": "1 day, 18:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3943, "total_steps": 9627, "loss": 1.6742, "learning_rate": 6.401331459038546e-05, "epoch": 0.409577230705308, "percentage": 40.96, "elapsed_time": "1 day, 5:27:17", "remaining_time": "1 day, 18:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3944, "total_steps": 9627, "loss": 1.7462, "learning_rate": 6.399765120392054e-05, "epoch": 0.4096811052248883, "percentage": 40.97, "elapsed_time": "1 day, 5:27:46", "remaining_time": "1 day, 18:27:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3945, "total_steps": 9627, "loss": 1.6549, "learning_rate": 6.398198632681494e-05, "epoch": 0.4097849797444687, "percentage": 40.98, "elapsed_time": "1 day, 5:28:15", "remaining_time": "1 day, 18:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3946, "total_steps": 9627, "loss": 1.5801, "learning_rate": 6.396631996073686e-05, "epoch": 0.40988885426404903, "percentage": 40.99, "elapsed_time": "1 day, 5:28:43", "remaining_time": "1 day, 18:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3947, "total_steps": 9627, "loss": 1.6841, "learning_rate": 6.395065210735464e-05, "epoch": 0.40999272878362936, "percentage": 41.0, "elapsed_time": "1 day, 5:29:12", "remaining_time": "1 day, 18:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3948, "total_steps": 9627, "loss": 1.8659, "learning_rate": 6.39349827683368e-05, "epoch": 0.41009660330320974, "percentage": 41.01, "elapsed_time": "1 day, 5:29:40", "remaining_time": "1 day, 18:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3949, "total_steps": 9627, "loss": 1.82, "learning_rate": 6.391931194535199e-05, "epoch": 0.41020047782279007, "percentage": 41.02, "elapsed_time": "1 day, 5:30:09", "remaining_time": "1 day, 18:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3950, "total_steps": 9627, "loss": 1.5473, "learning_rate": 6.390363964006903e-05, "epoch": 0.4103043523423704, "percentage": 41.03, "elapsed_time": "1 day, 5:30:37", "remaining_time": "1 day, 18:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3951, "total_steps": 9627, "loss": 1.554, "learning_rate": 6.38879658541569e-05, "epoch": 0.4104082268619508, "percentage": 41.04, "elapsed_time": "1 day, 5:31:07", "remaining_time": "1 day, 18:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3952, "total_steps": 9627, "loss": 1.6563, "learning_rate": 6.387229058928475e-05, "epoch": 0.4105121013815311, "percentage": 41.05, "elapsed_time": "1 day, 5:31:34", "remaining_time": "1 day, 18:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3953, "total_steps": 9627, "loss": 1.6243, "learning_rate": 6.385661384712185e-05, "epoch": 0.41061597590111143, "percentage": 41.06, "elapsed_time": "1 day, 5:32:04", "remaining_time": "1 day, 18:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3954, "total_steps": 9627, "loss": 1.6521, "learning_rate": 6.384093562933765e-05, "epoch": 0.4107198504206918, "percentage": 41.07, "elapsed_time": "1 day, 5:32:32", "remaining_time": "1 day, 18:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3955, "total_steps": 9627, "loss": 1.7887, "learning_rate": 6.382525593760178e-05, "epoch": 0.41082372494027214, "percentage": 41.08, "elapsed_time": "1 day, 5:33:00", "remaining_time": "1 day, 18:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3956, "total_steps": 9627, "loss": 1.8647, "learning_rate": 6.380957477358399e-05, "epoch": 0.4109275994598525, "percentage": 41.09, "elapsed_time": "1 day, 5:33:30", "remaining_time": "1 day, 18:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3957, "total_steps": 9627, "loss": 1.8746, "learning_rate": 6.379389213895421e-05, "epoch": 0.41103147397943285, "percentage": 41.1, "elapsed_time": "1 day, 5:33:57", "remaining_time": "1 day, 18:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3958, "total_steps": 9627, "loss": 1.6782, "learning_rate": 6.377820803538253e-05, "epoch": 0.4111353484990132, "percentage": 41.11, "elapsed_time": "1 day, 5:34:27", "remaining_time": "1 day, 18:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3959, "total_steps": 9627, "loss": 1.7188, "learning_rate": 6.376252246453914e-05, "epoch": 0.41123922301859356, "percentage": 41.12, "elapsed_time": "1 day, 5:34:56", "remaining_time": "1 day, 18:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3960, "total_steps": 9627, "loss": 1.8221, "learning_rate": 6.374683542809447e-05, "epoch": 0.4113430975381739, "percentage": 41.13, "elapsed_time": "1 day, 5:35:25", "remaining_time": "1 day, 18:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3961, "total_steps": 9627, "loss": 1.7294, "learning_rate": 6.373114692771906e-05, "epoch": 0.4114469720577542, "percentage": 41.14, "elapsed_time": "1 day, 5:35:53", "remaining_time": "1 day, 18:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3962, "total_steps": 9627, "loss": 1.708, "learning_rate": 6.371545696508358e-05, "epoch": 0.4115508465773346, "percentage": 41.16, "elapsed_time": "1 day, 5:36:21", "remaining_time": "1 day, 18:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3963, "total_steps": 9627, "loss": 1.8057, "learning_rate": 6.369976554185896e-05, "epoch": 0.4116547210969149, "percentage": 41.17, "elapsed_time": "1 day, 5:36:50", "remaining_time": "1 day, 18:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3964, "total_steps": 9627, "loss": 1.6913, "learning_rate": 6.368407265971616e-05, "epoch": 0.41175859561649525, "percentage": 41.18, "elapsed_time": "1 day, 5:37:19", "remaining_time": "1 day, 18:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3965, "total_steps": 9627, "loss": 1.8158, "learning_rate": 6.366837832032635e-05, "epoch": 0.41186247013607563, "percentage": 41.19, "elapsed_time": "1 day, 5:37:47", "remaining_time": "1 day, 18:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3966, "total_steps": 9627, "loss": 1.5065, "learning_rate": 6.365268252536087e-05, "epoch": 0.41196634465565596, "percentage": 41.2, "elapsed_time": "1 day, 5:38:17", "remaining_time": "1 day, 18:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3967, "total_steps": 9627, "loss": 1.672, "learning_rate": 6.36369852764912e-05, "epoch": 0.41207021917523634, "percentage": 41.21, "elapsed_time": "1 day, 5:38:45", "remaining_time": "1 day, 18:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3968, "total_steps": 9627, "loss": 1.8548, "learning_rate": 6.362128657538897e-05, "epoch": 0.41217409369481667, "percentage": 41.22, "elapsed_time": "1 day, 5:39:13", "remaining_time": "1 day, 18:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3969, "total_steps": 9627, "loss": 1.8469, "learning_rate": 6.360558642372597e-05, "epoch": 0.412277968214397, "percentage": 41.23, "elapsed_time": "1 day, 5:39:43", "remaining_time": "1 day, 18:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3970, "total_steps": 9627, "loss": 1.6893, "learning_rate": 6.358988482317414e-05, "epoch": 0.4123818427339774, "percentage": 41.24, "elapsed_time": "1 day, 5:40:11", "remaining_time": "1 day, 18:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3971, "total_steps": 9627, "loss": 1.5002, "learning_rate": 6.357418177540558e-05, "epoch": 0.4124857172535577, "percentage": 41.25, "elapsed_time": "1 day, 5:40:39", "remaining_time": "1 day, 18:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3972, "total_steps": 9627, "loss": 1.817, "learning_rate": 6.355847728209257e-05, "epoch": 0.41258959177313803, "percentage": 41.26, "elapsed_time": "1 day, 5:41:09", "remaining_time": "1 day, 18:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3973, "total_steps": 9627, "loss": 1.7698, "learning_rate": 6.354277134490746e-05, "epoch": 0.4126934662927184, "percentage": 41.27, "elapsed_time": "1 day, 5:41:37", "remaining_time": "1 day, 18:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3974, "total_steps": 9627, "loss": 1.4967, "learning_rate": 6.352706396552285e-05, "epoch": 0.41279734081229874, "percentage": 41.28, "elapsed_time": "1 day, 5:42:07", "remaining_time": "1 day, 18:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3975, "total_steps": 9627, "loss": 1.6282, "learning_rate": 6.351135514561144e-05, "epoch": 0.41290121533187907, "percentage": 41.29, "elapsed_time": "1 day, 5:42:35", "remaining_time": "1 day, 18:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3976, "total_steps": 9627, "loss": 1.637, "learning_rate": 6.34956448868461e-05, "epoch": 0.41300508985145945, "percentage": 41.3, "elapsed_time": "1 day, 5:43:04", "remaining_time": "1 day, 18:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3977, "total_steps": 9627, "loss": 1.9794, "learning_rate": 6.347993319089985e-05, "epoch": 0.4131089643710398, "percentage": 41.31, "elapsed_time": "1 day, 5:43:32", "remaining_time": "1 day, 18:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3978, "total_steps": 9627, "loss": 1.8328, "learning_rate": 6.346422005944586e-05, "epoch": 0.4132128388906201, "percentage": 41.32, "elapsed_time": "1 day, 5:44:01", "remaining_time": "1 day, 18:13:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3979, "total_steps": 9627, "loss": 1.7727, "learning_rate": 6.344850549415746e-05, "epoch": 0.4133167134102005, "percentage": 41.33, "elapsed_time": "1 day, 5:44:30", "remaining_time": "1 day, 18:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3980, "total_steps": 9627, "loss": 1.6293, "learning_rate": 6.343278949670812e-05, "epoch": 0.4134205879297808, "percentage": 41.34, "elapsed_time": "1 day, 5:44:58", "remaining_time": "1 day, 18:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3981, "total_steps": 9627, "loss": 1.8089, "learning_rate": 6.341707206877149e-05, "epoch": 0.4135244624493612, "percentage": 41.35, "elapsed_time": "1 day, 5:45:27", "remaining_time": "1 day, 18:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3982, "total_steps": 9627, "loss": 1.793, "learning_rate": 6.340135321202134e-05, "epoch": 0.4136283369689415, "percentage": 41.36, "elapsed_time": "1 day, 5:45:57", "remaining_time": "1 day, 18:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3983, "total_steps": 9627, "loss": 1.8366, "learning_rate": 6.33856329281316e-05, "epoch": 0.41373221148852185, "percentage": 41.37, "elapsed_time": "1 day, 5:46:25", "remaining_time": "1 day, 18:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3984, "total_steps": 9627, "loss": 1.7176, "learning_rate": 6.336991121877637e-05, "epoch": 0.41383608600810223, "percentage": 41.38, "elapsed_time": "1 day, 5:46:55", "remaining_time": "1 day, 18:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3985, "total_steps": 9627, "loss": 1.8262, "learning_rate": 6.335418808562988e-05, "epoch": 0.41393996052768256, "percentage": 41.39, "elapsed_time": "1 day, 5:47:23", "remaining_time": "1 day, 18:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3986, "total_steps": 9627, "loss": 1.8285, "learning_rate": 6.333846353036654e-05, "epoch": 0.4140438350472629, "percentage": 41.4, "elapsed_time": "1 day, 5:47:52", "remaining_time": "1 day, 18:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3987, "total_steps": 9627, "loss": 1.709, "learning_rate": 6.332273755466087e-05, "epoch": 0.41414770956684327, "percentage": 41.41, "elapsed_time": "1 day, 5:48:21", "remaining_time": "1 day, 18:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3988, "total_steps": 9627, "loss": 1.7283, "learning_rate": 6.330701016018757e-05, "epoch": 0.4142515840864236, "percentage": 41.43, "elapsed_time": "1 day, 5:48:49", "remaining_time": "1 day, 18:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3989, "total_steps": 9627, "loss": 1.7227, "learning_rate": 6.329128134862148e-05, "epoch": 0.4143554586060039, "percentage": 41.44, "elapsed_time": "1 day, 5:49:19", "remaining_time": "1 day, 18:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3990, "total_steps": 9627, "loss": 1.7244, "learning_rate": 6.32755511216376e-05, "epoch": 0.4144593331255843, "percentage": 41.45, "elapsed_time": "1 day, 5:49:47", "remaining_time": "1 day, 18:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3991, "total_steps": 9627, "loss": 1.6718, "learning_rate": 6.32598194809111e-05, "epoch": 0.41456320764516463, "percentage": 41.46, "elapsed_time": "1 day, 5:50:17", "remaining_time": "1 day, 18:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3992, "total_steps": 9627, "loss": 1.584, "learning_rate": 6.324408642811726e-05, "epoch": 0.414667082164745, "percentage": 41.47, "elapsed_time": "1 day, 5:50:45", "remaining_time": "1 day, 18:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3993, "total_steps": 9627, "loss": 1.5411, "learning_rate": 6.32283519649315e-05, "epoch": 0.41477095668432534, "percentage": 41.48, "elapsed_time": "1 day, 5:51:15", "remaining_time": "1 day, 18:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3994, "total_steps": 9627, "loss": 1.8188, "learning_rate": 6.321261609302945e-05, "epoch": 0.41487483120390567, "percentage": 41.49, "elapsed_time": "1 day, 5:51:43", "remaining_time": "1 day, 18:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3995, "total_steps": 9627, "loss": 1.6147, "learning_rate": 6.319687881408683e-05, "epoch": 0.41497870572348605, "percentage": 41.5, "elapsed_time": "1 day, 5:52:12", "remaining_time": "1 day, 18:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3996, "total_steps": 9627, "loss": 1.917, "learning_rate": 6.318114012977958e-05, "epoch": 0.4150825802430664, "percentage": 41.51, "elapsed_time": "1 day, 5:52:40", "remaining_time": "1 day, 18:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3997, "total_steps": 9627, "loss": 1.7175, "learning_rate": 6.316540004178371e-05, "epoch": 0.4151864547626467, "percentage": 41.52, "elapsed_time": "1 day, 5:53:10", "remaining_time": "1 day, 18:05:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3998, "total_steps": 9627, "loss": 1.6544, "learning_rate": 6.314965855177544e-05, "epoch": 0.4152903292822271, "percentage": 41.53, "elapsed_time": "1 day, 5:53:38", "remaining_time": "1 day, 18:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3999, "total_steps": 9627, "loss": 1.4105, "learning_rate": 6.31339156614311e-05, "epoch": 0.4153942038018074, "percentage": 41.54, "elapsed_time": "1 day, 5:54:08", "remaining_time": "1 day, 18:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 9627, "loss": 1.7974, "learning_rate": 6.311817137242721e-05, "epoch": 0.41549807832138774, "percentage": 41.55, "elapsed_time": "1 day, 5:54:36", "remaining_time": "1 day, 18:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4001, "total_steps": 9627, "loss": 1.5556, "learning_rate": 6.310242568644035e-05, "epoch": 0.4156019528409681, "percentage": 41.56, "elapsed_time": "1 day, 5:55:06", "remaining_time": "1 day, 18:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4002, "total_steps": 9627, "loss": 1.6694, "learning_rate": 6.30866786051474e-05, "epoch": 0.41570582736054845, "percentage": 41.57, "elapsed_time": "1 day, 5:55:35", "remaining_time": "1 day, 18:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4003, "total_steps": 9627, "loss": 1.5479, "learning_rate": 6.307093013022525e-05, "epoch": 0.4158097018801288, "percentage": 41.58, "elapsed_time": "1 day, 5:56:04", "remaining_time": "1 day, 18:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4004, "total_steps": 9627, "loss": 1.6548, "learning_rate": 6.305518026335097e-05, "epoch": 0.41591357639970916, "percentage": 41.59, "elapsed_time": "1 day, 5:56:33", "remaining_time": "1 day, 18:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4005, "total_steps": 9627, "loss": 1.5989, "learning_rate": 6.303942900620185e-05, "epoch": 0.4160174509192895, "percentage": 41.6, "elapsed_time": "1 day, 5:57:01", "remaining_time": "1 day, 18:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4006, "total_steps": 9627, "loss": 1.6618, "learning_rate": 6.302367636045526e-05, "epoch": 0.41612132543886987, "percentage": 41.61, "elapsed_time": "1 day, 5:57:31", "remaining_time": "1 day, 18:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4007, "total_steps": 9627, "loss": 1.5055, "learning_rate": 6.300792232778872e-05, "epoch": 0.4162251999584502, "percentage": 41.62, "elapsed_time": "1 day, 5:57:59", "remaining_time": "1 day, 18:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4008, "total_steps": 9627, "loss": 1.9369, "learning_rate": 6.29921669098799e-05, "epoch": 0.4163290744780305, "percentage": 41.63, "elapsed_time": "1 day, 5:58:28", "remaining_time": "1 day, 18:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4009, "total_steps": 9627, "loss": 1.6275, "learning_rate": 6.297641010840665e-05, "epoch": 0.4164329489976109, "percentage": 41.64, "elapsed_time": "1 day, 5:58:57", "remaining_time": "1 day, 18:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4010, "total_steps": 9627, "loss": 1.8641, "learning_rate": 6.296065192504697e-05, "epoch": 0.41653682351719123, "percentage": 41.65, "elapsed_time": "1 day, 5:59:25", "remaining_time": "1 day, 18:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4011, "total_steps": 9627, "loss": 1.7272, "learning_rate": 6.294489236147894e-05, "epoch": 0.41664069803677156, "percentage": 41.66, "elapsed_time": "1 day, 5:59:56", "remaining_time": "1 day, 18:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4012, "total_steps": 9627, "loss": 1.683, "learning_rate": 6.292913141938084e-05, "epoch": 0.41674457255635194, "percentage": 41.67, "elapsed_time": "1 day, 6:00:23", "remaining_time": "1 day, 17:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4013, "total_steps": 9627, "loss": 1.6662, "learning_rate": 6.29133691004311e-05, "epoch": 0.41684844707593227, "percentage": 41.68, "elapsed_time": "1 day, 6:00:53", "remaining_time": "1 day, 17:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4014, "total_steps": 9627, "loss": 1.6862, "learning_rate": 6.289760540630829e-05, "epoch": 0.4169523215955126, "percentage": 41.7, "elapsed_time": "1 day, 6:01:21", "remaining_time": "1 day, 17:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4015, "total_steps": 9627, "loss": 1.7041, "learning_rate": 6.288184033869109e-05, "epoch": 0.417056196115093, "percentage": 41.71, "elapsed_time": "1 day, 6:01:50", "remaining_time": "1 day, 17:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4016, "total_steps": 9627, "loss": 1.7689, "learning_rate": 6.28660738992584e-05, "epoch": 0.4171600706346733, "percentage": 41.72, "elapsed_time": "1 day, 6:02:18", "remaining_time": "1 day, 17:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4017, "total_steps": 9627, "loss": 1.7707, "learning_rate": 6.285030608968918e-05, "epoch": 0.41726394515425363, "percentage": 41.73, "elapsed_time": "1 day, 6:02:47", "remaining_time": "1 day, 17:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4018, "total_steps": 9627, "loss": 1.5884, "learning_rate": 6.28345369116626e-05, "epoch": 0.417367819673834, "percentage": 41.74, "elapsed_time": "1 day, 6:03:16", "remaining_time": "1 day, 17:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4019, "total_steps": 9627, "loss": 1.6574, "learning_rate": 6.281876636685795e-05, "epoch": 0.41747169419341434, "percentage": 41.75, "elapsed_time": "1 day, 6:03:45", "remaining_time": "1 day, 17:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4020, "total_steps": 9627, "loss": 1.8304, "learning_rate": 6.280299445695469e-05, "epoch": 0.4175755687129947, "percentage": 41.76, "elapsed_time": "1 day, 6:04:14", "remaining_time": "1 day, 17:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4021, "total_steps": 9627, "loss": 1.5268, "learning_rate": 6.278722118363237e-05, "epoch": 0.41767944323257505, "percentage": 41.77, "elapsed_time": "1 day, 6:04:42", "remaining_time": "1 day, 17:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4022, "total_steps": 9627, "loss": 1.8324, "learning_rate": 6.277144654857074e-05, "epoch": 0.4177833177521554, "percentage": 41.78, "elapsed_time": "1 day, 6:05:10", "remaining_time": "1 day, 17:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4023, "total_steps": 9627, "loss": 1.6818, "learning_rate": 6.275567055344967e-05, "epoch": 0.41788719227173576, "percentage": 41.79, "elapsed_time": "1 day, 6:05:40", "remaining_time": "1 day, 17:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4024, "total_steps": 9627, "loss": 1.8911, "learning_rate": 6.27398931999492e-05, "epoch": 0.4179910667913161, "percentage": 41.8, "elapsed_time": "1 day, 6:06:08", "remaining_time": "1 day, 17:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4025, "total_steps": 9627, "loss": 1.7229, "learning_rate": 6.272411448974947e-05, "epoch": 0.4180949413108964, "percentage": 41.81, "elapsed_time": "1 day, 6:06:37", "remaining_time": "1 day, 17:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4026, "total_steps": 9627, "loss": 1.664, "learning_rate": 6.270833442453079e-05, "epoch": 0.4181988158304768, "percentage": 41.82, "elapsed_time": "1 day, 6:07:05", "remaining_time": "1 day, 17:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4027, "total_steps": 9627, "loss": 1.6161, "learning_rate": 6.269255300597364e-05, "epoch": 0.4183026903500571, "percentage": 41.83, "elapsed_time": "1 day, 6:07:34", "remaining_time": "1 day, 17:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4028, "total_steps": 9627, "loss": 1.7089, "learning_rate": 6.267677023575859e-05, "epoch": 0.41840656486963745, "percentage": 41.84, "elapsed_time": "1 day, 6:08:04", "remaining_time": "1 day, 17:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4029, "total_steps": 9627, "loss": 1.6041, "learning_rate": 6.26609861155664e-05, "epoch": 0.41851043938921784, "percentage": 41.85, "elapsed_time": "1 day, 6:08:33", "remaining_time": "1 day, 17:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4030, "total_steps": 9627, "loss": 1.7304, "learning_rate": 6.264520064707795e-05, "epoch": 0.41861431390879816, "percentage": 41.86, "elapsed_time": "1 day, 6:09:01", "remaining_time": "1 day, 17:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4031, "total_steps": 9627, "loss": 1.813, "learning_rate": 6.262941383197425e-05, "epoch": 0.41871818842837855, "percentage": 41.87, "elapsed_time": "1 day, 6:09:30", "remaining_time": "1 day, 17:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4032, "total_steps": 9627, "loss": 1.8182, "learning_rate": 6.261362567193651e-05, "epoch": 0.4188220629479589, "percentage": 41.88, "elapsed_time": "1 day, 6:09:58", "remaining_time": "1 day, 17:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4033, "total_steps": 9627, "loss": 1.733, "learning_rate": 6.259783616864601e-05, "epoch": 0.4189259374675392, "percentage": 41.89, "elapsed_time": "1 day, 6:10:27", "remaining_time": "1 day, 17:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4034, "total_steps": 9627, "loss": 1.8581, "learning_rate": 6.258204532378423e-05, "epoch": 0.4190298119871196, "percentage": 41.9, "elapsed_time": "1 day, 6:10:56", "remaining_time": "1 day, 17:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4035, "total_steps": 9627, "loss": 1.6578, "learning_rate": 6.256625313903278e-05, "epoch": 0.4191336865066999, "percentage": 41.91, "elapsed_time": "1 day, 6:11:25", "remaining_time": "1 day, 17:50:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4036, "total_steps": 9627, "loss": 1.7315, "learning_rate": 6.255045961607338e-05, "epoch": 0.41923756102628024, "percentage": 41.92, "elapsed_time": "1 day, 6:11:54", "remaining_time": "1 day, 17:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4037, "total_steps": 9627, "loss": 1.5881, "learning_rate": 6.253466475658792e-05, "epoch": 0.4193414355458606, "percentage": 41.93, "elapsed_time": "1 day, 6:12:22", "remaining_time": "1 day, 17:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4038, "total_steps": 9627, "loss": 1.719, "learning_rate": 6.251886856225844e-05, "epoch": 0.41944531006544095, "percentage": 41.94, "elapsed_time": "1 day, 6:12:52", "remaining_time": "1 day, 17:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4039, "total_steps": 9627, "loss": 1.6688, "learning_rate": 6.250307103476712e-05, "epoch": 0.4195491845850213, "percentage": 41.95, "elapsed_time": "1 day, 6:13:20", "remaining_time": "1 day, 17:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4040, "total_steps": 9627, "loss": 1.7883, "learning_rate": 6.248727217579625e-05, "epoch": 0.41965305910460166, "percentage": 41.97, "elapsed_time": "1 day, 6:13:49", "remaining_time": "1 day, 17:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4041, "total_steps": 9627, "loss": 1.8919, "learning_rate": 6.247147198702832e-05, "epoch": 0.419756933624182, "percentage": 41.98, "elapsed_time": "1 day, 6:14:17", "remaining_time": "1 day, 17:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4042, "total_steps": 9627, "loss": 1.7379, "learning_rate": 6.245567047014589e-05, "epoch": 0.4198608081437623, "percentage": 41.99, "elapsed_time": "1 day, 6:14:46", "remaining_time": "1 day, 17:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4043, "total_steps": 9627, "loss": 1.7343, "learning_rate": 6.243986762683171e-05, "epoch": 0.4199646826633427, "percentage": 42.0, "elapsed_time": "1 day, 6:15:14", "remaining_time": "1 day, 17:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4044, "total_steps": 9627, "loss": 1.8147, "learning_rate": 6.242406345876866e-05, "epoch": 0.420068557182923, "percentage": 42.01, "elapsed_time": "1 day, 6:15:44", "remaining_time": "1 day, 17:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4045, "total_steps": 9627, "loss": 1.6202, "learning_rate": 6.240825796763977e-05, "epoch": 0.4201724317025034, "percentage": 42.02, "elapsed_time": "1 day, 6:16:12", "remaining_time": "1 day, 17:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4046, "total_steps": 9627, "loss": 1.6385, "learning_rate": 6.239245115512818e-05, "epoch": 0.42027630622208373, "percentage": 42.03, "elapsed_time": "1 day, 6:16:41", "remaining_time": "1 day, 17:45:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4047, "total_steps": 9627, "loss": 1.6763, "learning_rate": 6.237664302291722e-05, "epoch": 0.42038018074166406, "percentage": 42.04, "elapsed_time": "1 day, 6:17:09", "remaining_time": "1 day, 17:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4048, "total_steps": 9627, "loss": 1.6527, "learning_rate": 6.236083357269033e-05, "epoch": 0.42048405526124444, "percentage": 42.05, "elapsed_time": "1 day, 6:17:39", "remaining_time": "1 day, 17:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4049, "total_steps": 9627, "loss": 1.7658, "learning_rate": 6.234502280613108e-05, "epoch": 0.42058792978082477, "percentage": 42.06, "elapsed_time": "1 day, 6:18:07", "remaining_time": "1 day, 17:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4050, "total_steps": 9627, "loss": 1.7382, "learning_rate": 6.232921072492318e-05, "epoch": 0.4206918043004051, "percentage": 42.07, "elapsed_time": "1 day, 6:18:37", "remaining_time": "1 day, 17:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4051, "total_steps": 9627, "loss": 1.7945, "learning_rate": 6.23133973307505e-05, "epoch": 0.4207956788199855, "percentage": 42.08, "elapsed_time": "1 day, 6:19:04", "remaining_time": "1 day, 17:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4052, "total_steps": 9627, "loss": 1.8404, "learning_rate": 6.229758262529708e-05, "epoch": 0.4208995533395658, "percentage": 42.09, "elapsed_time": "1 day, 6:19:34", "remaining_time": "1 day, 17:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4053, "total_steps": 9627, "loss": 1.619, "learning_rate": 6.228176661024703e-05, "epoch": 0.42100342785914613, "percentage": 42.1, "elapsed_time": "1 day, 6:20:03", "remaining_time": "1 day, 17:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4054, "total_steps": 9627, "loss": 1.6359, "learning_rate": 6.226594928728462e-05, "epoch": 0.4211073023787265, "percentage": 42.11, "elapsed_time": "1 day, 6:20:31", "remaining_time": "1 day, 17:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4055, "total_steps": 9627, "loss": 1.8973, "learning_rate": 6.225013065809431e-05, "epoch": 0.42121117689830684, "percentage": 42.12, "elapsed_time": "1 day, 6:21:00", "remaining_time": "1 day, 17:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4056, "total_steps": 9627, "loss": 1.6915, "learning_rate": 6.223431072436063e-05, "epoch": 0.42131505141788717, "percentage": 42.13, "elapsed_time": "1 day, 6:21:28", "remaining_time": "1 day, 17:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4057, "total_steps": 9627, "loss": 1.6772, "learning_rate": 6.221848948776828e-05, "epoch": 0.42141892593746755, "percentage": 42.14, "elapsed_time": "1 day, 6:21:58", "remaining_time": "1 day, 17:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4058, "total_steps": 9627, "loss": 1.7213, "learning_rate": 6.220266695000211e-05, "epoch": 0.4215228004570479, "percentage": 42.15, "elapsed_time": "1 day, 6:22:25", "remaining_time": "1 day, 17:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4059, "total_steps": 9627, "loss": 1.9761, "learning_rate": 6.21868431127471e-05, "epoch": 0.42162667497662826, "percentage": 42.16, "elapsed_time": "1 day, 6:22:53", "remaining_time": "1 day, 17:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4060, "total_steps": 9627, "loss": 1.7037, "learning_rate": 6.217101797768837e-05, "epoch": 0.4217305494962086, "percentage": 42.17, "elapsed_time": "1 day, 6:23:24", "remaining_time": "1 day, 17:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4061, "total_steps": 9627, "loss": 1.7218, "learning_rate": 6.215519154651116e-05, "epoch": 0.4218344240157889, "percentage": 42.18, "elapsed_time": "1 day, 6:23:51", "remaining_time": "1 day, 17:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4062, "total_steps": 9627, "loss": 1.7957, "learning_rate": 6.213936382090085e-05, "epoch": 0.4219382985353693, "percentage": 42.19, "elapsed_time": "1 day, 6:24:21", "remaining_time": "1 day, 17:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4063, "total_steps": 9627, "loss": 1.7508, "learning_rate": 6.2123534802543e-05, "epoch": 0.4220421730549496, "percentage": 42.2, "elapsed_time": "1 day, 6:24:49", "remaining_time": "1 day, 17:38:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4064, "total_steps": 9627, "loss": 1.6243, "learning_rate": 6.210770449312326e-05, "epoch": 0.42214604757452995, "percentage": 42.21, "elapsed_time": "1 day, 6:25:19", "remaining_time": "1 day, 17:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4065, "total_steps": 9627, "loss": 1.8161, "learning_rate": 6.209187289432742e-05, "epoch": 0.42224992209411033, "percentage": 42.22, "elapsed_time": "1 day, 6:25:47", "remaining_time": "1 day, 17:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4066, "total_steps": 9627, "loss": 1.6786, "learning_rate": 6.207604000784143e-05, "epoch": 0.42235379661369066, "percentage": 42.24, "elapsed_time": "1 day, 6:26:16", "remaining_time": "1 day, 17:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4067, "total_steps": 9627, "loss": 1.7703, "learning_rate": 6.206020583535141e-05, "epoch": 0.422457671133271, "percentage": 42.25, "elapsed_time": "1 day, 6:26:44", "remaining_time": "1 day, 17:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4068, "total_steps": 9627, "loss": 1.8734, "learning_rate": 6.204437037854351e-05, "epoch": 0.42256154565285137, "percentage": 42.26, "elapsed_time": "1 day, 6:27:13", "remaining_time": "1 day, 17:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4069, "total_steps": 9627, "loss": 1.7048, "learning_rate": 6.202853363910413e-05, "epoch": 0.4226654201724317, "percentage": 42.27, "elapsed_time": "1 day, 6:27:41", "remaining_time": "1 day, 17:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4070, "total_steps": 9627, "loss": 1.6683, "learning_rate": 6.201269561871975e-05, "epoch": 0.4227692946920121, "percentage": 42.28, "elapsed_time": "1 day, 6:28:10", "remaining_time": "1 day, 17:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4071, "total_steps": 9627, "loss": 1.6983, "learning_rate": 6.199685631907697e-05, "epoch": 0.4228731692115924, "percentage": 42.29, "elapsed_time": "1 day, 6:28:40", "remaining_time": "1 day, 17:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4072, "total_steps": 9627, "loss": 1.6345, "learning_rate": 6.19810157418626e-05, "epoch": 0.42297704373117273, "percentage": 42.3, "elapsed_time": "1 day, 6:29:08", "remaining_time": "1 day, 17:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4073, "total_steps": 9627, "loss": 1.6669, "learning_rate": 6.196517388876348e-05, "epoch": 0.4230809182507531, "percentage": 42.31, "elapsed_time": "1 day, 6:29:37", "remaining_time": "1 day, 17:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4074, "total_steps": 9627, "loss": 1.5462, "learning_rate": 6.194933076146668e-05, "epoch": 0.42318479277033344, "percentage": 42.32, "elapsed_time": "1 day, 6:30:06", "remaining_time": "1 day, 17:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4075, "total_steps": 9627, "loss": 1.8317, "learning_rate": 6.193348636165937e-05, "epoch": 0.42328866728991377, "percentage": 42.33, "elapsed_time": "1 day, 6:30:34", "remaining_time": "1 day, 17:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4076, "total_steps": 9627, "loss": 1.8396, "learning_rate": 6.191764069102883e-05, "epoch": 0.42339254180949415, "percentage": 42.34, "elapsed_time": "1 day, 6:31:02", "remaining_time": "1 day, 17:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4077, "total_steps": 9627, "loss": 1.7317, "learning_rate": 6.190179375126254e-05, "epoch": 0.4234964163290745, "percentage": 42.35, "elapsed_time": "1 day, 6:31:31", "remaining_time": "1 day, 17:33:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4078, "total_steps": 9627, "loss": 1.6922, "learning_rate": 6.188594554404804e-05, "epoch": 0.4236002908486548, "percentage": 42.36, "elapsed_time": "1 day, 6:32:00", "remaining_time": "1 day, 17:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4079, "total_steps": 9627, "loss": 1.7322, "learning_rate": 6.187009607107304e-05, "epoch": 0.4237041653682352, "percentage": 42.37, "elapsed_time": "1 day, 6:32:29", "remaining_time": "1 day, 17:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4080, "total_steps": 9627, "loss": 1.8053, "learning_rate": 6.185424533402543e-05, "epoch": 0.4238080398878155, "percentage": 42.38, "elapsed_time": "1 day, 6:32:57", "remaining_time": "1 day, 17:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4081, "total_steps": 9627, "loss": 1.6599, "learning_rate": 6.183839333459315e-05, "epoch": 0.42391191440739584, "percentage": 42.39, "elapsed_time": "1 day, 6:33:26", "remaining_time": "1 day, 17:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4082, "total_steps": 9627, "loss": 1.7394, "learning_rate": 6.18225400744643e-05, "epoch": 0.4240157889269762, "percentage": 42.4, "elapsed_time": "1 day, 6:33:55", "remaining_time": "1 day, 17:31:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4083, "total_steps": 9627, "loss": 1.5259, "learning_rate": 6.180668555532719e-05, "epoch": 0.42411966344655655, "percentage": 42.41, "elapsed_time": "1 day, 6:34:24", "remaining_time": "1 day, 17:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4084, "total_steps": 9627, "loss": 1.6746, "learning_rate": 6.179082977887013e-05, "epoch": 0.42422353796613693, "percentage": 42.42, "elapsed_time": "1 day, 6:34:52", "remaining_time": "1 day, 17:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4085, "total_steps": 9627, "loss": 1.6812, "learning_rate": 6.177497274678168e-05, "epoch": 0.42432741248571726, "percentage": 42.43, "elapsed_time": "1 day, 6:35:22", "remaining_time": "1 day, 17:29:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4086, "total_steps": 9627, "loss": 1.6457, "learning_rate": 6.175911446075049e-05, "epoch": 0.4244312870052976, "percentage": 42.44, "elapsed_time": "1 day, 6:35:50", "remaining_time": "1 day, 17:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4087, "total_steps": 9627, "loss": 1.7168, "learning_rate": 6.174325492246531e-05, "epoch": 0.42453516152487797, "percentage": 42.45, "elapsed_time": "1 day, 6:36:19", "remaining_time": "1 day, 17:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4088, "total_steps": 9627, "loss": 1.7847, "learning_rate": 6.17273941336151e-05, "epoch": 0.4246390360444583, "percentage": 42.46, "elapsed_time": "1 day, 6:36:48", "remaining_time": "1 day, 17:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4089, "total_steps": 9627, "loss": 1.951, "learning_rate": 6.171153209588891e-05, "epoch": 0.4247429105640386, "percentage": 42.47, "elapsed_time": "1 day, 6:37:16", "remaining_time": "1 day, 17:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4090, "total_steps": 9627, "loss": 1.4734, "learning_rate": 6.169566881097588e-05, "epoch": 0.424846785083619, "percentage": 42.48, "elapsed_time": "1 day, 6:37:44", "remaining_time": "1 day, 17:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4091, "total_steps": 9627, "loss": 1.5504, "learning_rate": 6.167980428056537e-05, "epoch": 0.42495065960319933, "percentage": 42.5, "elapsed_time": "1 day, 6:38:14", "remaining_time": "1 day, 17:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4092, "total_steps": 9627, "loss": 1.8144, "learning_rate": 6.16639385063468e-05, "epoch": 0.42505453412277966, "percentage": 42.51, "elapsed_time": "1 day, 6:38:42", "remaining_time": "1 day, 17:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4093, "total_steps": 9627, "loss": 1.5118, "learning_rate": 6.164807149000974e-05, "epoch": 0.42515840864236004, "percentage": 42.52, "elapsed_time": "1 day, 6:39:11", "remaining_time": "1 day, 17:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4094, "total_steps": 9627, "loss": 1.8641, "learning_rate": 6.163220323324395e-05, "epoch": 0.42526228316194037, "percentage": 42.53, "elapsed_time": "1 day, 6:39:38", "remaining_time": "1 day, 17:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4095, "total_steps": 9627, "loss": 1.7244, "learning_rate": 6.161633373773925e-05, "epoch": 0.4253661576815207, "percentage": 42.54, "elapsed_time": "1 day, 6:40:08", "remaining_time": "1 day, 17:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4096, "total_steps": 9627, "loss": 1.8696, "learning_rate": 6.16004630051856e-05, "epoch": 0.4254700322011011, "percentage": 42.55, "elapsed_time": "1 day, 6:40:37", "remaining_time": "1 day, 17:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4097, "total_steps": 9627, "loss": 1.7826, "learning_rate": 6.158459103727316e-05, "epoch": 0.4255739067206814, "percentage": 42.56, "elapsed_time": "1 day, 6:41:05", "remaining_time": "1 day, 17:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4098, "total_steps": 9627, "loss": 1.6452, "learning_rate": 6.15687178356921e-05, "epoch": 0.4256777812402618, "percentage": 42.57, "elapsed_time": "1 day, 6:41:34", "remaining_time": "1 day, 17:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4099, "total_steps": 9627, "loss": 1.6827, "learning_rate": 6.155284340213285e-05, "epoch": 0.4257816557598421, "percentage": 42.58, "elapsed_time": "1 day, 6:42:03", "remaining_time": "1 day, 17:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4100, "total_steps": 9627, "loss": 1.9042, "learning_rate": 6.15369677382859e-05, "epoch": 0.42588553027942244, "percentage": 42.59, "elapsed_time": "1 day, 6:42:32", "remaining_time": "1 day, 17:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4101, "total_steps": 9627, "loss": 1.643, "learning_rate": 6.152109084584186e-05, "epoch": 0.4259894047990028, "percentage": 42.6, "elapsed_time": "1 day, 6:43:00", "remaining_time": "1 day, 17:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4102, "total_steps": 9627, "loss": 1.5454, "learning_rate": 6.150521272649152e-05, "epoch": 0.42609327931858315, "percentage": 42.61, "elapsed_time": "1 day, 6:43:29", "remaining_time": "1 day, 17:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4103, "total_steps": 9627, "loss": 1.6159, "learning_rate": 6.148933338192578e-05, "epoch": 0.4261971538381635, "percentage": 42.62, "elapsed_time": "1 day, 6:43:58", "remaining_time": "1 day, 17:22:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4104, "total_steps": 9627, "loss": 1.8407, "learning_rate": 6.147345281383565e-05, "epoch": 0.42630102835774386, "percentage": 42.63, "elapsed_time": "1 day, 6:44:26", "remaining_time": "1 day, 17:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4105, "total_steps": 9627, "loss": 1.7704, "learning_rate": 6.145757102391227e-05, "epoch": 0.4264049028773242, "percentage": 42.64, "elapsed_time": "1 day, 6:44:55", "remaining_time": "1 day, 17:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4106, "total_steps": 9627, "loss": 1.7799, "learning_rate": 6.144168801384698e-05, "epoch": 0.4265087773969045, "percentage": 42.65, "elapsed_time": "1 day, 6:45:24", "remaining_time": "1 day, 17:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4107, "total_steps": 9627, "loss": 1.6106, "learning_rate": 6.142580378533114e-05, "epoch": 0.4266126519164849, "percentage": 42.66, "elapsed_time": "1 day, 6:45:52", "remaining_time": "1 day, 17:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4108, "total_steps": 9627, "loss": 1.6198, "learning_rate": 6.140991834005632e-05, "epoch": 0.4267165264360652, "percentage": 42.67, "elapsed_time": "1 day, 6:46:21", "remaining_time": "1 day, 17:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4109, "total_steps": 9627, "loss": 1.7884, "learning_rate": 6.139403167971422e-05, "epoch": 0.4268204009556456, "percentage": 42.68, "elapsed_time": "1 day, 6:46:49", "remaining_time": "1 day, 17:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4110, "total_steps": 9627, "loss": 1.7371, "learning_rate": 6.13781438059966e-05, "epoch": 0.42692427547522593, "percentage": 42.69, "elapsed_time": "1 day, 6:47:19", "remaining_time": "1 day, 17:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4111, "total_steps": 9627, "loss": 1.6047, "learning_rate": 6.136225472059545e-05, "epoch": 0.42702814999480626, "percentage": 42.7, "elapsed_time": "1 day, 6:47:47", "remaining_time": "1 day, 17:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4112, "total_steps": 9627, "loss": 1.6329, "learning_rate": 6.134636442520277e-05, "epoch": 0.42713202451438664, "percentage": 42.71, "elapsed_time": "1 day, 6:48:16", "remaining_time": "1 day, 17:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4113, "total_steps": 9627, "loss": 1.711, "learning_rate": 6.13304729215108e-05, "epoch": 0.42723589903396697, "percentage": 42.72, "elapsed_time": "1 day, 6:48:44", "remaining_time": "1 day, 17:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4114, "total_steps": 9627, "loss": 1.6623, "learning_rate": 6.131458021121184e-05, "epoch": 0.4273397735535473, "percentage": 42.73, "elapsed_time": "1 day, 6:49:13", "remaining_time": "1 day, 17:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4115, "total_steps": 9627, "loss": 1.8319, "learning_rate": 6.129868629599832e-05, "epoch": 0.4274436480731277, "percentage": 42.74, "elapsed_time": "1 day, 6:49:42", "remaining_time": "1 day, 17:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4116, "total_steps": 9627, "loss": 1.8514, "learning_rate": 6.128279117756288e-05, "epoch": 0.427547522592708, "percentage": 42.75, "elapsed_time": "1 day, 6:50:09", "remaining_time": "1 day, 17:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4117, "total_steps": 9627, "loss": 1.7907, "learning_rate": 6.126689485759818e-05, "epoch": 0.42765139711228833, "percentage": 42.77, "elapsed_time": "1 day, 6:50:39", "remaining_time": "1 day, 17:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4118, "total_steps": 9627, "loss": 1.5299, "learning_rate": 6.125099733779706e-05, "epoch": 0.4277552716318687, "percentage": 42.78, "elapsed_time": "1 day, 6:51:06", "remaining_time": "1 day, 17:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4119, "total_steps": 9627, "loss": 1.6515, "learning_rate": 6.12350986198525e-05, "epoch": 0.42785914615144904, "percentage": 42.79, "elapsed_time": "1 day, 6:51:36", "remaining_time": "1 day, 17:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4120, "total_steps": 9627, "loss": 1.9308, "learning_rate": 6.121919870545755e-05, "epoch": 0.42796302067102937, "percentage": 42.8, "elapsed_time": "1 day, 6:52:04", "remaining_time": "1 day, 17:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4121, "total_steps": 9627, "loss": 1.9438, "learning_rate": 6.120329759630546e-05, "epoch": 0.42806689519060975, "percentage": 42.81, "elapsed_time": "1 day, 6:52:34", "remaining_time": "1 day, 17:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4122, "total_steps": 9627, "loss": 1.8285, "learning_rate": 6.118739529408956e-05, "epoch": 0.4281707697101901, "percentage": 42.82, "elapsed_time": "1 day, 6:53:02", "remaining_time": "1 day, 17:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4123, "total_steps": 9627, "loss": 1.7948, "learning_rate": 6.117149180050332e-05, "epoch": 0.42827464422977046, "percentage": 42.83, "elapsed_time": "1 day, 6:53:30", "remaining_time": "1 day, 17:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4124, "total_steps": 9627, "loss": 1.6341, "learning_rate": 6.115558711724036e-05, "epoch": 0.4283785187493508, "percentage": 42.84, "elapsed_time": "1 day, 6:53:59", "remaining_time": "1 day, 17:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4125, "total_steps": 9627, "loss": 1.6512, "learning_rate": 6.113968124599439e-05, "epoch": 0.4284823932689311, "percentage": 42.85, "elapsed_time": "1 day, 6:54:27", "remaining_time": "1 day, 17:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4126, "total_steps": 9627, "loss": 1.7734, "learning_rate": 6.112377418845925e-05, "epoch": 0.4285862677885115, "percentage": 42.86, "elapsed_time": "1 day, 6:54:56", "remaining_time": "1 day, 17:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4127, "total_steps": 9627, "loss": 1.8773, "learning_rate": 6.110786594632892e-05, "epoch": 0.4286901423080918, "percentage": 42.87, "elapsed_time": "1 day, 6:55:25", "remaining_time": "1 day, 17:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4128, "total_steps": 9627, "loss": 1.6428, "learning_rate": 6.109195652129753e-05, "epoch": 0.42879401682767215, "percentage": 42.88, "elapsed_time": "1 day, 6:55:52", "remaining_time": "1 day, 17:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4129, "total_steps": 9627, "loss": 1.5291, "learning_rate": 6.107604591505928e-05, "epoch": 0.42889789134725254, "percentage": 42.89, "elapsed_time": "1 day, 6:56:22", "remaining_time": "1 day, 17:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4130, "total_steps": 9627, "loss": 1.8709, "learning_rate": 6.106013412930853e-05, "epoch": 0.42900176586683286, "percentage": 42.9, "elapsed_time": "1 day, 6:56:50", "remaining_time": "1 day, 17:11:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4131, "total_steps": 9627, "loss": 2.1084, "learning_rate": 6.10442211657398e-05, "epoch": 0.4291056403864132, "percentage": 42.91, "elapsed_time": "1 day, 6:57:19", "remaining_time": "1 day, 17:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4132, "total_steps": 9627, "loss": 1.7182, "learning_rate": 6.1028307026047624e-05, "epoch": 0.42920951490599357, "percentage": 42.92, "elapsed_time": "1 day, 6:57:47", "remaining_time": "1 day, 17:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4133, "total_steps": 9627, "loss": 1.7323, "learning_rate": 6.1012391711926795e-05, "epoch": 0.4293133894255739, "percentage": 42.93, "elapsed_time": "1 day, 6:58:17", "remaining_time": "1 day, 17:10:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4134, "total_steps": 9627, "loss": 1.7496, "learning_rate": 6.099647522507216e-05, "epoch": 0.4294172639451542, "percentage": 42.94, "elapsed_time": "1 day, 6:58:45", "remaining_time": "1 day, 17:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4135, "total_steps": 9627, "loss": 1.781, "learning_rate": 6.098055756717866e-05, "epoch": 0.4295211384647346, "percentage": 42.95, "elapsed_time": "1 day, 6:59:13", "remaining_time": "1 day, 17:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4136, "total_steps": 9627, "loss": 1.7705, "learning_rate": 6.0964638739941447e-05, "epoch": 0.42962501298431494, "percentage": 42.96, "elapsed_time": "1 day, 6:59:43", "remaining_time": "1 day, 17:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4137, "total_steps": 9627, "loss": 1.7518, "learning_rate": 6.094871874505572e-05, "epoch": 0.4297288875038953, "percentage": 42.97, "elapsed_time": "1 day, 7:00:11", "remaining_time": "1 day, 17:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4138, "total_steps": 9627, "loss": 1.6859, "learning_rate": 6.093279758421687e-05, "epoch": 0.42983276202347565, "percentage": 42.98, "elapsed_time": "1 day, 7:00:39", "remaining_time": "1 day, 17:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4139, "total_steps": 9627, "loss": 1.5105, "learning_rate": 6.0916875259120366e-05, "epoch": 0.42993663654305597, "percentage": 42.99, "elapsed_time": "1 day, 7:01:08", "remaining_time": "1 day, 17:07:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4140, "total_steps": 9627, "loss": 1.7621, "learning_rate": 6.090095177146178e-05, "epoch": 0.43004051106263635, "percentage": 43.0, "elapsed_time": "1 day, 7:01:37", "remaining_time": "1 day, 17:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4141, "total_steps": 9627, "loss": 1.8687, "learning_rate": 6.088502712293687e-05, "epoch": 0.4301443855822167, "percentage": 43.01, "elapsed_time": "1 day, 7:02:06", "remaining_time": "1 day, 17:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4142, "total_steps": 9627, "loss": 1.6906, "learning_rate": 6.086910131524147e-05, "epoch": 0.430248260101797, "percentage": 43.02, "elapsed_time": "1 day, 7:02:34", "remaining_time": "1 day, 17:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4143, "total_steps": 9627, "loss": 1.7431, "learning_rate": 6.085317435007156e-05, "epoch": 0.4303521346213774, "percentage": 43.04, "elapsed_time": "1 day, 7:03:03", "remaining_time": "1 day, 17:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4144, "total_steps": 9627, "loss": 1.7628, "learning_rate": 6.0837246229123246e-05, "epoch": 0.4304560091409577, "percentage": 43.05, "elapsed_time": "1 day, 7:03:30", "remaining_time": "1 day, 17:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4145, "total_steps": 9627, "loss": 1.4422, "learning_rate": 6.0821316954092745e-05, "epoch": 0.43055988366053805, "percentage": 43.06, "elapsed_time": "1 day, 7:04:00", "remaining_time": "1 day, 17:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4146, "total_steps": 9627, "loss": 1.6521, "learning_rate": 6.08053865266764e-05, "epoch": 0.43066375818011843, "percentage": 43.07, "elapsed_time": "1 day, 7:04:27", "remaining_time": "1 day, 17:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4147, "total_steps": 9627, "loss": 1.9144, "learning_rate": 6.078945494857068e-05, "epoch": 0.43076763269969875, "percentage": 43.08, "elapsed_time": "1 day, 7:04:57", "remaining_time": "1 day, 17:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4148, "total_steps": 9627, "loss": 1.6819, "learning_rate": 6.077352222147214e-05, "epoch": 0.43087150721927914, "percentage": 43.09, "elapsed_time": "1 day, 7:05:26", "remaining_time": "1 day, 17:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4149, "total_steps": 9627, "loss": 1.7586, "learning_rate": 6.075758834707754e-05, "epoch": 0.43097538173885946, "percentage": 43.1, "elapsed_time": "1 day, 7:05:54", "remaining_time": "1 day, 17:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4150, "total_steps": 9627, "loss": 1.8504, "learning_rate": 6.0741653327083703e-05, "epoch": 0.4310792562584398, "percentage": 43.11, "elapsed_time": "1 day, 7:06:23", "remaining_time": "1 day, 17:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4151, "total_steps": 9627, "loss": 1.7859, "learning_rate": 6.072571716318756e-05, "epoch": 0.4311831307780202, "percentage": 43.12, "elapsed_time": "1 day, 7:06:52", "remaining_time": "1 day, 17:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4152, "total_steps": 9627, "loss": 1.6534, "learning_rate": 6.0709779857086214e-05, "epoch": 0.4312870052976005, "percentage": 43.13, "elapsed_time": "1 day, 7:07:21", "remaining_time": "1 day, 17:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4153, "total_steps": 9627, "loss": 1.5697, "learning_rate": 6.069384141047686e-05, "epoch": 0.43139087981718083, "percentage": 43.14, "elapsed_time": "1 day, 7:07:49", "remaining_time": "1 day, 17:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4154, "total_steps": 9627, "loss": 1.6565, "learning_rate": 6.067790182505678e-05, "epoch": 0.4314947543367612, "percentage": 43.15, "elapsed_time": "1 day, 7:08:18", "remaining_time": "1 day, 17:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4155, "total_steps": 9627, "loss": 1.6159, "learning_rate": 6.066196110252347e-05, "epoch": 0.43159862885634154, "percentage": 43.16, "elapsed_time": "1 day, 7:08:46", "remaining_time": "1 day, 17:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4156, "total_steps": 9627, "loss": 1.4971, "learning_rate": 6.064601924457447e-05, "epoch": 0.43170250337592186, "percentage": 43.17, "elapsed_time": "1 day, 7:09:15", "remaining_time": "1 day, 17:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4157, "total_steps": 9627, "loss": 1.6329, "learning_rate": 6.0630076252907445e-05, "epoch": 0.43180637789550225, "percentage": 43.18, "elapsed_time": "1 day, 7:09:43", "remaining_time": "1 day, 17:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4158, "total_steps": 9627, "loss": 1.7333, "learning_rate": 6.061413212922022e-05, "epoch": 0.4319102524150826, "percentage": 43.19, "elapsed_time": "1 day, 7:10:11", "remaining_time": "1 day, 16:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4159, "total_steps": 9627, "loss": 1.6936, "learning_rate": 6.059818687521074e-05, "epoch": 0.4320141269346629, "percentage": 43.2, "elapsed_time": "1 day, 7:10:40", "remaining_time": "1 day, 16:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4160, "total_steps": 9627, "loss": 1.7692, "learning_rate": 6.0582240492577015e-05, "epoch": 0.4321180014542433, "percentage": 43.21, "elapsed_time": "1 day, 7:11:08", "remaining_time": "1 day, 16:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4161, "total_steps": 9627, "loss": 1.6549, "learning_rate": 6.056629298301722e-05, "epoch": 0.4322218759738236, "percentage": 43.22, "elapsed_time": "1 day, 7:11:37", "remaining_time": "1 day, 16:58:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4162, "total_steps": 9627, "loss": 1.8607, "learning_rate": 6.0550344348229626e-05, "epoch": 0.432325750493404, "percentage": 43.23, "elapsed_time": "1 day, 7:12:05", "remaining_time": "1 day, 16:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4163, "total_steps": 9627, "loss": 1.6305, "learning_rate": 6.053439458991268e-05, "epoch": 0.4324296250129843, "percentage": 43.24, "elapsed_time": "1 day, 7:12:34", "remaining_time": "1 day, 16:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4164, "total_steps": 9627, "loss": 1.5788, "learning_rate": 6.051844370976487e-05, "epoch": 0.43253349953256465, "percentage": 43.25, "elapsed_time": "1 day, 7:13:03", "remaining_time": "1 day, 16:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4165, "total_steps": 9627, "loss": 1.6356, "learning_rate": 6.050249170948484e-05, "epoch": 0.43263737405214503, "percentage": 43.26, "elapsed_time": "1 day, 7:13:31", "remaining_time": "1 day, 16:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4166, "total_steps": 9627, "loss": 1.7449, "learning_rate": 6.048653859077138e-05, "epoch": 0.43274124857172536, "percentage": 43.27, "elapsed_time": "1 day, 7:14:00", "remaining_time": "1 day, 16:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4167, "total_steps": 9627, "loss": 1.648, "learning_rate": 6.0470584355323375e-05, "epoch": 0.4328451230913057, "percentage": 43.28, "elapsed_time": "1 day, 7:14:27", "remaining_time": "1 day, 16:56:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4168, "total_steps": 9627, "loss": 1.8709, "learning_rate": 6.045462900483978e-05, "epoch": 0.43294899761088607, "percentage": 43.29, "elapsed_time": "1 day, 7:14:57", "remaining_time": "1 day, 16:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4169, "total_steps": 9627, "loss": 1.7013, "learning_rate": 6.0438672541019755e-05, "epoch": 0.4330528721304664, "percentage": 43.31, "elapsed_time": "1 day, 7:15:25", "remaining_time": "1 day, 16:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4170, "total_steps": 9627, "loss": 1.6795, "learning_rate": 6.042271496556254e-05, "epoch": 0.4331567466500467, "percentage": 43.32, "elapsed_time": "1 day, 7:15:54", "remaining_time": "1 day, 16:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4171, "total_steps": 9627, "loss": 1.7468, "learning_rate": 6.040675628016746e-05, "epoch": 0.4332606211696271, "percentage": 43.33, "elapsed_time": "1 day, 7:16:22", "remaining_time": "1 day, 16:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4172, "total_steps": 9627, "loss": 1.7661, "learning_rate": 6.039079648653403e-05, "epoch": 0.43336449568920743, "percentage": 43.34, "elapsed_time": "1 day, 7:16:51", "remaining_time": "1 day, 16:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4173, "total_steps": 9627, "loss": 1.6341, "learning_rate": 6.037483558636183e-05, "epoch": 0.4334683702087878, "percentage": 43.35, "elapsed_time": "1 day, 7:17:19", "remaining_time": "1 day, 16:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4174, "total_steps": 9627, "loss": 1.7788, "learning_rate": 6.035887358135056e-05, "epoch": 0.43357224472836814, "percentage": 43.36, "elapsed_time": "1 day, 7:17:48", "remaining_time": "1 day, 16:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4175, "total_steps": 9627, "loss": 1.8262, "learning_rate": 6.0342910473200054e-05, "epoch": 0.43367611924794847, "percentage": 43.37, "elapsed_time": "1 day, 7:18:16", "remaining_time": "1 day, 16:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4176, "total_steps": 9627, "loss": 1.7661, "learning_rate": 6.032694626361025e-05, "epoch": 0.43377999376752885, "percentage": 43.38, "elapsed_time": "1 day, 7:18:45", "remaining_time": "1 day, 16:52:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4177, "total_steps": 9627, "loss": 1.5742, "learning_rate": 6.0310980954281234e-05, "epoch": 0.4338838682871092, "percentage": 43.39, "elapsed_time": "1 day, 7:19:12", "remaining_time": "1 day, 16:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4178, "total_steps": 9627, "loss": 1.66, "learning_rate": 6.029501454691318e-05, "epoch": 0.4339877428066895, "percentage": 43.4, "elapsed_time": "1 day, 7:19:42", "remaining_time": "1 day, 16:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4179, "total_steps": 9627, "loss": 1.6484, "learning_rate": 6.027904704320636e-05, "epoch": 0.4340916173262699, "percentage": 43.41, "elapsed_time": "1 day, 7:20:09", "remaining_time": "1 day, 16:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4180, "total_steps": 9627, "loss": 1.7898, "learning_rate": 6.026307844486123e-05, "epoch": 0.4341954918458502, "percentage": 43.42, "elapsed_time": "1 day, 7:20:38", "remaining_time": "1 day, 16:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4181, "total_steps": 9627, "loss": 1.6147, "learning_rate": 6.024710875357831e-05, "epoch": 0.43429936636543054, "percentage": 43.43, "elapsed_time": "1 day, 7:21:06", "remaining_time": "1 day, 16:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4182, "total_steps": 9627, "loss": 1.685, "learning_rate": 6.02311379710582e-05, "epoch": 0.4344032408850109, "percentage": 43.44, "elapsed_time": "1 day, 7:21:34", "remaining_time": "1 day, 16:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4183, "total_steps": 9627, "loss": 1.8715, "learning_rate": 6.021516609900173e-05, "epoch": 0.43450711540459125, "percentage": 43.45, "elapsed_time": "1 day, 7:22:04", "remaining_time": "1 day, 16:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4184, "total_steps": 9627, "loss": 1.6407, "learning_rate": 6.019919313910976e-05, "epoch": 0.4346109899241716, "percentage": 43.46, "elapsed_time": "1 day, 7:22:31", "remaining_time": "1 day, 16:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4185, "total_steps": 9627, "loss": 1.6688, "learning_rate": 6.0183219093083244e-05, "epoch": 0.43471486444375196, "percentage": 43.47, "elapsed_time": "1 day, 7:23:00", "remaining_time": "1 day, 16:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4186, "total_steps": 9627, "loss": 1.8047, "learning_rate": 6.016724396262335e-05, "epoch": 0.4348187389633323, "percentage": 43.48, "elapsed_time": "1 day, 7:23:28", "remaining_time": "1 day, 16:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4187, "total_steps": 9627, "loss": 1.7502, "learning_rate": 6.015126774943128e-05, "epoch": 0.43492261348291267, "percentage": 43.49, "elapsed_time": "1 day, 7:23:56", "remaining_time": "1 day, 16:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4188, "total_steps": 9627, "loss": 1.8191, "learning_rate": 6.013529045520838e-05, "epoch": 0.435026488002493, "percentage": 43.5, "elapsed_time": "1 day, 7:24:25", "remaining_time": "1 day, 16:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4189, "total_steps": 9627, "loss": 1.6365, "learning_rate": 6.011931208165611e-05, "epoch": 0.4351303625220733, "percentage": 43.51, "elapsed_time": "1 day, 7:24:53", "remaining_time": "1 day, 16:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4190, "total_steps": 9627, "loss": 1.7451, "learning_rate": 6.0103332630476017e-05, "epoch": 0.4352342370416537, "percentage": 43.52, "elapsed_time": "1 day, 7:25:22", "remaining_time": "1 day, 16:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4191, "total_steps": 9627, "loss": 1.7397, "learning_rate": 6.008735210336982e-05, "epoch": 0.43533811156123403, "percentage": 43.53, "elapsed_time": "1 day, 7:25:51", "remaining_time": "1 day, 16:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4192, "total_steps": 9627, "loss": 1.5615, "learning_rate": 6.00713705020393e-05, "epoch": 0.43544198608081436, "percentage": 43.54, "elapsed_time": "1 day, 7:26:18", "remaining_time": "1 day, 16:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4193, "total_steps": 9627, "loss": 1.8237, "learning_rate": 6.005538782818638e-05, "epoch": 0.43554586060039474, "percentage": 43.55, "elapsed_time": "1 day, 7:26:47", "remaining_time": "1 day, 16:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4194, "total_steps": 9627, "loss": 1.7932, "learning_rate": 6.003940408351311e-05, "epoch": 0.43564973511997507, "percentage": 43.56, "elapsed_time": "1 day, 7:27:15", "remaining_time": "1 day, 16:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4195, "total_steps": 9627, "loss": 1.6768, "learning_rate": 6.0023419269721613e-05, "epoch": 0.4357536096395554, "percentage": 43.58, "elapsed_time": "1 day, 7:27:43", "remaining_time": "1 day, 16:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4196, "total_steps": 9627, "loss": 1.513, "learning_rate": 6.000743338851413e-05, "epoch": 0.4358574841591358, "percentage": 43.59, "elapsed_time": "1 day, 7:28:12", "remaining_time": "1 day, 16:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4197, "total_steps": 9627, "loss": 1.7438, "learning_rate": 5.999144644159307e-05, "epoch": 0.4359613586787161, "percentage": 43.6, "elapsed_time": "1 day, 7:28:40", "remaining_time": "1 day, 16:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4198, "total_steps": 9627, "loss": 1.7892, "learning_rate": 5.997545843066089e-05, "epoch": 0.43606523319829643, "percentage": 43.61, "elapsed_time": "1 day, 7:29:10", "remaining_time": "1 day, 16:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4199, "total_steps": 9627, "loss": 1.6238, "learning_rate": 5.995946935742019e-05, "epoch": 0.4361691077178768, "percentage": 43.62, "elapsed_time": "1 day, 7:29:37", "remaining_time": "1 day, 16:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4200, "total_steps": 9627, "loss": 1.5195, "learning_rate": 5.994347922357372e-05, "epoch": 0.43627298223745714, "percentage": 43.63, "elapsed_time": "1 day, 7:30:06", "remaining_time": "1 day, 16:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4201, "total_steps": 9627, "loss": 1.9181, "learning_rate": 5.992748803082425e-05, "epoch": 0.4363768567570375, "percentage": 43.64, "elapsed_time": "1 day, 7:30:35", "remaining_time": "1 day, 16:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4202, "total_steps": 9627, "loss": 1.767, "learning_rate": 5.991149578087476e-05, "epoch": 0.43648073127661785, "percentage": 43.65, "elapsed_time": "1 day, 7:31:03", "remaining_time": "1 day, 16:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4203, "total_steps": 9627, "loss": 1.8537, "learning_rate": 5.9895502475428265e-05, "epoch": 0.4365846057961982, "percentage": 43.66, "elapsed_time": "1 day, 7:31:32", "remaining_time": "1 day, 16:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4204, "total_steps": 9627, "loss": 1.6446, "learning_rate": 5.9879508116187947e-05, "epoch": 0.43668848031577856, "percentage": 43.67, "elapsed_time": "1 day, 7:31:59", "remaining_time": "1 day, 16:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4205, "total_steps": 9627, "loss": 1.7255, "learning_rate": 5.9863512704857085e-05, "epoch": 0.4367923548353589, "percentage": 43.68, "elapsed_time": "1 day, 7:32:28", "remaining_time": "1 day, 16:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4206, "total_steps": 9627, "loss": 1.6686, "learning_rate": 5.9847516243139055e-05, "epoch": 0.4368962293549392, "percentage": 43.69, "elapsed_time": "1 day, 7:32:56", "remaining_time": "1 day, 16:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4207, "total_steps": 9627, "loss": 1.563, "learning_rate": 5.9831518732737344e-05, "epoch": 0.4370001038745196, "percentage": 43.7, "elapsed_time": "1 day, 7:33:25", "remaining_time": "1 day, 16:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4208, "total_steps": 9627, "loss": 1.6068, "learning_rate": 5.981552017535561e-05, "epoch": 0.4371039783940999, "percentage": 43.71, "elapsed_time": "1 day, 7:33:52", "remaining_time": "1 day, 16:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4209, "total_steps": 9627, "loss": 1.7952, "learning_rate": 5.979952057269752e-05, "epoch": 0.43720785291368025, "percentage": 43.72, "elapsed_time": "1 day, 7:34:22", "remaining_time": "1 day, 16:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4210, "total_steps": 9627, "loss": 1.66, "learning_rate": 5.9783519926466924e-05, "epoch": 0.43731172743326063, "percentage": 43.73, "elapsed_time": "1 day, 7:34:49", "remaining_time": "1 day, 16:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4211, "total_steps": 9627, "loss": 1.6255, "learning_rate": 5.976751823836778e-05, "epoch": 0.43741560195284096, "percentage": 43.74, "elapsed_time": "1 day, 7:35:18", "remaining_time": "1 day, 16:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4212, "total_steps": 9627, "loss": 1.5188, "learning_rate": 5.975151551010412e-05, "epoch": 0.43751947647242134, "percentage": 43.75, "elapsed_time": "1 day, 7:35:47", "remaining_time": "1 day, 16:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4213, "total_steps": 9627, "loss": 1.6951, "learning_rate": 5.973551174338014e-05, "epoch": 0.43762335099200167, "percentage": 43.76, "elapsed_time": "1 day, 7:36:14", "remaining_time": "1 day, 16:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4214, "total_steps": 9627, "loss": 1.5638, "learning_rate": 5.9719506939900094e-05, "epoch": 0.437727225511582, "percentage": 43.77, "elapsed_time": "1 day, 7:36:42", "remaining_time": "1 day, 16:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4215, "total_steps": 9627, "loss": 1.8339, "learning_rate": 5.9703501101368374e-05, "epoch": 0.4378311000311624, "percentage": 43.78, "elapsed_time": "1 day, 7:37:11", "remaining_time": "1 day, 16:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4216, "total_steps": 9627, "loss": 1.723, "learning_rate": 5.968749422948947e-05, "epoch": 0.4379349745507427, "percentage": 43.79, "elapsed_time": "1 day, 7:37:39", "remaining_time": "1 day, 16:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4217, "total_steps": 9627, "loss": 1.6502, "learning_rate": 5.967148632596801e-05, "epoch": 0.43803884907032303, "percentage": 43.8, "elapsed_time": "1 day, 7:38:08", "remaining_time": "1 day, 16:35:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4218, "total_steps": 9627, "loss": 1.8315, "learning_rate": 5.965547739250867e-05, "epoch": 0.4381427235899034, "percentage": 43.81, "elapsed_time": "1 day, 7:38:37", "remaining_time": "1 day, 16:34:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4219, "total_steps": 9627, "loss": 1.7273, "learning_rate": 5.963946743081633e-05, "epoch": 0.43824659810948374, "percentage": 43.82, "elapsed_time": "1 day, 7:39:03", "remaining_time": "1 day, 16:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4220, "total_steps": 9627, "loss": 1.7344, "learning_rate": 5.962345644259589e-05, "epoch": 0.43835047262906407, "percentage": 43.84, "elapsed_time": "1 day, 7:39:33", "remaining_time": "1 day, 16:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4221, "total_steps": 9627, "loss": 1.771, "learning_rate": 5.9607444429552405e-05, "epoch": 0.43845434714864445, "percentage": 43.85, "elapsed_time": "1 day, 7:40:01", "remaining_time": "1 day, 16:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4222, "total_steps": 9627, "loss": 1.7933, "learning_rate": 5.959143139339104e-05, "epoch": 0.4385582216682248, "percentage": 43.86, "elapsed_time": "1 day, 7:40:30", "remaining_time": "1 day, 16:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4223, "total_steps": 9627, "loss": 1.667, "learning_rate": 5.957541733581704e-05, "epoch": 0.4386620961878051, "percentage": 43.87, "elapsed_time": "1 day, 7:40:57", "remaining_time": "1 day, 16:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4224, "total_steps": 9627, "loss": 1.6835, "learning_rate": 5.955940225853577e-05, "epoch": 0.4387659707073855, "percentage": 43.88, "elapsed_time": "1 day, 7:41:25", "remaining_time": "1 day, 16:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4225, "total_steps": 9627, "loss": 1.7532, "learning_rate": 5.9543386163252744e-05, "epoch": 0.4388698452269658, "percentage": 43.89, "elapsed_time": "1 day, 7:41:53", "remaining_time": "1 day, 16:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4226, "total_steps": 9627, "loss": 1.5813, "learning_rate": 5.952736905167352e-05, "epoch": 0.4389737197465462, "percentage": 43.9, "elapsed_time": "1 day, 7:42:22", "remaining_time": "1 day, 16:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4227, "total_steps": 9627, "loss": 1.8791, "learning_rate": 5.951135092550382e-05, "epoch": 0.4390775942661265, "percentage": 43.91, "elapsed_time": "1 day, 7:42:50", "remaining_time": "1 day, 16:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4228, "total_steps": 9627, "loss": 1.6862, "learning_rate": 5.949533178644943e-05, "epoch": 0.43918146878570685, "percentage": 43.92, "elapsed_time": "1 day, 7:43:19", "remaining_time": "1 day, 16:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4229, "total_steps": 9627, "loss": 1.7341, "learning_rate": 5.9479311636216274e-05, "epoch": 0.43928534330528723, "percentage": 43.93, "elapsed_time": "1 day, 7:43:47", "remaining_time": "1 day, 16:30:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4230, "total_steps": 9627, "loss": 1.6987, "learning_rate": 5.946329047651037e-05, "epoch": 0.43938921782486756, "percentage": 43.94, "elapsed_time": "1 day, 7:44:14", "remaining_time": "1 day, 16:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4231, "total_steps": 9627, "loss": 1.7809, "learning_rate": 5.944726830903785e-05, "epoch": 0.4394930923444479, "percentage": 43.95, "elapsed_time": "1 day, 7:44:43", "remaining_time": "1 day, 16:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4232, "total_steps": 9627, "loss": 1.7338, "learning_rate": 5.9431245135504934e-05, "epoch": 0.43959696686402827, "percentage": 43.96, "elapsed_time": "1 day, 7:45:12", "remaining_time": "1 day, 16:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4233, "total_steps": 9627, "loss": 1.5948, "learning_rate": 5.941522095761799e-05, "epoch": 0.4397008413836086, "percentage": 43.97, "elapsed_time": "1 day, 7:45:41", "remaining_time": "1 day, 16:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4234, "total_steps": 9627, "loss": 1.2893, "learning_rate": 5.939919577708346e-05, "epoch": 0.4398047159031889, "percentage": 43.98, "elapsed_time": "1 day, 7:46:08", "remaining_time": "1 day, 16:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4235, "total_steps": 9627, "loss": 1.6906, "learning_rate": 5.938316959560788e-05, "epoch": 0.4399085904227693, "percentage": 43.99, "elapsed_time": "1 day, 7:46:37", "remaining_time": "1 day, 16:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4236, "total_steps": 9627, "loss": 1.7074, "learning_rate": 5.9367142414897945e-05, "epoch": 0.44001246494234963, "percentage": 44.0, "elapsed_time": "1 day, 7:47:05", "remaining_time": "1 day, 16:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4237, "total_steps": 9627, "loss": 1.7486, "learning_rate": 5.935111423666041e-05, "epoch": 0.44011633946192996, "percentage": 44.01, "elapsed_time": "1 day, 7:47:34", "remaining_time": "1 day, 16:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4238, "total_steps": 9627, "loss": 1.7472, "learning_rate": 5.933508506260214e-05, "epoch": 0.44022021398151034, "percentage": 44.02, "elapsed_time": "1 day, 7:48:01", "remaining_time": "1 day, 16:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4239, "total_steps": 9627, "loss": 1.8697, "learning_rate": 5.9319054894430126e-05, "epoch": 0.44032408850109067, "percentage": 44.03, "elapsed_time": "1 day, 7:48:31", "remaining_time": "1 day, 16:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4240, "total_steps": 9627, "loss": 1.5873, "learning_rate": 5.930302373385145e-05, "epoch": 0.44042796302067105, "percentage": 44.04, "elapsed_time": "1 day, 7:48:58", "remaining_time": "1 day, 16:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4241, "total_steps": 9627, "loss": 1.71, "learning_rate": 5.928699158257333e-05, "epoch": 0.4405318375402514, "percentage": 44.05, "elapsed_time": "1 day, 7:49:27", "remaining_time": "1 day, 16:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4242, "total_steps": 9627, "loss": 1.8128, "learning_rate": 5.9270958442303035e-05, "epoch": 0.4406357120598317, "percentage": 44.06, "elapsed_time": "1 day, 7:49:55", "remaining_time": "1 day, 16:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4243, "total_steps": 9627, "loss": 1.7892, "learning_rate": 5.9254924314748e-05, "epoch": 0.4407395865794121, "percentage": 44.07, "elapsed_time": "1 day, 7:50:24", "remaining_time": "1 day, 16:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4244, "total_steps": 9627, "loss": 1.7573, "learning_rate": 5.923888920161571e-05, "epoch": 0.4408434610989924, "percentage": 44.08, "elapsed_time": "1 day, 7:50:51", "remaining_time": "1 day, 16:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4245, "total_steps": 9627, "loss": 1.7848, "learning_rate": 5.922285310461378e-05, "epoch": 0.44094733561857274, "percentage": 44.09, "elapsed_time": "1 day, 7:51:19", "remaining_time": "1 day, 16:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4246, "total_steps": 9627, "loss": 1.7333, "learning_rate": 5.920681602544993e-05, "epoch": 0.4410512101381531, "percentage": 44.11, "elapsed_time": "1 day, 7:51:48", "remaining_time": "1 day, 16:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4247, "total_steps": 9627, "loss": 1.6265, "learning_rate": 5.9190777965832e-05, "epoch": 0.44115508465773345, "percentage": 44.12, "elapsed_time": "1 day, 7:52:16", "remaining_time": "1 day, 16:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4248, "total_steps": 9627, "loss": 1.5993, "learning_rate": 5.917473892746791e-05, "epoch": 0.4412589591773138, "percentage": 44.13, "elapsed_time": "1 day, 7:52:44", "remaining_time": "1 day, 16:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4249, "total_steps": 9627, "loss": 1.7911, "learning_rate": 5.915869891206567e-05, "epoch": 0.44136283369689416, "percentage": 44.14, "elapsed_time": "1 day, 7:53:12", "remaining_time": "1 day, 16:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4250, "total_steps": 9627, "loss": 1.487, "learning_rate": 5.9142657921333466e-05, "epoch": 0.4414667082164745, "percentage": 44.15, "elapsed_time": "1 day, 7:53:41", "remaining_time": "1 day, 16:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4251, "total_steps": 9627, "loss": 1.5246, "learning_rate": 5.912661595697948e-05, "epoch": 0.4415705827360549, "percentage": 44.16, "elapsed_time": "1 day, 7:54:09", "remaining_time": "1 day, 16:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4252, "total_steps": 9627, "loss": 1.7199, "learning_rate": 5.91105730207121e-05, "epoch": 0.4416744572556352, "percentage": 44.17, "elapsed_time": "1 day, 7:54:37", "remaining_time": "1 day, 16:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4253, "total_steps": 9627, "loss": 1.6264, "learning_rate": 5.909452911423976e-05, "epoch": 0.4417783317752155, "percentage": 44.18, "elapsed_time": "1 day, 7:55:06", "remaining_time": "1 day, 16:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4254, "total_steps": 9627, "loss": 1.5363, "learning_rate": 5.9078484239271e-05, "epoch": 0.4418822062947959, "percentage": 44.19, "elapsed_time": "1 day, 7:55:34", "remaining_time": "1 day, 16:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4255, "total_steps": 9627, "loss": 1.7037, "learning_rate": 5.9062438397514496e-05, "epoch": 0.44198608081437624, "percentage": 44.2, "elapsed_time": "1 day, 7:56:01", "remaining_time": "1 day, 16:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4256, "total_steps": 9627, "loss": 1.7508, "learning_rate": 5.904639159067898e-05, "epoch": 0.44208995533395656, "percentage": 44.21, "elapsed_time": "1 day, 7:56:29", "remaining_time": "1 day, 16:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4257, "total_steps": 9627, "loss": 1.7378, "learning_rate": 5.9030343820473335e-05, "epoch": 0.44219382985353695, "percentage": 44.22, "elapsed_time": "1 day, 7:56:58", "remaining_time": "1 day, 16:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4258, "total_steps": 9627, "loss": 1.838, "learning_rate": 5.9014295088606505e-05, "epoch": 0.4422977043731173, "percentage": 44.23, "elapsed_time": "1 day, 7:57:26", "remaining_time": "1 day, 16:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4259, "total_steps": 9627, "loss": 1.8126, "learning_rate": 5.899824539678758e-05, "epoch": 0.4424015788926976, "percentage": 44.24, "elapsed_time": "1 day, 7:57:54", "remaining_time": "1 day, 16:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4260, "total_steps": 9627, "loss": 1.5948, "learning_rate": 5.898219474672568e-05, "epoch": 0.442505453412278, "percentage": 44.25, "elapsed_time": "1 day, 7:58:22", "remaining_time": "1 day, 16:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4261, "total_steps": 9627, "loss": 1.5256, "learning_rate": 5.896614314013012e-05, "epoch": 0.4426093279318583, "percentage": 44.26, "elapsed_time": "1 day, 7:58:51", "remaining_time": "1 day, 16:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4262, "total_steps": 9627, "loss": 1.762, "learning_rate": 5.8950090578710246e-05, "epoch": 0.44271320245143864, "percentage": 44.27, "elapsed_time": "1 day, 7:59:18", "remaining_time": "1 day, 16:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4263, "total_steps": 9627, "loss": 1.8018, "learning_rate": 5.893403706417554e-05, "epoch": 0.442817076971019, "percentage": 44.28, "elapsed_time": "1 day, 7:59:47", "remaining_time": "1 day, 16:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4264, "total_steps": 9627, "loss": 1.717, "learning_rate": 5.89179825982356e-05, "epoch": 0.44292095149059935, "percentage": 44.29, "elapsed_time": "1 day, 8:00:16", "remaining_time": "1 day, 16:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4265, "total_steps": 9627, "loss": 1.8017, "learning_rate": 5.8901927182600035e-05, "epoch": 0.44302482601017973, "percentage": 44.3, "elapsed_time": "1 day, 8:00:43", "remaining_time": "1 day, 16:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4266, "total_steps": 9627, "loss": 1.8363, "learning_rate": 5.88858708189787e-05, "epoch": 0.44312870052976006, "percentage": 44.31, "elapsed_time": "1 day, 8:01:12", "remaining_time": "1 day, 16:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4267, "total_steps": 9627, "loss": 1.5213, "learning_rate": 5.886981350908142e-05, "epoch": 0.4432325750493404, "percentage": 44.32, "elapsed_time": "1 day, 8:01:40", "remaining_time": "1 day, 16:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4268, "total_steps": 9627, "loss": 1.6166, "learning_rate": 5.885375525461817e-05, "epoch": 0.44333644956892077, "percentage": 44.33, "elapsed_time": "1 day, 8:02:08", "remaining_time": "1 day, 16:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4269, "total_steps": 9627, "loss": 1.7148, "learning_rate": 5.883769605729907e-05, "epoch": 0.4434403240885011, "percentage": 44.34, "elapsed_time": "1 day, 8:02:37", "remaining_time": "1 day, 16:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4270, "total_steps": 9627, "loss": 1.5109, "learning_rate": 5.882163591883427e-05, "epoch": 0.4435441986080814, "percentage": 44.35, "elapsed_time": "1 day, 8:03:05", "remaining_time": "1 day, 16:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4271, "total_steps": 9627, "loss": 1.6773, "learning_rate": 5.8805574840934067e-05, "epoch": 0.4436480731276618, "percentage": 44.36, "elapsed_time": "1 day, 8:03:33", "remaining_time": "1 day, 16:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4272, "total_steps": 9627, "loss": 1.6551, "learning_rate": 5.878951282530881e-05, "epoch": 0.44375194764724213, "percentage": 44.38, "elapsed_time": "1 day, 8:04:00", "remaining_time": "1 day, 16:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4273, "total_steps": 9627, "loss": 1.7879, "learning_rate": 5.877344987366902e-05, "epoch": 0.44385582216682246, "percentage": 44.39, "elapsed_time": "1 day, 8:04:30", "remaining_time": "1 day, 16:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4274, "total_steps": 9627, "loss": 1.705, "learning_rate": 5.875738598772522e-05, "epoch": 0.44395969668640284, "percentage": 44.4, "elapsed_time": "1 day, 8:04:57", "remaining_time": "1 day, 16:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4275, "total_steps": 9627, "loss": 1.7977, "learning_rate": 5.874132116918816e-05, "epoch": 0.44406357120598317, "percentage": 44.41, "elapsed_time": "1 day, 8:05:25", "remaining_time": "1 day, 16:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4276, "total_steps": 9627, "loss": 1.6302, "learning_rate": 5.8725255419768565e-05, "epoch": 0.4441674457255635, "percentage": 44.42, "elapsed_time": "1 day, 8:05:54", "remaining_time": "1 day, 16:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4277, "total_steps": 9627, "loss": 1.8449, "learning_rate": 5.870918874117731e-05, "epoch": 0.4442713202451439, "percentage": 44.43, "elapsed_time": "1 day, 8:06:21", "remaining_time": "1 day, 16:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4278, "total_steps": 9627, "loss": 1.7231, "learning_rate": 5.869312113512542e-05, "epoch": 0.4443751947647242, "percentage": 44.44, "elapsed_time": "1 day, 8:06:51", "remaining_time": "1 day, 16:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4279, "total_steps": 9627, "loss": 1.6797, "learning_rate": 5.867705260332391e-05, "epoch": 0.4444790692843046, "percentage": 44.45, "elapsed_time": "1 day, 8:07:18", "remaining_time": "1 day, 16:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4280, "total_steps": 9627, "loss": 1.7341, "learning_rate": 5.866098314748401e-05, "epoch": 0.4445829438038849, "percentage": 44.46, "elapsed_time": "1 day, 8:07:46", "remaining_time": "1 day, 16:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4281, "total_steps": 9627, "loss": 1.685, "learning_rate": 5.864491276931694e-05, "epoch": 0.44468681832346524, "percentage": 44.47, "elapsed_time": "1 day, 8:08:14", "remaining_time": "1 day, 16:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4282, "total_steps": 9627, "loss": 1.7268, "learning_rate": 5.862884147053409e-05, "epoch": 0.4447906928430456, "percentage": 44.48, "elapsed_time": "1 day, 8:08:42", "remaining_time": "1 day, 16:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4283, "total_steps": 9627, "loss": 1.5863, "learning_rate": 5.861276925284694e-05, "epoch": 0.44489456736262595, "percentage": 44.49, "elapsed_time": "1 day, 8:09:10", "remaining_time": "1 day, 16:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4284, "total_steps": 9627, "loss": 1.6242, "learning_rate": 5.8596696117967054e-05, "epoch": 0.4449984418822063, "percentage": 44.5, "elapsed_time": "1 day, 8:09:38", "remaining_time": "1 day, 16:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4285, "total_steps": 9627, "loss": 1.5881, "learning_rate": 5.8580622067606083e-05, "epoch": 0.44510231640178666, "percentage": 44.51, "elapsed_time": "1 day, 8:10:07", "remaining_time": "1 day, 16:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4286, "total_steps": 9627, "loss": 1.815, "learning_rate": 5.8564547103475795e-05, "epoch": 0.445206190921367, "percentage": 44.52, "elapsed_time": "1 day, 8:10:34", "remaining_time": "1 day, 16:05:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4287, "total_steps": 9627, "loss": 1.6837, "learning_rate": 5.854847122728805e-05, "epoch": 0.4453100654409473, "percentage": 44.53, "elapsed_time": "1 day, 8:11:01", "remaining_time": "1 day, 16:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4288, "total_steps": 9627, "loss": 1.7351, "learning_rate": 5.853239444075479e-05, "epoch": 0.4454139399605277, "percentage": 44.54, "elapsed_time": "1 day, 8:11:31", "remaining_time": "1 day, 16:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4289, "total_steps": 9627, "loss": 1.6621, "learning_rate": 5.8516316745588085e-05, "epoch": 0.445517814480108, "percentage": 44.55, "elapsed_time": "1 day, 8:11:58", "remaining_time": "1 day, 16:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4290, "total_steps": 9627, "loss": 1.7465, "learning_rate": 5.850023814350006e-05, "epoch": 0.4456216889996884, "percentage": 44.56, "elapsed_time": "1 day, 8:12:26", "remaining_time": "1 day, 16:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4291, "total_steps": 9627, "loss": 1.6812, "learning_rate": 5.848415863620299e-05, "epoch": 0.44572556351926873, "percentage": 44.57, "elapsed_time": "1 day, 8:12:55", "remaining_time": "1 day, 16:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4292, "total_steps": 9627, "loss": 1.6243, "learning_rate": 5.846807822540922e-05, "epoch": 0.44582943803884906, "percentage": 44.58, "elapsed_time": "1 day, 8:13:23", "remaining_time": "1 day, 16:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4293, "total_steps": 9627, "loss": 1.7954, "learning_rate": 5.8451996912831156e-05, "epoch": 0.44593331255842944, "percentage": 44.59, "elapsed_time": "1 day, 8:13:51", "remaining_time": "1 day, 16:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4294, "total_steps": 9627, "loss": 1.6049, "learning_rate": 5.8435914700181347e-05, "epoch": 0.44603718707800977, "percentage": 44.6, "elapsed_time": "1 day, 8:14:19", "remaining_time": "1 day, 16:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4295, "total_steps": 9627, "loss": 1.9193, "learning_rate": 5.8419831589172426e-05, "epoch": 0.4461410615975901, "percentage": 44.61, "elapsed_time": "1 day, 8:14:47", "remaining_time": "1 day, 16:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4296, "total_steps": 9627, "loss": 1.6742, "learning_rate": 5.840374758151711e-05, "epoch": 0.4462449361171705, "percentage": 44.62, "elapsed_time": "1 day, 8:15:14", "remaining_time": "1 day, 16:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4297, "total_steps": 9627, "loss": 1.9509, "learning_rate": 5.838766267892825e-05, "epoch": 0.4463488106367508, "percentage": 44.63, "elapsed_time": "1 day, 8:15:43", "remaining_time": "1 day, 16:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4298, "total_steps": 9627, "loss": 1.8231, "learning_rate": 5.837157688311873e-05, "epoch": 0.44645268515633113, "percentage": 44.65, "elapsed_time": "1 day, 8:16:11", "remaining_time": "1 day, 16:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4299, "total_steps": 9627, "loss": 1.7526, "learning_rate": 5.8355490195801566e-05, "epoch": 0.4465565596759115, "percentage": 44.66, "elapsed_time": "1 day, 8:16:39", "remaining_time": "1 day, 16:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4300, "total_steps": 9627, "loss": 1.749, "learning_rate": 5.8339402618689885e-05, "epoch": 0.44666043419549184, "percentage": 44.67, "elapsed_time": "1 day, 8:17:06", "remaining_time": "1 day, 15:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4301, "total_steps": 9627, "loss": 2.0137, "learning_rate": 5.832331415349687e-05, "epoch": 0.44676430871507217, "percentage": 44.68, "elapsed_time": "1 day, 8:17:36", "remaining_time": "1 day, 15:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4302, "total_steps": 9627, "loss": 1.7437, "learning_rate": 5.83072248019358e-05, "epoch": 0.44686818323465255, "percentage": 44.69, "elapsed_time": "1 day, 8:18:03", "remaining_time": "1 day, 15:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4303, "total_steps": 9627, "loss": 1.9, "learning_rate": 5.829113456572012e-05, "epoch": 0.4469720577542329, "percentage": 44.7, "elapsed_time": "1 day, 8:18:31", "remaining_time": "1 day, 15:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4304, "total_steps": 9627, "loss": 1.5549, "learning_rate": 5.827504344656326e-05, "epoch": 0.44707593227381326, "percentage": 44.71, "elapsed_time": "1 day, 8:18:59", "remaining_time": "1 day, 15:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4305, "total_steps": 9627, "loss": 1.7203, "learning_rate": 5.825895144617883e-05, "epoch": 0.4471798067933936, "percentage": 44.72, "elapsed_time": "1 day, 8:19:28", "remaining_time": "1 day, 15:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4306, "total_steps": 9627, "loss": 1.7229, "learning_rate": 5.82428585662805e-05, "epoch": 0.4472836813129739, "percentage": 44.73, "elapsed_time": "1 day, 8:19:56", "remaining_time": "1 day, 15:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4307, "total_steps": 9627, "loss": 1.6764, "learning_rate": 5.822676480858201e-05, "epoch": 0.4473875558325543, "percentage": 44.74, "elapsed_time": "1 day, 8:20:24", "remaining_time": "1 day, 15:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4308, "total_steps": 9627, "loss": 1.8381, "learning_rate": 5.821067017479727e-05, "epoch": 0.4474914303521346, "percentage": 44.75, "elapsed_time": "1 day, 8:20:51", "remaining_time": "1 day, 15:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4309, "total_steps": 9627, "loss": 2.1298, "learning_rate": 5.819457466664018e-05, "epoch": 0.44759530487171495, "percentage": 44.76, "elapsed_time": "1 day, 8:21:19", "remaining_time": "1 day, 15:55:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4310, "total_steps": 9627, "loss": 1.7621, "learning_rate": 5.81784782858248e-05, "epoch": 0.44769917939129533, "percentage": 44.77, "elapsed_time": "1 day, 8:21:47", "remaining_time": "1 day, 15:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4311, "total_steps": 9627, "loss": 1.7275, "learning_rate": 5.816238103406529e-05, "epoch": 0.44780305391087566, "percentage": 44.78, "elapsed_time": "1 day, 8:22:16", "remaining_time": "1 day, 15:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4312, "total_steps": 9627, "loss": 1.7021, "learning_rate": 5.814628291307587e-05, "epoch": 0.447906928430456, "percentage": 44.79, "elapsed_time": "1 day, 8:22:44", "remaining_time": "1 day, 15:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4313, "total_steps": 9627, "loss": 1.8654, "learning_rate": 5.813018392457086e-05, "epoch": 0.44801080295003637, "percentage": 44.8, "elapsed_time": "1 day, 8:23:11", "remaining_time": "1 day, 15:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4314, "total_steps": 9627, "loss": 1.7, "learning_rate": 5.8114084070264686e-05, "epoch": 0.4481146774696167, "percentage": 44.81, "elapsed_time": "1 day, 8:23:39", "remaining_time": "1 day, 15:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4315, "total_steps": 9627, "loss": 1.611, "learning_rate": 5.8097983351871844e-05, "epoch": 0.448218551989197, "percentage": 44.82, "elapsed_time": "1 day, 8:24:07", "remaining_time": "1 day, 15:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4316, "total_steps": 9627, "loss": 2.0493, "learning_rate": 5.808188177110694e-05, "epoch": 0.4483224265087774, "percentage": 44.83, "elapsed_time": "1 day, 8:24:36", "remaining_time": "1 day, 15:52:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4317, "total_steps": 9627, "loss": 1.8463, "learning_rate": 5.806577932968467e-05, "epoch": 0.44842630102835773, "percentage": 44.84, "elapsed_time": "1 day, 8:25:04", "remaining_time": "1 day, 15:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4318, "total_steps": 9627, "loss": 1.649, "learning_rate": 5.804967602931981e-05, "epoch": 0.4485301755479381, "percentage": 44.85, "elapsed_time": "1 day, 8:25:30", "remaining_time": "1 day, 15:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4319, "total_steps": 9627, "loss": 1.8159, "learning_rate": 5.803357187172726e-05, "epoch": 0.44863405006751844, "percentage": 44.86, "elapsed_time": "1 day, 8:26:00", "remaining_time": "1 day, 15:51:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4320, "total_steps": 9627, "loss": 1.6689, "learning_rate": 5.801746685862197e-05, "epoch": 0.44873792458709877, "percentage": 44.87, "elapsed_time": "1 day, 8:26:27", "remaining_time": "1 day, 15:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4321, "total_steps": 9627, "loss": 1.5459, "learning_rate": 5.8001360991718976e-05, "epoch": 0.44884179910667915, "percentage": 44.88, "elapsed_time": "1 day, 8:26:55", "remaining_time": "1 day, 15:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4322, "total_steps": 9627, "loss": 1.6249, "learning_rate": 5.798525427273347e-05, "epoch": 0.4489456736262595, "percentage": 44.89, "elapsed_time": "1 day, 8:27:23", "remaining_time": "1 day, 15:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4323, "total_steps": 9627, "loss": 1.7092, "learning_rate": 5.796914670338067e-05, "epoch": 0.4490495481458398, "percentage": 44.9, "elapsed_time": "1 day, 8:27:51", "remaining_time": "1 day, 15:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4324, "total_steps": 9627, "loss": 1.8151, "learning_rate": 5.795303828537589e-05, "epoch": 0.4491534226654202, "percentage": 44.92, "elapsed_time": "1 day, 8:28:18", "remaining_time": "1 day, 15:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4325, "total_steps": 9627, "loss": 1.7309, "learning_rate": 5.7936929020434585e-05, "epoch": 0.4492572971850005, "percentage": 44.93, "elapsed_time": "1 day, 8:28:47", "remaining_time": "1 day, 15:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4326, "total_steps": 9627, "loss": 1.7786, "learning_rate": 5.792081891027224e-05, "epoch": 0.44936117170458084, "percentage": 44.94, "elapsed_time": "1 day, 8:29:15", "remaining_time": "1 day, 15:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4327, "total_steps": 9627, "loss": 1.9491, "learning_rate": 5.790470795660447e-05, "epoch": 0.4494650462241612, "percentage": 44.95, "elapsed_time": "1 day, 8:29:42", "remaining_time": "1 day, 15:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4328, "total_steps": 9627, "loss": 1.7364, "learning_rate": 5.788859616114697e-05, "epoch": 0.44956892074374155, "percentage": 44.96, "elapsed_time": "1 day, 8:30:12", "remaining_time": "1 day, 15:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4329, "total_steps": 9627, "loss": 1.7383, "learning_rate": 5.787248352561549e-05, "epoch": 0.44967279526332193, "percentage": 44.97, "elapsed_time": "1 day, 8:30:40", "remaining_time": "1 day, 15:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4330, "total_steps": 9627, "loss": 1.4243, "learning_rate": 5.785637005172595e-05, "epoch": 0.44977666978290226, "percentage": 44.98, "elapsed_time": "1 day, 8:31:07", "remaining_time": "1 day, 15:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4331, "total_steps": 9627, "loss": 1.6868, "learning_rate": 5.784025574119427e-05, "epoch": 0.4498805443024826, "percentage": 44.99, "elapsed_time": "1 day, 8:31:36", "remaining_time": "1 day, 15:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4332, "total_steps": 9627, "loss": 1.5136, "learning_rate": 5.78241405957365e-05, "epoch": 0.44998441882206297, "percentage": 45.0, "elapsed_time": "1 day, 8:32:03", "remaining_time": "1 day, 15:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4333, "total_steps": 9627, "loss": 1.6864, "learning_rate": 5.78080246170688e-05, "epoch": 0.4500882933416433, "percentage": 45.01, "elapsed_time": "1 day, 8:32:32", "remaining_time": "1 day, 15:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4334, "total_steps": 9627, "loss": 1.6707, "learning_rate": 5.7791907806907395e-05, "epoch": 0.4501921678612236, "percentage": 45.02, "elapsed_time": "1 day, 8:33:00", "remaining_time": "1 day, 15:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4335, "total_steps": 9627, "loss": 1.5942, "learning_rate": 5.777579016696856e-05, "epoch": 0.450296042380804, "percentage": 45.03, "elapsed_time": "1 day, 8:33:28", "remaining_time": "1 day, 15:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4336, "total_steps": 9627, "loss": 1.5599, "learning_rate": 5.7759671698968745e-05, "epoch": 0.45039991690038433, "percentage": 45.04, "elapsed_time": "1 day, 8:33:55", "remaining_time": "1 day, 15:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4337, "total_steps": 9627, "loss": 1.7982, "learning_rate": 5.774355240462441e-05, "epoch": 0.45050379141996466, "percentage": 45.05, "elapsed_time": "1 day, 8:34:24", "remaining_time": "1 day, 15:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4338, "total_steps": 9627, "loss": 1.7028, "learning_rate": 5.772743228565215e-05, "epoch": 0.45060766593954504, "percentage": 45.06, "elapsed_time": "1 day, 8:34:52", "remaining_time": "1 day, 15:43:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4339, "total_steps": 9627, "loss": 1.7354, "learning_rate": 5.771131134376863e-05, "epoch": 0.45071154045912537, "percentage": 45.07, "elapsed_time": "1 day, 8:35:20", "remaining_time": "1 day, 15:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4340, "total_steps": 9627, "loss": 1.647, "learning_rate": 5.76951895806906e-05, "epoch": 0.4508154149787057, "percentage": 45.08, "elapsed_time": "1 day, 8:35:48", "remaining_time": "1 day, 15:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4341, "total_steps": 9627, "loss": 1.825, "learning_rate": 5.76790669981349e-05, "epoch": 0.4509192894982861, "percentage": 45.09, "elapsed_time": "1 day, 8:36:16", "remaining_time": "1 day, 15:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4342, "total_steps": 9627, "loss": 1.611, "learning_rate": 5.766294359781848e-05, "epoch": 0.4510231640178664, "percentage": 45.1, "elapsed_time": "1 day, 8:36:44", "remaining_time": "1 day, 15:41:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4343, "total_steps": 9627, "loss": 1.7403, "learning_rate": 5.764681938145832e-05, "epoch": 0.4511270385374468, "percentage": 45.11, "elapsed_time": "1 day, 8:37:12", "remaining_time": "1 day, 15:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4344, "total_steps": 9627, "loss": 1.5556, "learning_rate": 5.763069435077155e-05, "epoch": 0.4512309130570271, "percentage": 45.12, "elapsed_time": "1 day, 8:37:40", "remaining_time": "1 day, 15:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4345, "total_steps": 9627, "loss": 1.6155, "learning_rate": 5.761456850747536e-05, "epoch": 0.45133478757660744, "percentage": 45.13, "elapsed_time": "1 day, 8:38:09", "remaining_time": "1 day, 15:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4346, "total_steps": 9627, "loss": 1.462, "learning_rate": 5.759844185328701e-05, "epoch": 0.4514386620961878, "percentage": 45.14, "elapsed_time": "1 day, 8:38:36", "remaining_time": "1 day, 15:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4347, "total_steps": 9627, "loss": 1.6177, "learning_rate": 5.7582314389923876e-05, "epoch": 0.45154253661576815, "percentage": 45.15, "elapsed_time": "1 day, 8:39:05", "remaining_time": "1 day, 15:39:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4348, "total_steps": 9627, "loss": 1.782, "learning_rate": 5.756618611910343e-05, "epoch": 0.4516464111353485, "percentage": 45.16, "elapsed_time": "1 day, 8:39:33", "remaining_time": "1 day, 15:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4349, "total_steps": 9627, "loss": 1.7076, "learning_rate": 5.7550057042543137e-05, "epoch": 0.45175028565492886, "percentage": 45.18, "elapsed_time": "1 day, 8:40:01", "remaining_time": "1 day, 15:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4350, "total_steps": 9627, "loss": 1.6074, "learning_rate": 5.753392716196069e-05, "epoch": 0.4518541601745092, "percentage": 45.19, "elapsed_time": "1 day, 8:40:28", "remaining_time": "1 day, 15:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4351, "total_steps": 9627, "loss": 1.8871, "learning_rate": 5.751779647907376e-05, "epoch": 0.4519580346940895, "percentage": 45.2, "elapsed_time": "1 day, 8:40:57", "remaining_time": "1 day, 15:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4352, "total_steps": 9627, "loss": 1.7228, "learning_rate": 5.7501664995600134e-05, "epoch": 0.4520619092136699, "percentage": 45.21, "elapsed_time": "1 day, 8:41:25", "remaining_time": "1 day, 15:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4353, "total_steps": 9627, "loss": 1.5237, "learning_rate": 5.748553271325772e-05, "epoch": 0.4521657837332502, "percentage": 45.22, "elapsed_time": "1 day, 8:41:52", "remaining_time": "1 day, 15:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4354, "total_steps": 9627, "loss": 1.6773, "learning_rate": 5.746939963376445e-05, "epoch": 0.45226965825283055, "percentage": 45.23, "elapsed_time": "1 day, 8:42:21", "remaining_time": "1 day, 15:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4355, "total_steps": 9627, "loss": 1.7949, "learning_rate": 5.745326575883839e-05, "epoch": 0.45237353277241094, "percentage": 45.24, "elapsed_time": "1 day, 8:42:48", "remaining_time": "1 day, 15:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4356, "total_steps": 9627, "loss": 1.6454, "learning_rate": 5.743713109019766e-05, "epoch": 0.45247740729199126, "percentage": 45.25, "elapsed_time": "1 day, 8:43:17", "remaining_time": "1 day, 15:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4357, "total_steps": 9627, "loss": 1.6265, "learning_rate": 5.742099562956048e-05, "epoch": 0.45258128181157165, "percentage": 45.26, "elapsed_time": "1 day, 8:43:45", "remaining_time": "1 day, 15:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4358, "total_steps": 9627, "loss": 1.6872, "learning_rate": 5.740485937864515e-05, "epoch": 0.45268515633115197, "percentage": 45.27, "elapsed_time": "1 day, 8:44:12", "remaining_time": "1 day, 15:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4359, "total_steps": 9627, "loss": 1.8138, "learning_rate": 5.7388722339170066e-05, "epoch": 0.4527890308507323, "percentage": 45.28, "elapsed_time": "1 day, 8:44:41", "remaining_time": "1 day, 15:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4360, "total_steps": 9627, "loss": 1.5788, "learning_rate": 5.7372584512853665e-05, "epoch": 0.4528929053703127, "percentage": 45.29, "elapsed_time": "1 day, 8:45:09", "remaining_time": "1 day, 15:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4361, "total_steps": 9627, "loss": 1.8203, "learning_rate": 5.7356445901414545e-05, "epoch": 0.452996779889893, "percentage": 45.3, "elapsed_time": "1 day, 8:45:36", "remaining_time": "1 day, 15:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4362, "total_steps": 9627, "loss": 1.6614, "learning_rate": 5.734030650657132e-05, "epoch": 0.45310065440947334, "percentage": 45.31, "elapsed_time": "1 day, 8:46:06", "remaining_time": "1 day, 15:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4363, "total_steps": 9627, "loss": 1.851, "learning_rate": 5.73241663300427e-05, "epoch": 0.4532045289290537, "percentage": 45.32, "elapsed_time": "1 day, 8:46:32", "remaining_time": "1 day, 15:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4364, "total_steps": 9627, "loss": 1.6255, "learning_rate": 5.730802537354749e-05, "epoch": 0.45330840344863405, "percentage": 45.33, "elapsed_time": "1 day, 8:47:01", "remaining_time": "1 day, 15:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4365, "total_steps": 9627, "loss": 1.4243, "learning_rate": 5.729188363880459e-05, "epoch": 0.45341227796821437, "percentage": 45.34, "elapsed_time": "1 day, 8:47:29", "remaining_time": "1 day, 15:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4366, "total_steps": 9627, "loss": 1.8354, "learning_rate": 5.727574112753296e-05, "epoch": 0.45351615248779475, "percentage": 45.35, "elapsed_time": "1 day, 8:47:56", "remaining_time": "1 day, 15:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4367, "total_steps": 9627, "loss": 1.5944, "learning_rate": 5.725959784145165e-05, "epoch": 0.4536200270073751, "percentage": 45.36, "elapsed_time": "1 day, 8:48:24", "remaining_time": "1 day, 15:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4368, "total_steps": 9627, "loss": 1.7066, "learning_rate": 5.72434537822798e-05, "epoch": 0.45372390152695546, "percentage": 45.37, "elapsed_time": "1 day, 8:48:52", "remaining_time": "1 day, 15:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4369, "total_steps": 9627, "loss": 1.7554, "learning_rate": 5.722730895173662e-05, "epoch": 0.4538277760465358, "percentage": 45.38, "elapsed_time": "1 day, 8:49:20", "remaining_time": "1 day, 15:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4370, "total_steps": 9627, "loss": 1.4915, "learning_rate": 5.721116335154142e-05, "epoch": 0.4539316505661161, "percentage": 45.39, "elapsed_time": "1 day, 8:49:48", "remaining_time": "1 day, 15:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4371, "total_steps": 9627, "loss": 1.6267, "learning_rate": 5.719501698341356e-05, "epoch": 0.4540355250856965, "percentage": 45.4, "elapsed_time": "1 day, 8:50:15", "remaining_time": "1 day, 15:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4372, "total_steps": 9627, "loss": 1.6264, "learning_rate": 5.7178869849072526e-05, "epoch": 0.45413939960527683, "percentage": 45.41, "elapsed_time": "1 day, 8:50:43", "remaining_time": "1 day, 15:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4373, "total_steps": 9627, "loss": 1.7784, "learning_rate": 5.716272195023785e-05, "epoch": 0.45424327412485715, "percentage": 45.42, "elapsed_time": "1 day, 8:51:12", "remaining_time": "1 day, 15:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4374, "total_steps": 9627, "loss": 1.7885, "learning_rate": 5.7146573288629145e-05, "epoch": 0.45434714864443754, "percentage": 45.43, "elapsed_time": "1 day, 8:51:39", "remaining_time": "1 day, 15:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4375, "total_steps": 9627, "loss": 1.6938, "learning_rate": 5.713042386596614e-05, "epoch": 0.45445102316401786, "percentage": 45.45, "elapsed_time": "1 day, 8:52:08", "remaining_time": "1 day, 15:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4376, "total_steps": 9627, "loss": 1.5404, "learning_rate": 5.7114273683968625e-05, "epoch": 0.4545548976835982, "percentage": 45.46, "elapsed_time": "1 day, 8:52:36", "remaining_time": "1 day, 15:27:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4377, "total_steps": 9627, "loss": 1.6948, "learning_rate": 5.709812274435643e-05, "epoch": 0.4546587722031786, "percentage": 45.47, "elapsed_time": "1 day, 8:53:03", "remaining_time": "1 day, 15:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4378, "total_steps": 9627, "loss": 1.6687, "learning_rate": 5.708197104884955e-05, "epoch": 0.4547626467227589, "percentage": 45.48, "elapsed_time": "1 day, 8:53:32", "remaining_time": "1 day, 15:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4379, "total_steps": 9627, "loss": 1.5973, "learning_rate": 5.706581859916799e-05, "epoch": 0.45486652124233923, "percentage": 45.49, "elapsed_time": "1 day, 8:53:59", "remaining_time": "1 day, 15:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4380, "total_steps": 9627, "loss": 1.6266, "learning_rate": 5.704966539703185e-05, "epoch": 0.4549703957619196, "percentage": 45.5, "elapsed_time": "1 day, 8:54:28", "remaining_time": "1 day, 15:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4381, "total_steps": 9627, "loss": 1.7119, "learning_rate": 5.7033511444161355e-05, "epoch": 0.45507427028149994, "percentage": 45.51, "elapsed_time": "1 day, 8:54:54", "remaining_time": "1 day, 15:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4382, "total_steps": 9627, "loss": 1.9857, "learning_rate": 5.701735674227675e-05, "epoch": 0.4551781448010803, "percentage": 45.52, "elapsed_time": "1 day, 8:55:24", "remaining_time": "1 day, 15:24:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4383, "total_steps": 9627, "loss": 1.9188, "learning_rate": 5.7001201293098386e-05, "epoch": 0.45528201932066065, "percentage": 45.53, "elapsed_time": "1 day, 8:55:50", "remaining_time": "1 day, 15:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4384, "total_steps": 9627, "loss": 1.7152, "learning_rate": 5.69850450983467e-05, "epoch": 0.455385893840241, "percentage": 45.54, "elapsed_time": "1 day, 8:56:19", "remaining_time": "1 day, 15:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4385, "total_steps": 9627, "loss": 1.7644, "learning_rate": 5.6968888159742184e-05, "epoch": 0.45548976835982136, "percentage": 45.55, "elapsed_time": "1 day, 8:56:47", "remaining_time": "1 day, 15:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4386, "total_steps": 9627, "loss": 1.6811, "learning_rate": 5.695273047900544e-05, "epoch": 0.4555936428794017, "percentage": 45.56, "elapsed_time": "1 day, 8:57:15", "remaining_time": "1 day, 15:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4387, "total_steps": 9627, "loss": 1.8516, "learning_rate": 5.693657205785715e-05, "epoch": 0.455697517398982, "percentage": 45.57, "elapsed_time": "1 day, 8:57:43", "remaining_time": "1 day, 15:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4388, "total_steps": 9627, "loss": 1.8134, "learning_rate": 5.6920412898018026e-05, "epoch": 0.4558013919185624, "percentage": 45.58, "elapsed_time": "1 day, 8:58:12", "remaining_time": "1 day, 15:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4389, "total_steps": 9627, "loss": 1.8296, "learning_rate": 5.690425300120893e-05, "epoch": 0.4559052664381427, "percentage": 45.59, "elapsed_time": "1 day, 8:58:39", "remaining_time": "1 day, 15:21:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4390, "total_steps": 9627, "loss": 1.7926, "learning_rate": 5.6888092369150734e-05, "epoch": 0.45600914095772305, "percentage": 45.6, "elapsed_time": "1 day, 8:59:07", "remaining_time": "1 day, 15:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4391, "total_steps": 9627, "loss": 1.8088, "learning_rate": 5.6871931003564414e-05, "epoch": 0.45611301547730343, "percentage": 45.61, "elapsed_time": "1 day, 8:59:35", "remaining_time": "1 day, 15:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4392, "total_steps": 9627, "loss": 1.5183, "learning_rate": 5.685576890617107e-05, "epoch": 0.45621688999688376, "percentage": 45.62, "elapsed_time": "1 day, 9:00:03", "remaining_time": "1 day, 15:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4393, "total_steps": 9627, "loss": 1.6363, "learning_rate": 5.683960607869179e-05, "epoch": 0.45632076451646414, "percentage": 45.63, "elapsed_time": "1 day, 9:00:31", "remaining_time": "1 day, 15:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4394, "total_steps": 9627, "loss": 1.5937, "learning_rate": 5.6823442522847835e-05, "epoch": 0.45642463903604447, "percentage": 45.64, "elapsed_time": "1 day, 9:00:58", "remaining_time": "1 day, 15:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4395, "total_steps": 9627, "loss": 1.723, "learning_rate": 5.680727824036046e-05, "epoch": 0.4565285135556248, "percentage": 45.65, "elapsed_time": "1 day, 9:01:27", "remaining_time": "1 day, 15:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4396, "total_steps": 9627, "loss": 1.5769, "learning_rate": 5.6791113232951063e-05, "epoch": 0.4566323880752052, "percentage": 45.66, "elapsed_time": "1 day, 9:01:55", "remaining_time": "1 day, 15:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4397, "total_steps": 9627, "loss": 1.7898, "learning_rate": 5.677494750234108e-05, "epoch": 0.4567362625947855, "percentage": 45.67, "elapsed_time": "1 day, 9:02:22", "remaining_time": "1 day, 15:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4398, "total_steps": 9627, "loss": 1.7079, "learning_rate": 5.675878105025203e-05, "epoch": 0.45684013711436583, "percentage": 45.68, "elapsed_time": "1 day, 9:02:51", "remaining_time": "1 day, 15:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4399, "total_steps": 9627, "loss": 1.5216, "learning_rate": 5.674261387840551e-05, "epoch": 0.4569440116339462, "percentage": 45.69, "elapsed_time": "1 day, 9:03:18", "remaining_time": "1 day, 15:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4400, "total_steps": 9627, "loss": 1.6415, "learning_rate": 5.6726445988523224e-05, "epoch": 0.45704788615352654, "percentage": 45.7, "elapsed_time": "1 day, 9:03:47", "remaining_time": "1 day, 15:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4401, "total_steps": 9627, "loss": 1.7626, "learning_rate": 5.67102773823269e-05, "epoch": 0.45715176067310687, "percentage": 45.72, "elapsed_time": "1 day, 9:04:14", "remaining_time": "1 day, 15:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4402, "total_steps": 9627, "loss": 1.6487, "learning_rate": 5.669410806153838e-05, "epoch": 0.45725563519268725, "percentage": 45.73, "elapsed_time": "1 day, 9:04:42", "remaining_time": "1 day, 15:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4403, "total_steps": 9627, "loss": 1.7431, "learning_rate": 5.667793802787957e-05, "epoch": 0.4573595097122676, "percentage": 45.74, "elapsed_time": "1 day, 9:05:10", "remaining_time": "1 day, 15:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4404, "total_steps": 9627, "loss": 1.6595, "learning_rate": 5.6661767283072444e-05, "epoch": 0.4574633842318479, "percentage": 45.75, "elapsed_time": "1 day, 9:05:39", "remaining_time": "1 day, 15:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4405, "total_steps": 9627, "loss": 1.8235, "learning_rate": 5.664559582883906e-05, "epoch": 0.4575672587514283, "percentage": 45.76, "elapsed_time": "1 day, 9:06:06", "remaining_time": "1 day, 15:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4406, "total_steps": 9627, "loss": 1.7427, "learning_rate": 5.662942366690157e-05, "epoch": 0.4576711332710086, "percentage": 45.77, "elapsed_time": "1 day, 9:06:34", "remaining_time": "1 day, 15:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4407, "total_steps": 9627, "loss": 1.7745, "learning_rate": 5.6613250798982156e-05, "epoch": 0.457775007790589, "percentage": 45.78, "elapsed_time": "1 day, 9:07:02", "remaining_time": "1 day, 15:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4408, "total_steps": 9627, "loss": 1.7777, "learning_rate": 5.659707722680313e-05, "epoch": 0.4578788823101693, "percentage": 45.79, "elapsed_time": "1 day, 9:07:30", "remaining_time": "1 day, 15:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4409, "total_steps": 9627, "loss": 1.5845, "learning_rate": 5.6580902952086836e-05, "epoch": 0.45798275682974965, "percentage": 45.8, "elapsed_time": "1 day, 9:07:58", "remaining_time": "1 day, 15:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4410, "total_steps": 9627, "loss": 1.5669, "learning_rate": 5.656472797655571e-05, "epoch": 0.45808663134933003, "percentage": 45.81, "elapsed_time": "1 day, 9:08:25", "remaining_time": "1 day, 15:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4411, "total_steps": 9627, "loss": 1.5851, "learning_rate": 5.6548552301932265e-05, "epoch": 0.45819050586891036, "percentage": 45.82, "elapsed_time": "1 day, 9:08:54", "remaining_time": "1 day, 15:11:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4412, "total_steps": 9627, "loss": 1.8875, "learning_rate": 5.6532375929939075e-05, "epoch": 0.4582943803884907, "percentage": 45.83, "elapsed_time": "1 day, 9:09:21", "remaining_time": "1 day, 15:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4413, "total_steps": 9627, "loss": 1.6262, "learning_rate": 5.65161988622988e-05, "epoch": 0.45839825490807107, "percentage": 45.84, "elapsed_time": "1 day, 9:09:49", "remaining_time": "1 day, 15:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4414, "total_steps": 9627, "loss": 1.5766, "learning_rate": 5.650002110073418e-05, "epoch": 0.4585021294276514, "percentage": 45.85, "elapsed_time": "1 day, 9:10:17", "remaining_time": "1 day, 15:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4415, "total_steps": 9627, "loss": 1.5854, "learning_rate": 5.648384264696802e-05, "epoch": 0.4586060039472317, "percentage": 45.86, "elapsed_time": "1 day, 9:10:45", "remaining_time": "1 day, 15:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4416, "total_steps": 9627, "loss": 1.6934, "learning_rate": 5.6467663502723175e-05, "epoch": 0.4587098784668121, "percentage": 45.87, "elapsed_time": "1 day, 9:11:12", "remaining_time": "1 day, 15:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4417, "total_steps": 9627, "loss": 1.7554, "learning_rate": 5.645148366972264e-05, "epoch": 0.45881375298639243, "percentage": 45.88, "elapsed_time": "1 day, 9:11:41", "remaining_time": "1 day, 15:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4418, "total_steps": 9627, "loss": 1.4804, "learning_rate": 5.643530314968941e-05, "epoch": 0.45891762750597276, "percentage": 45.89, "elapsed_time": "1 day, 9:12:09", "remaining_time": "1 day, 15:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4419, "total_steps": 9627, "loss": 1.6639, "learning_rate": 5.6419121944346585e-05, "epoch": 0.45902150202555314, "percentage": 45.9, "elapsed_time": "1 day, 9:12:36", "remaining_time": "1 day, 15:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4420, "total_steps": 9627, "loss": 1.7626, "learning_rate": 5.640294005541735e-05, "epoch": 0.45912537654513347, "percentage": 45.91, "elapsed_time": "1 day, 9:13:05", "remaining_time": "1 day, 15:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4421, "total_steps": 9627, "loss": 1.7363, "learning_rate": 5.638675748462493e-05, "epoch": 0.45922925106471385, "percentage": 45.92, "elapsed_time": "1 day, 9:13:32", "remaining_time": "1 day, 15:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4422, "total_steps": 9627, "loss": 1.725, "learning_rate": 5.637057423369268e-05, "epoch": 0.4593331255842942, "percentage": 45.93, "elapsed_time": "1 day, 9:14:01", "remaining_time": "1 day, 15:07:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4423, "total_steps": 9627, "loss": 1.8253, "learning_rate": 5.635439030434395e-05, "epoch": 0.4594370001038745, "percentage": 45.94, "elapsed_time": "1 day, 9:14:28", "remaining_time": "1 day, 15:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4424, "total_steps": 9627, "loss": 1.6797, "learning_rate": 5.6338205698302224e-05, "epoch": 0.4595408746234549, "percentage": 45.95, "elapsed_time": "1 day, 9:14:56", "remaining_time": "1 day, 15:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4425, "total_steps": 9627, "loss": 1.7569, "learning_rate": 5.6322020417291034e-05, "epoch": 0.4596447491430352, "percentage": 45.96, "elapsed_time": "1 day, 9:15:23", "remaining_time": "1 day, 15:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4426, "total_steps": 9627, "loss": 1.8999, "learning_rate": 5.630583446303399e-05, "epoch": 0.45974862366261554, "percentage": 45.97, "elapsed_time": "1 day, 9:15:52", "remaining_time": "1 day, 15:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4427, "total_steps": 9627, "loss": 1.5374, "learning_rate": 5.6289647837254744e-05, "epoch": 0.4598524981821959, "percentage": 45.99, "elapsed_time": "1 day, 9:16:20", "remaining_time": "1 day, 15:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4428, "total_steps": 9627, "loss": 1.7143, "learning_rate": 5.627346054167707e-05, "epoch": 0.45995637270177625, "percentage": 46.0, "elapsed_time": "1 day, 9:16:48", "remaining_time": "1 day, 15:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4429, "total_steps": 9627, "loss": 1.8177, "learning_rate": 5.625727257802479e-05, "epoch": 0.4600602472213566, "percentage": 46.01, "elapsed_time": "1 day, 9:17:15", "remaining_time": "1 day, 15:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4430, "total_steps": 9627, "loss": 1.8531, "learning_rate": 5.624108394802178e-05, "epoch": 0.46016412174093696, "percentage": 46.02, "elapsed_time": "1 day, 9:17:44", "remaining_time": "1 day, 15:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4431, "total_steps": 9627, "loss": 1.6969, "learning_rate": 5.6224894653392035e-05, "epoch": 0.4602679962605173, "percentage": 46.03, "elapsed_time": "1 day, 9:18:11", "remaining_time": "1 day, 15:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4432, "total_steps": 9627, "loss": 1.5994, "learning_rate": 5.6208704695859535e-05, "epoch": 0.46037187078009767, "percentage": 46.04, "elapsed_time": "1 day, 9:18:39", "remaining_time": "1 day, 15:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4433, "total_steps": 9627, "loss": 1.6662, "learning_rate": 5.619251407714843e-05, "epoch": 0.460475745299678, "percentage": 46.05, "elapsed_time": "1 day, 9:19:07", "remaining_time": "1 day, 15:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4434, "total_steps": 9627, "loss": 1.7509, "learning_rate": 5.617632279898288e-05, "epoch": 0.4605796198192583, "percentage": 46.06, "elapsed_time": "1 day, 9:19:34", "remaining_time": "1 day, 15:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4435, "total_steps": 9627, "loss": 1.6896, "learning_rate": 5.6160130863087115e-05, "epoch": 0.4606834943388387, "percentage": 46.07, "elapsed_time": "1 day, 9:20:03", "remaining_time": "1 day, 15:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4436, "total_steps": 9627, "loss": 1.6231, "learning_rate": 5.614393827118548e-05, "epoch": 0.46078736885841903, "percentage": 46.08, "elapsed_time": "1 day, 9:20:30", "remaining_time": "1 day, 15:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4437, "total_steps": 9627, "loss": 1.6131, "learning_rate": 5.6127745025002344e-05, "epoch": 0.46089124337799936, "percentage": 46.09, "elapsed_time": "1 day, 9:20:58", "remaining_time": "1 day, 15:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4438, "total_steps": 9627, "loss": 1.7206, "learning_rate": 5.611155112626215e-05, "epoch": 0.46099511789757974, "percentage": 46.1, "elapsed_time": "1 day, 9:21:26", "remaining_time": "1 day, 15:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4439, "total_steps": 9627, "loss": 1.6558, "learning_rate": 5.609535657668945e-05, "epoch": 0.46109899241716007, "percentage": 46.11, "elapsed_time": "1 day, 9:21:53", "remaining_time": "1 day, 14:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4440, "total_steps": 9627, "loss": 1.7243, "learning_rate": 5.6079161378008805e-05, "epoch": 0.4612028669367404, "percentage": 46.12, "elapsed_time": "1 day, 9:22:22", "remaining_time": "1 day, 14:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4441, "total_steps": 9627, "loss": 1.7576, "learning_rate": 5.606296553194489e-05, "epoch": 0.4613067414563208, "percentage": 46.13, "elapsed_time": "1 day, 9:22:49", "remaining_time": "1 day, 14:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4442, "total_steps": 9627, "loss": 1.5866, "learning_rate": 5.6046769040222446e-05, "epoch": 0.4614106159759011, "percentage": 46.14, "elapsed_time": "1 day, 9:23:17", "remaining_time": "1 day, 14:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4443, "total_steps": 9627, "loss": 1.6697, "learning_rate": 5.603057190456628e-05, "epoch": 0.46151449049548143, "percentage": 46.15, "elapsed_time": "1 day, 9:23:45", "remaining_time": "1 day, 14:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4444, "total_steps": 9627, "loss": 1.4743, "learning_rate": 5.601437412670121e-05, "epoch": 0.4616183650150618, "percentage": 46.16, "elapsed_time": "1 day, 9:24:13", "remaining_time": "1 day, 14:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4445, "total_steps": 9627, "loss": 1.7079, "learning_rate": 5.5998175708352255e-05, "epoch": 0.46172223953464214, "percentage": 46.17, "elapsed_time": "1 day, 9:24:40", "remaining_time": "1 day, 14:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4446, "total_steps": 9627, "loss": 1.6898, "learning_rate": 5.598197665124434e-05, "epoch": 0.4618261140542225, "percentage": 46.18, "elapsed_time": "1 day, 9:25:08", "remaining_time": "1 day, 14:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4447, "total_steps": 9627, "loss": 1.686, "learning_rate": 5.596577695710258e-05, "epoch": 0.46192998857380285, "percentage": 46.19, "elapsed_time": "1 day, 9:25:37", "remaining_time": "1 day, 14:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4448, "total_steps": 9627, "loss": 1.6314, "learning_rate": 5.594957662765211e-05, "epoch": 0.4620338630933832, "percentage": 46.2, "elapsed_time": "1 day, 9:26:04", "remaining_time": "1 day, 14:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4449, "total_steps": 9627, "loss": 1.6829, "learning_rate": 5.5933375664618134e-05, "epoch": 0.46213773761296356, "percentage": 46.21, "elapsed_time": "1 day, 9:26:31", "remaining_time": "1 day, 14:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4450, "total_steps": 9627, "loss": 1.9202, "learning_rate": 5.591717406972594e-05, "epoch": 0.4622416121325439, "percentage": 46.22, "elapsed_time": "1 day, 9:26:59", "remaining_time": "1 day, 14:54:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4451, "total_steps": 9627, "loss": 1.7383, "learning_rate": 5.590097184470087e-05, "epoch": 0.4623454866521242, "percentage": 46.23, "elapsed_time": "1 day, 9:27:26", "remaining_time": "1 day, 14:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4452, "total_steps": 9627, "loss": 1.7811, "learning_rate": 5.588476899126832e-05, "epoch": 0.4624493611717046, "percentage": 46.24, "elapsed_time": "1 day, 9:27:53", "remaining_time": "1 day, 14:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4453, "total_steps": 9627, "loss": 1.6378, "learning_rate": 5.586856551115378e-05, "epoch": 0.4625532356912849, "percentage": 46.26, "elapsed_time": "1 day, 9:28:23", "remaining_time": "1 day, 14:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4454, "total_steps": 9627, "loss": 1.7076, "learning_rate": 5.585236140608279e-05, "epoch": 0.46265711021086525, "percentage": 46.27, "elapsed_time": "1 day, 9:28:50", "remaining_time": "1 day, 14:53:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4455, "total_steps": 9627, "loss": 1.7697, "learning_rate": 5.583615667778094e-05, "epoch": 0.46276098473044563, "percentage": 46.28, "elapsed_time": "1 day, 9:29:18", "remaining_time": "1 day, 14:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4456, "total_steps": 9627, "loss": 1.5478, "learning_rate": 5.581995132797394e-05, "epoch": 0.46286485925002596, "percentage": 46.29, "elapsed_time": "1 day, 9:29:46", "remaining_time": "1 day, 14:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4457, "total_steps": 9627, "loss": 1.7247, "learning_rate": 5.5803745358387526e-05, "epoch": 0.4629687337696063, "percentage": 46.3, "elapsed_time": "1 day, 9:30:13", "remaining_time": "1 day, 14:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4458, "total_steps": 9627, "loss": 1.768, "learning_rate": 5.578753877074749e-05, "epoch": 0.46307260828918667, "percentage": 46.31, "elapsed_time": "1 day, 9:30:41", "remaining_time": "1 day, 14:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4459, "total_steps": 9627, "loss": 1.7182, "learning_rate": 5.577133156677975e-05, "epoch": 0.463176482808767, "percentage": 46.32, "elapsed_time": "1 day, 9:31:09", "remaining_time": "1 day, 14:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4460, "total_steps": 9627, "loss": 1.8411, "learning_rate": 5.575512374821018e-05, "epoch": 0.4632803573283474, "percentage": 46.33, "elapsed_time": "1 day, 9:31:37", "remaining_time": "1 day, 14:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4461, "total_steps": 9627, "loss": 1.6013, "learning_rate": 5.573891531676484e-05, "epoch": 0.4633842318479277, "percentage": 46.34, "elapsed_time": "1 day, 9:32:04", "remaining_time": "1 day, 14:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4462, "total_steps": 9627, "loss": 1.8274, "learning_rate": 5.572270627416979e-05, "epoch": 0.46348810636750803, "percentage": 46.35, "elapsed_time": "1 day, 9:32:32", "remaining_time": "1 day, 14:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4463, "total_steps": 9627, "loss": 1.8865, "learning_rate": 5.5706496622151136e-05, "epoch": 0.4635919808870884, "percentage": 46.36, "elapsed_time": "1 day, 9:33:00", "remaining_time": "1 day, 14:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4464, "total_steps": 9627, "loss": 1.6921, "learning_rate": 5.569028636243513e-05, "epoch": 0.46369585540666874, "percentage": 46.37, "elapsed_time": "1 day, 9:33:27", "remaining_time": "1 day, 14:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4465, "total_steps": 9627, "loss": 1.6099, "learning_rate": 5.5674075496748e-05, "epoch": 0.46379972992624907, "percentage": 46.38, "elapsed_time": "1 day, 9:33:54", "remaining_time": "1 day, 14:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4466, "total_steps": 9627, "loss": 1.7032, "learning_rate": 5.56578640268161e-05, "epoch": 0.46390360444582945, "percentage": 46.39, "elapsed_time": "1 day, 9:34:23", "remaining_time": "1 day, 14:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4467, "total_steps": 9627, "loss": 1.7474, "learning_rate": 5.5641651954365803e-05, "epoch": 0.4640074789654098, "percentage": 46.4, "elapsed_time": "1 day, 9:34:50", "remaining_time": "1 day, 14:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4468, "total_steps": 9627, "loss": 1.7868, "learning_rate": 5.562543928112358e-05, "epoch": 0.4641113534849901, "percentage": 46.41, "elapsed_time": "1 day, 9:35:19", "remaining_time": "1 day, 14:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4469, "total_steps": 9627, "loss": 1.684, "learning_rate": 5.560922600881595e-05, "epoch": 0.4642152280045705, "percentage": 46.42, "elapsed_time": "1 day, 9:35:46", "remaining_time": "1 day, 14:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4470, "total_steps": 9627, "loss": 1.601, "learning_rate": 5.559301213916952e-05, "epoch": 0.4643191025241508, "percentage": 46.43, "elapsed_time": "1 day, 9:36:14", "remaining_time": "1 day, 14:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4471, "total_steps": 9627, "loss": 1.773, "learning_rate": 5.557679767391091e-05, "epoch": 0.4644229770437312, "percentage": 46.44, "elapsed_time": "1 day, 9:36:41", "remaining_time": "1 day, 14:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4472, "total_steps": 9627, "loss": 1.7059, "learning_rate": 5.5560582614766845e-05, "epoch": 0.4645268515633115, "percentage": 46.45, "elapsed_time": "1 day, 9:37:10", "remaining_time": "1 day, 14:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4473, "total_steps": 9627, "loss": 1.7463, "learning_rate": 5.5544366963464134e-05, "epoch": 0.46463072608289185, "percentage": 46.46, "elapsed_time": "1 day, 9:37:37", "remaining_time": "1 day, 14:44:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4474, "total_steps": 9627, "loss": 1.6543, "learning_rate": 5.552815072172955e-05, "epoch": 0.46473460060247224, "percentage": 46.47, "elapsed_time": "1 day, 9:38:06", "remaining_time": "1 day, 14:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4475, "total_steps": 9627, "loss": 1.6462, "learning_rate": 5.5511933891290056e-05, "epoch": 0.46483847512205256, "percentage": 46.48, "elapsed_time": "1 day, 9:38:33", "remaining_time": "1 day, 14:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4476, "total_steps": 9627, "loss": 1.656, "learning_rate": 5.5495716473872604e-05, "epoch": 0.4649423496416329, "percentage": 46.49, "elapsed_time": "1 day, 9:39:01", "remaining_time": "1 day, 14:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4477, "total_steps": 9627, "loss": 1.7544, "learning_rate": 5.5479498471204196e-05, "epoch": 0.4650462241612133, "percentage": 46.5, "elapsed_time": "1 day, 9:39:28", "remaining_time": "1 day, 14:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4478, "total_steps": 9627, "loss": 1.5076, "learning_rate": 5.546327988501196e-05, "epoch": 0.4651500986807936, "percentage": 46.52, "elapsed_time": "1 day, 9:39:57", "remaining_time": "1 day, 14:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4479, "total_steps": 9627, "loss": 1.638, "learning_rate": 5.544706071702302e-05, "epoch": 0.4652539732003739, "percentage": 46.53, "elapsed_time": "1 day, 9:40:23", "remaining_time": "1 day, 14:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4480, "total_steps": 9627, "loss": 1.5985, "learning_rate": 5.5430840968964615e-05, "epoch": 0.4653578477199543, "percentage": 46.54, "elapsed_time": "1 day, 9:40:52", "remaining_time": "1 day, 14:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4481, "total_steps": 9627, "loss": 1.7247, "learning_rate": 5.541462064256401e-05, "epoch": 0.46546172223953464, "percentage": 46.55, "elapsed_time": "1 day, 9:41:19", "remaining_time": "1 day, 14:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4482, "total_steps": 9627, "loss": 1.8184, "learning_rate": 5.5398399739548524e-05, "epoch": 0.46556559675911496, "percentage": 46.56, "elapsed_time": "1 day, 9:41:47", "remaining_time": "1 day, 14:40:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4483, "total_steps": 9627, "loss": 1.8839, "learning_rate": 5.538217826164558e-05, "epoch": 0.46566947127869535, "percentage": 46.57, "elapsed_time": "1 day, 9:42:14", "remaining_time": "1 day, 14:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4484, "total_steps": 9627, "loss": 1.5911, "learning_rate": 5.5365956210582634e-05, "epoch": 0.4657733457982757, "percentage": 46.58, "elapsed_time": "1 day, 9:42:42", "remaining_time": "1 day, 14:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4485, "total_steps": 9627, "loss": 1.7894, "learning_rate": 5.5349733588087216e-05, "epoch": 0.46587722031785606, "percentage": 46.59, "elapsed_time": "1 day, 9:43:09", "remaining_time": "1 day, 14:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4486, "total_steps": 9627, "loss": 1.7112, "learning_rate": 5.533351039588689e-05, "epoch": 0.4659810948374364, "percentage": 46.6, "elapsed_time": "1 day, 9:43:38", "remaining_time": "1 day, 14:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4487, "total_steps": 9627, "loss": 1.7559, "learning_rate": 5.531728663570933e-05, "epoch": 0.4660849693570167, "percentage": 46.61, "elapsed_time": "1 day, 9:44:06", "remaining_time": "1 day, 14:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4488, "total_steps": 9627, "loss": 1.6631, "learning_rate": 5.53010623092822e-05, "epoch": 0.4661888438765971, "percentage": 46.62, "elapsed_time": "1 day, 9:44:33", "remaining_time": "1 day, 14:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4489, "total_steps": 9627, "loss": 1.736, "learning_rate": 5.5284837418333294e-05, "epoch": 0.4662927183961774, "percentage": 46.63, "elapsed_time": "1 day, 9:45:01", "remaining_time": "1 day, 14:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4490, "total_steps": 9627, "loss": 1.8165, "learning_rate": 5.5268611964590425e-05, "epoch": 0.46639659291575775, "percentage": 46.64, "elapsed_time": "1 day, 9:45:29", "remaining_time": "1 day, 14:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4491, "total_steps": 9627, "loss": 1.8559, "learning_rate": 5.525238594978146e-05, "epoch": 0.46650046743533813, "percentage": 46.65, "elapsed_time": "1 day, 9:45:57", "remaining_time": "1 day, 14:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4492, "total_steps": 9627, "loss": 1.5622, "learning_rate": 5.523615937563438e-05, "epoch": 0.46660434195491846, "percentage": 46.66, "elapsed_time": "1 day, 9:46:24", "remaining_time": "1 day, 14:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4493, "total_steps": 9627, "loss": 1.6647, "learning_rate": 5.521993224387717e-05, "epoch": 0.4667082164744988, "percentage": 46.67, "elapsed_time": "1 day, 9:46:52", "remaining_time": "1 day, 14:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4494, "total_steps": 9627, "loss": 1.7663, "learning_rate": 5.520370455623789e-05, "epoch": 0.46681209099407917, "percentage": 46.68, "elapsed_time": "1 day, 9:47:20", "remaining_time": "1 day, 14:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4495, "total_steps": 9627, "loss": 1.8218, "learning_rate": 5.518747631444467e-05, "epoch": 0.4669159655136595, "percentage": 46.69, "elapsed_time": "1 day, 9:47:48", "remaining_time": "1 day, 14:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4496, "total_steps": 9627, "loss": 1.6427, "learning_rate": 5.517124752022569e-05, "epoch": 0.4670198400332398, "percentage": 46.7, "elapsed_time": "1 day, 9:48:15", "remaining_time": "1 day, 14:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4497, "total_steps": 9627, "loss": 1.5317, "learning_rate": 5.515501817530917e-05, "epoch": 0.4671237145528202, "percentage": 46.71, "elapsed_time": "1 day, 9:48:44", "remaining_time": "1 day, 14:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4498, "total_steps": 9627, "loss": 1.736, "learning_rate": 5.513878828142344e-05, "epoch": 0.46722758907240053, "percentage": 46.72, "elapsed_time": "1 day, 9:49:11", "remaining_time": "1 day, 14:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4499, "total_steps": 9627, "loss": 1.7212, "learning_rate": 5.5122557840296815e-05, "epoch": 0.4673314635919809, "percentage": 46.73, "elapsed_time": "1 day, 9:49:40", "remaining_time": "1 day, 14:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4500, "total_steps": 9627, "loss": 1.6732, "learning_rate": 5.5106326853657764e-05, "epoch": 0.46743533811156124, "percentage": 46.74, "elapsed_time": "1 day, 9:50:07", "remaining_time": "1 day, 14:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4501, "total_steps": 9627, "loss": 1.8326, "learning_rate": 5.5090095323234735e-05, "epoch": 0.46753921263114157, "percentage": 46.75, "elapsed_time": "1 day, 9:50:34", "remaining_time": "1 day, 14:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4502, "total_steps": 9627, "loss": 1.8159, "learning_rate": 5.507386325075625e-05, "epoch": 0.46764308715072195, "percentage": 46.76, "elapsed_time": "1 day, 9:51:03", "remaining_time": "1 day, 14:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4503, "total_steps": 9627, "loss": 1.8045, "learning_rate": 5.505763063795091e-05, "epoch": 0.4677469616703023, "percentage": 46.77, "elapsed_time": "1 day, 9:51:30", "remaining_time": "1 day, 14:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4504, "total_steps": 9627, "loss": 1.7684, "learning_rate": 5.504139748654735e-05, "epoch": 0.4678508361898826, "percentage": 46.79, "elapsed_time": "1 day, 9:51:59", "remaining_time": "1 day, 14:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4505, "total_steps": 9627, "loss": 1.7299, "learning_rate": 5.5025163798274283e-05, "epoch": 0.467954710709463, "percentage": 46.8, "elapsed_time": "1 day, 9:52:26", "remaining_time": "1 day, 14:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4506, "total_steps": 9627, "loss": 1.8735, "learning_rate": 5.500892957486048e-05, "epoch": 0.4680585852290433, "percentage": 46.81, "elapsed_time": "1 day, 9:52:54", "remaining_time": "1 day, 14:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4507, "total_steps": 9627, "loss": 1.6187, "learning_rate": 5.499269481803474e-05, "epoch": 0.46816245974862364, "percentage": 46.82, "elapsed_time": "1 day, 9:53:21", "remaining_time": "1 day, 14:29:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4508, "total_steps": 9627, "loss": 1.8866, "learning_rate": 5.497645952952596e-05, "epoch": 0.468266334268204, "percentage": 46.83, "elapsed_time": "1 day, 9:53:50", "remaining_time": "1 day, 14:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4509, "total_steps": 9627, "loss": 1.6358, "learning_rate": 5.496022371106304e-05, "epoch": 0.46837020878778435, "percentage": 46.84, "elapsed_time": "1 day, 9:54:18", "remaining_time": "1 day, 14:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4510, "total_steps": 9627, "loss": 1.6527, "learning_rate": 5.4943987364374985e-05, "epoch": 0.46847408330736473, "percentage": 46.85, "elapsed_time": "1 day, 9:54:46", "remaining_time": "1 day, 14:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4511, "total_steps": 9627, "loss": 1.571, "learning_rate": 5.492775049119085e-05, "epoch": 0.46857795782694506, "percentage": 46.86, "elapsed_time": "1 day, 9:55:13", "remaining_time": "1 day, 14:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4512, "total_steps": 9627, "loss": 1.8012, "learning_rate": 5.491151309323973e-05, "epoch": 0.4686818323465254, "percentage": 46.87, "elapsed_time": "1 day, 9:55:42", "remaining_time": "1 day, 14:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4513, "total_steps": 9627, "loss": 1.7915, "learning_rate": 5.489527517225076e-05, "epoch": 0.46878570686610577, "percentage": 46.88, "elapsed_time": "1 day, 9:56:10", "remaining_time": "1 day, 14:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4514, "total_steps": 9627, "loss": 1.6541, "learning_rate": 5.487903672995318e-05, "epoch": 0.4688895813856861, "percentage": 46.89, "elapsed_time": "1 day, 9:56:39", "remaining_time": "1 day, 14:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4515, "total_steps": 9627, "loss": 1.7457, "learning_rate": 5.486279776807626e-05, "epoch": 0.4689934559052664, "percentage": 46.9, "elapsed_time": "1 day, 9:57:06", "remaining_time": "1 day, 14:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4516, "total_steps": 9627, "loss": 1.5523, "learning_rate": 5.484655828834929e-05, "epoch": 0.4690973304248468, "percentage": 46.91, "elapsed_time": "1 day, 9:57:34", "remaining_time": "1 day, 14:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4517, "total_steps": 9627, "loss": 1.7419, "learning_rate": 5.483031829250167e-05, "epoch": 0.46920120494442713, "percentage": 46.92, "elapsed_time": "1 day, 9:58:03", "remaining_time": "1 day, 14:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4518, "total_steps": 9627, "loss": 1.7789, "learning_rate": 5.481407778226284e-05, "epoch": 0.46930507946400746, "percentage": 46.93, "elapsed_time": "1 day, 9:58:30", "remaining_time": "1 day, 14:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4519, "total_steps": 9627, "loss": 1.6478, "learning_rate": 5.4797836759362256e-05, "epoch": 0.46940895398358784, "percentage": 46.94, "elapsed_time": "1 day, 9:58:59", "remaining_time": "1 day, 14:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4520, "total_steps": 9627, "loss": 1.5748, "learning_rate": 5.478159522552949e-05, "epoch": 0.46951282850316817, "percentage": 46.95, "elapsed_time": "1 day, 9:59:27", "remaining_time": "1 day, 14:24:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4521, "total_steps": 9627, "loss": 1.7942, "learning_rate": 5.476535318249414e-05, "epoch": 0.4696167030227485, "percentage": 46.96, "elapsed_time": "1 day, 9:59:54", "remaining_time": "1 day, 14:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4522, "total_steps": 9627, "loss": 1.6272, "learning_rate": 5.4749110631985846e-05, "epoch": 0.4697205775423289, "percentage": 46.97, "elapsed_time": "1 day, 10:00:24", "remaining_time": "1 day, 14:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4523, "total_steps": 9627, "loss": 1.7511, "learning_rate": 5.4732867575734314e-05, "epoch": 0.4698244520619092, "percentage": 46.98, "elapsed_time": "1 day, 10:00:51", "remaining_time": "1 day, 14:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4524, "total_steps": 9627, "loss": 1.7224, "learning_rate": 5.4716624015469284e-05, "epoch": 0.4699283265814896, "percentage": 46.99, "elapsed_time": "1 day, 10:01:20", "remaining_time": "1 day, 14:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4525, "total_steps": 9627, "loss": 1.6125, "learning_rate": 5.470037995292061e-05, "epoch": 0.4700322011010699, "percentage": 47.0, "elapsed_time": "1 day, 10:01:47", "remaining_time": "1 day, 14:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4526, "total_steps": 9627, "loss": 1.6888, "learning_rate": 5.468413538981814e-05, "epoch": 0.47013607562065024, "percentage": 47.01, "elapsed_time": "1 day, 10:02:16", "remaining_time": "1 day, 14:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4527, "total_steps": 9627, "loss": 1.7642, "learning_rate": 5.466789032789176e-05, "epoch": 0.4702399501402306, "percentage": 47.02, "elapsed_time": "1 day, 10:02:43", "remaining_time": "1 day, 14:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4528, "total_steps": 9627, "loss": 1.6372, "learning_rate": 5.465164476887149e-05, "epoch": 0.47034382465981095, "percentage": 47.03, "elapsed_time": "1 day, 10:03:12", "remaining_time": "1 day, 14:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4529, "total_steps": 9627, "loss": 1.7026, "learning_rate": 5.463539871448735e-05, "epoch": 0.4704476991793913, "percentage": 47.04, "elapsed_time": "1 day, 10:03:39", "remaining_time": "1 day, 14:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4530, "total_steps": 9627, "loss": 1.513, "learning_rate": 5.461915216646938e-05, "epoch": 0.47055157369897166, "percentage": 47.06, "elapsed_time": "1 day, 10:04:08", "remaining_time": "1 day, 14:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4531, "total_steps": 9627, "loss": 1.6832, "learning_rate": 5.4602905126547744e-05, "epoch": 0.470655448218552, "percentage": 47.07, "elapsed_time": "1 day, 10:04:37", "remaining_time": "1 day, 14:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4532, "total_steps": 9627, "loss": 1.5767, "learning_rate": 5.4586657596452615e-05, "epoch": 0.4707593227381323, "percentage": 47.08, "elapsed_time": "1 day, 10:05:04", "remaining_time": "1 day, 14:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4533, "total_steps": 9627, "loss": 1.6025, "learning_rate": 5.4570409577914215e-05, "epoch": 0.4708631972577127, "percentage": 47.09, "elapsed_time": "1 day, 10:05:34", "remaining_time": "1 day, 14:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4534, "total_steps": 9627, "loss": 1.6899, "learning_rate": 5.455416107266287e-05, "epoch": 0.470967071777293, "percentage": 47.1, "elapsed_time": "1 day, 10:06:01", "remaining_time": "1 day, 14:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4535, "total_steps": 9627, "loss": 1.7355, "learning_rate": 5.453791208242889e-05, "epoch": 0.47107094629687335, "percentage": 47.11, "elapsed_time": "1 day, 10:06:30", "remaining_time": "1 day, 14:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4536, "total_steps": 9627, "loss": 1.9148, "learning_rate": 5.452166260894267e-05, "epoch": 0.47117482081645373, "percentage": 47.12, "elapsed_time": "1 day, 10:06:58", "remaining_time": "1 day, 14:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4537, "total_steps": 9627, "loss": 1.7175, "learning_rate": 5.450541265393464e-05, "epoch": 0.47127869533603406, "percentage": 47.13, "elapsed_time": "1 day, 10:07:26", "remaining_time": "1 day, 14:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4538, "total_steps": 9627, "loss": 1.8146, "learning_rate": 5.4489162219135314e-05, "epoch": 0.47138256985561444, "percentage": 47.14, "elapsed_time": "1 day, 10:07:54", "remaining_time": "1 day, 14:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4539, "total_steps": 9627, "loss": 1.8353, "learning_rate": 5.447291130627522e-05, "epoch": 0.47148644437519477, "percentage": 47.15, "elapsed_time": "1 day, 10:08:23", "remaining_time": "1 day, 14:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4540, "total_steps": 9627, "loss": 1.672, "learning_rate": 5.4456659917084975e-05, "epoch": 0.4715903188947751, "percentage": 47.16, "elapsed_time": "1 day, 10:08:51", "remaining_time": "1 day, 14:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4541, "total_steps": 9627, "loss": 1.7119, "learning_rate": 5.44404080532952e-05, "epoch": 0.4716941934143555, "percentage": 47.17, "elapsed_time": "1 day, 10:09:20", "remaining_time": "1 day, 14:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4542, "total_steps": 9627, "loss": 1.9569, "learning_rate": 5.442415571663661e-05, "epoch": 0.4717980679339358, "percentage": 47.18, "elapsed_time": "1 day, 10:09:47", "remaining_time": "1 day, 14:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4543, "total_steps": 9627, "loss": 1.5407, "learning_rate": 5.440790290883997e-05, "epoch": 0.47190194245351613, "percentage": 47.19, "elapsed_time": "1 day, 10:10:15", "remaining_time": "1 day, 14:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4544, "total_steps": 9627, "loss": 1.7799, "learning_rate": 5.439164963163601e-05, "epoch": 0.4720058169730965, "percentage": 47.2, "elapsed_time": "1 day, 10:10:43", "remaining_time": "1 day, 14:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4545, "total_steps": 9627, "loss": 1.6902, "learning_rate": 5.437539588675564e-05, "epoch": 0.47210969149267684, "percentage": 47.21, "elapsed_time": "1 day, 10:11:13", "remaining_time": "1 day, 14:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4546, "total_steps": 9627, "loss": 1.7341, "learning_rate": 5.435914167592975e-05, "epoch": 0.47221356601225717, "percentage": 47.22, "elapsed_time": "1 day, 10:11:40", "remaining_time": "1 day, 14:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4547, "total_steps": 9627, "loss": 1.7448, "learning_rate": 5.434288700088925e-05, "epoch": 0.47231744053183755, "percentage": 47.23, "elapsed_time": "1 day, 10:12:09", "remaining_time": "1 day, 14:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4548, "total_steps": 9627, "loss": 1.6007, "learning_rate": 5.432663186336517e-05, "epoch": 0.4724213150514179, "percentage": 47.24, "elapsed_time": "1 day, 10:12:37", "remaining_time": "1 day, 14:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4549, "total_steps": 9627, "loss": 1.6348, "learning_rate": 5.431037626508856e-05, "epoch": 0.47252518957099826, "percentage": 47.25, "elapsed_time": "1 day, 10:13:06", "remaining_time": "1 day, 14:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4550, "total_steps": 9627, "loss": 1.6318, "learning_rate": 5.429412020779049e-05, "epoch": 0.4726290640905786, "percentage": 47.26, "elapsed_time": "1 day, 10:13:33", "remaining_time": "1 day, 14:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4551, "total_steps": 9627, "loss": 1.7079, "learning_rate": 5.427786369320211e-05, "epoch": 0.4727329386101589, "percentage": 47.27, "elapsed_time": "1 day, 10:14:02", "remaining_time": "1 day, 14:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4552, "total_steps": 9627, "loss": 1.5058, "learning_rate": 5.4261606723054604e-05, "epoch": 0.4728368131297393, "percentage": 47.28, "elapsed_time": "1 day, 10:14:31", "remaining_time": "1 day, 14:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4553, "total_steps": 9627, "loss": 1.7662, "learning_rate": 5.424534929907924e-05, "epoch": 0.4729406876493196, "percentage": 47.29, "elapsed_time": "1 day, 10:14:58", "remaining_time": "1 day, 14:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4554, "total_steps": 9627, "loss": 1.6387, "learning_rate": 5.422909142300729e-05, "epoch": 0.47304456216889995, "percentage": 47.3, "elapsed_time": "1 day, 10:15:26", "remaining_time": "1 day, 14:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4555, "total_steps": 9627, "loss": 1.9062, "learning_rate": 5.4212833096570085e-05, "epoch": 0.47314843668848033, "percentage": 47.31, "elapsed_time": "1 day, 10:15:56", "remaining_time": "1 day, 14:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4556, "total_steps": 9627, "loss": 1.779, "learning_rate": 5.419657432149903e-05, "epoch": 0.47325231120806066, "percentage": 47.33, "elapsed_time": "1 day, 10:16:23", "remaining_time": "1 day, 14:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4557, "total_steps": 9627, "loss": 1.7205, "learning_rate": 5.418031509952554e-05, "epoch": 0.473356185727641, "percentage": 47.34, "elapsed_time": "1 day, 10:16:52", "remaining_time": "1 day, 14:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4558, "total_steps": 9627, "loss": 1.8187, "learning_rate": 5.4164055432381076e-05, "epoch": 0.47346006024722137, "percentage": 47.35, "elapsed_time": "1 day, 10:17:19", "remaining_time": "1 day, 14:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4559, "total_steps": 9627, "loss": 1.7266, "learning_rate": 5.414779532179721e-05, "epoch": 0.4735639347668017, "percentage": 47.36, "elapsed_time": "1 day, 10:17:48", "remaining_time": "1 day, 14:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4560, "total_steps": 9627, "loss": 1.6847, "learning_rate": 5.41315347695055e-05, "epoch": 0.473667809286382, "percentage": 47.37, "elapsed_time": "1 day, 10:18:16", "remaining_time": "1 day, 14:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4561, "total_steps": 9627, "loss": 1.5548, "learning_rate": 5.4115273777237554e-05, "epoch": 0.4737716838059624, "percentage": 47.38, "elapsed_time": "1 day, 10:18:44", "remaining_time": "1 day, 14:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4562, "total_steps": 9627, "loss": 1.6328, "learning_rate": 5.4099012346725054e-05, "epoch": 0.47387555832554273, "percentage": 47.39, "elapsed_time": "1 day, 10:19:13", "remaining_time": "1 day, 14:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4563, "total_steps": 9627, "loss": 1.7856, "learning_rate": 5.4082750479699715e-05, "epoch": 0.4739794328451231, "percentage": 47.4, "elapsed_time": "1 day, 10:19:41", "remaining_time": "1 day, 14:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4564, "total_steps": 9627, "loss": 1.6751, "learning_rate": 5.406648817789329e-05, "epoch": 0.47408330736470344, "percentage": 47.41, "elapsed_time": "1 day, 10:20:09", "remaining_time": "1 day, 14:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4565, "total_steps": 9627, "loss": 1.793, "learning_rate": 5.40502254430376e-05, "epoch": 0.47418718188428377, "percentage": 47.42, "elapsed_time": "1 day, 10:20:38", "remaining_time": "1 day, 14:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4566, "total_steps": 9627, "loss": 1.5738, "learning_rate": 5.403396227686449e-05, "epoch": 0.47429105640386415, "percentage": 47.43, "elapsed_time": "1 day, 10:21:05", "remaining_time": "1 day, 14:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4567, "total_steps": 9627, "loss": 1.7443, "learning_rate": 5.4017698681105865e-05, "epoch": 0.4743949309234445, "percentage": 47.44, "elapsed_time": "1 day, 10:21:34", "remaining_time": "1 day, 14:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4568, "total_steps": 9627, "loss": 1.6522, "learning_rate": 5.400143465749368e-05, "epoch": 0.4744988054430248, "percentage": 47.45, "elapsed_time": "1 day, 10:22:02", "remaining_time": "1 day, 14:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4569, "total_steps": 9627, "loss": 1.7336, "learning_rate": 5.398517020775989e-05, "epoch": 0.4746026799626052, "percentage": 47.46, "elapsed_time": "1 day, 10:22:31", "remaining_time": "1 day, 14:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4570, "total_steps": 9627, "loss": 1.7395, "learning_rate": 5.39689053336366e-05, "epoch": 0.4747065544821855, "percentage": 47.47, "elapsed_time": "1 day, 10:22:59", "remaining_time": "1 day, 14:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4571, "total_steps": 9627, "loss": 1.5726, "learning_rate": 5.3952640036855825e-05, "epoch": 0.47481042900176584, "percentage": 47.48, "elapsed_time": "1 day, 10:23:28", "remaining_time": "1 day, 14:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4572, "total_steps": 9627, "loss": 2.0233, "learning_rate": 5.3936374319149705e-05, "epoch": 0.4749143035213462, "percentage": 47.49, "elapsed_time": "1 day, 10:23:57", "remaining_time": "1 day, 14:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4573, "total_steps": 9627, "loss": 1.539, "learning_rate": 5.392010818225044e-05, "epoch": 0.47501817804092655, "percentage": 47.5, "elapsed_time": "1 day, 10:24:25", "remaining_time": "1 day, 14:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4574, "total_steps": 9627, "loss": 1.767, "learning_rate": 5.390384162789024e-05, "epoch": 0.4751220525605069, "percentage": 47.51, "elapsed_time": "1 day, 10:24:52", "remaining_time": "1 day, 14:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4575, "total_steps": 9627, "loss": 1.7017, "learning_rate": 5.3887574657801346e-05, "epoch": 0.47522592708008726, "percentage": 47.52, "elapsed_time": "1 day, 10:25:20", "remaining_time": "1 day, 14:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4576, "total_steps": 9627, "loss": 1.6445, "learning_rate": 5.3871307273716074e-05, "epoch": 0.4753298015996676, "percentage": 47.53, "elapsed_time": "1 day, 10:25:50", "remaining_time": "1 day, 14:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4577, "total_steps": 9627, "loss": 1.7336, "learning_rate": 5.3855039477366775e-05, "epoch": 0.47543367611924797, "percentage": 47.54, "elapsed_time": "1 day, 10:26:17", "remaining_time": "1 day, 13:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4578, "total_steps": 9627, "loss": 1.6598, "learning_rate": 5.3838771270485854e-05, "epoch": 0.4755375506388283, "percentage": 47.55, "elapsed_time": "1 day, 10:26:46", "remaining_time": "1 day, 13:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4579, "total_steps": 9627, "loss": 1.5692, "learning_rate": 5.3822502654805725e-05, "epoch": 0.4756414251584086, "percentage": 47.56, "elapsed_time": "1 day, 10:27:14", "remaining_time": "1 day, 13:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4580, "total_steps": 9627, "loss": 1.687, "learning_rate": 5.3806233632058876e-05, "epoch": 0.475745299677989, "percentage": 47.57, "elapsed_time": "1 day, 10:27:42", "remaining_time": "1 day, 13:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4581, "total_steps": 9627, "loss": 1.6507, "learning_rate": 5.378996420397784e-05, "epoch": 0.47584917419756934, "percentage": 47.58, "elapsed_time": "1 day, 10:28:10", "remaining_time": "1 day, 13:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4582, "total_steps": 9627, "loss": 1.782, "learning_rate": 5.377369437229518e-05, "epoch": 0.47595304871714966, "percentage": 47.6, "elapsed_time": "1 day, 10:28:40", "remaining_time": "1 day, 13:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4583, "total_steps": 9627, "loss": 1.7035, "learning_rate": 5.375742413874351e-05, "epoch": 0.47605692323673005, "percentage": 47.61, "elapsed_time": "1 day, 10:29:07", "remaining_time": "1 day, 13:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4584, "total_steps": 9627, "loss": 1.6678, "learning_rate": 5.3741153505055475e-05, "epoch": 0.47616079775631037, "percentage": 47.62, "elapsed_time": "1 day, 10:29:36", "remaining_time": "1 day, 13:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4585, "total_steps": 9627, "loss": 1.7662, "learning_rate": 5.372488247296378e-05, "epoch": 0.4762646722758907, "percentage": 47.63, "elapsed_time": "1 day, 10:30:04", "remaining_time": "1 day, 13:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4586, "total_steps": 9627, "loss": 1.7769, "learning_rate": 5.370861104420114e-05, "epoch": 0.4763685467954711, "percentage": 47.64, "elapsed_time": "1 day, 10:30:32", "remaining_time": "1 day, 13:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4587, "total_steps": 9627, "loss": 1.4977, "learning_rate": 5.369233922050036e-05, "epoch": 0.4764724213150514, "percentage": 47.65, "elapsed_time": "1 day, 10:31:01", "remaining_time": "1 day, 13:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4588, "total_steps": 9627, "loss": 1.7031, "learning_rate": 5.3676067003594255e-05, "epoch": 0.4765762958346318, "percentage": 47.66, "elapsed_time": "1 day, 10:31:29", "remaining_time": "1 day, 13:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4589, "total_steps": 9627, "loss": 1.6961, "learning_rate": 5.365979439521569e-05, "epoch": 0.4766801703542121, "percentage": 47.67, "elapsed_time": "1 day, 10:31:58", "remaining_time": "1 day, 13:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4590, "total_steps": 9627, "loss": 1.8117, "learning_rate": 5.364352139709758e-05, "epoch": 0.47678404487379245, "percentage": 47.68, "elapsed_time": "1 day, 10:32:25", "remaining_time": "1 day, 13:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4591, "total_steps": 9627, "loss": 1.6322, "learning_rate": 5.362724801097284e-05, "epoch": 0.47688791939337283, "percentage": 47.69, "elapsed_time": "1 day, 10:32:54", "remaining_time": "1 day, 13:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4592, "total_steps": 9627, "loss": 1.7273, "learning_rate": 5.3610974238574495e-05, "epoch": 0.47699179391295315, "percentage": 47.7, "elapsed_time": "1 day, 10:33:23", "remaining_time": "1 day, 13:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4593, "total_steps": 9627, "loss": 1.824, "learning_rate": 5.359470008163556e-05, "epoch": 0.4770956684325335, "percentage": 47.71, "elapsed_time": "1 day, 10:33:52", "remaining_time": "1 day, 13:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4594, "total_steps": 9627, "loss": 1.5924, "learning_rate": 5.35784255418891e-05, "epoch": 0.47719954295211386, "percentage": 47.72, "elapsed_time": "1 day, 10:34:19", "remaining_time": "1 day, 13:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4595, "total_steps": 9627, "loss": 1.7402, "learning_rate": 5.356215062106823e-05, "epoch": 0.4773034174716942, "percentage": 47.73, "elapsed_time": "1 day, 10:34:48", "remaining_time": "1 day, 13:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4596, "total_steps": 9627, "loss": 1.861, "learning_rate": 5.354587532090611e-05, "epoch": 0.4774072919912745, "percentage": 47.74, "elapsed_time": "1 day, 10:35:16", "remaining_time": "1 day, 13:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4597, "total_steps": 9627, "loss": 1.8382, "learning_rate": 5.352959964313592e-05, "epoch": 0.4775111665108549, "percentage": 47.75, "elapsed_time": "1 day, 10:35:45", "remaining_time": "1 day, 13:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4598, "total_steps": 9627, "loss": 1.6581, "learning_rate": 5.3513323589490924e-05, "epoch": 0.47761504103043523, "percentage": 47.76, "elapsed_time": "1 day, 10:36:14", "remaining_time": "1 day, 13:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4599, "total_steps": 9627, "loss": 1.5309, "learning_rate": 5.349704716170435e-05, "epoch": 0.47771891555001555, "percentage": 47.77, "elapsed_time": "1 day, 10:36:42", "remaining_time": "1 day, 13:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4600, "total_steps": 9627, "loss": 1.7319, "learning_rate": 5.348077036150954e-05, "epoch": 0.47782279006959594, "percentage": 47.78, "elapsed_time": "1 day, 10:37:11", "remaining_time": "1 day, 13:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4601, "total_steps": 9627, "loss": 1.7603, "learning_rate": 5.346449319063983e-05, "epoch": 0.47792666458917626, "percentage": 47.79, "elapsed_time": "1 day, 10:37:38", "remaining_time": "1 day, 13:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4602, "total_steps": 9627, "loss": 1.5944, "learning_rate": 5.34482156508286e-05, "epoch": 0.47803053910875665, "percentage": 47.8, "elapsed_time": "1 day, 10:38:06", "remaining_time": "1 day, 13:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4603, "total_steps": 9627, "loss": 1.5459, "learning_rate": 5.343193774380933e-05, "epoch": 0.478134413628337, "percentage": 47.81, "elapsed_time": "1 day, 10:38:36", "remaining_time": "1 day, 13:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4604, "total_steps": 9627, "loss": 1.6581, "learning_rate": 5.341565947131546e-05, "epoch": 0.4782382881479173, "percentage": 47.82, "elapsed_time": "1 day, 10:39:03", "remaining_time": "1 day, 13:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4605, "total_steps": 9627, "loss": 1.6475, "learning_rate": 5.3399380835080493e-05, "epoch": 0.4783421626674977, "percentage": 47.83, "elapsed_time": "1 day, 10:39:33", "remaining_time": "1 day, 13:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4606, "total_steps": 9627, "loss": 1.7491, "learning_rate": 5.338310183683799e-05, "epoch": 0.478446037187078, "percentage": 47.84, "elapsed_time": "1 day, 10:40:00", "remaining_time": "1 day, 13:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4607, "total_steps": 9627, "loss": 1.7748, "learning_rate": 5.3366822478321524e-05, "epoch": 0.47854991170665834, "percentage": 47.85, "elapsed_time": "1 day, 10:40:29", "remaining_time": "1 day, 13:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4608, "total_steps": 9627, "loss": 1.6662, "learning_rate": 5.335054276126471e-05, "epoch": 0.4786537862262387, "percentage": 47.87, "elapsed_time": "1 day, 10:40:57", "remaining_time": "1 day, 13:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4609, "total_steps": 9627, "loss": 1.8815, "learning_rate": 5.333426268740125e-05, "epoch": 0.47875766074581905, "percentage": 47.88, "elapsed_time": "1 day, 10:41:25", "remaining_time": "1 day, 13:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4610, "total_steps": 9627, "loss": 1.5864, "learning_rate": 5.331798225846482e-05, "epoch": 0.4788615352653994, "percentage": 47.89, "elapsed_time": "1 day, 10:41:54", "remaining_time": "1 day, 13:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4611, "total_steps": 9627, "loss": 1.6708, "learning_rate": 5.330170147618914e-05, "epoch": 0.47896540978497976, "percentage": 47.9, "elapsed_time": "1 day, 10:42:23", "remaining_time": "1 day, 13:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4612, "total_steps": 9627, "loss": 1.8315, "learning_rate": 5.3285420342308035e-05, "epoch": 0.4790692843045601, "percentage": 47.91, "elapsed_time": "1 day, 10:42:52", "remaining_time": "1 day, 13:44:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4613, "total_steps": 9627, "loss": 1.6449, "learning_rate": 5.326913885855527e-05, "epoch": 0.47917315882414047, "percentage": 47.92, "elapsed_time": "1 day, 10:43:19", "remaining_time": "1 day, 13:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4614, "total_steps": 9627, "loss": 1.5407, "learning_rate": 5.325285702666473e-05, "epoch": 0.4792770333437208, "percentage": 47.93, "elapsed_time": "1 day, 10:43:48", "remaining_time": "1 day, 13:44:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4615, "total_steps": 9627, "loss": 1.6642, "learning_rate": 5.323657484837028e-05, "epoch": 0.4793809078633011, "percentage": 47.94, "elapsed_time": "1 day, 10:44:16", "remaining_time": "1 day, 13:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4616, "total_steps": 9627, "loss": 1.6084, "learning_rate": 5.3220292325405854e-05, "epoch": 0.4794847823828815, "percentage": 47.95, "elapsed_time": "1 day, 10:44:45", "remaining_time": "1 day, 13:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4617, "total_steps": 9627, "loss": 1.9207, "learning_rate": 5.320400945950542e-05, "epoch": 0.47958865690246183, "percentage": 47.96, "elapsed_time": "1 day, 10:45:14", "remaining_time": "1 day, 13:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4618, "total_steps": 9627, "loss": 1.6418, "learning_rate": 5.318772625240298e-05, "epoch": 0.47969253142204216, "percentage": 47.97, "elapsed_time": "1 day, 10:45:42", "remaining_time": "1 day, 13:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4619, "total_steps": 9627, "loss": 1.6963, "learning_rate": 5.3171442705832554e-05, "epoch": 0.47979640594162254, "percentage": 47.98, "elapsed_time": "1 day, 10:46:10", "remaining_time": "1 day, 13:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4620, "total_steps": 9627, "loss": 1.5201, "learning_rate": 5.315515882152822e-05, "epoch": 0.47990028046120287, "percentage": 47.99, "elapsed_time": "1 day, 10:46:39", "remaining_time": "1 day, 13:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4621, "total_steps": 9627, "loss": 1.5179, "learning_rate": 5.313887460122408e-05, "epoch": 0.4800041549807832, "percentage": 48.0, "elapsed_time": "1 day, 10:47:07", "remaining_time": "1 day, 13:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4622, "total_steps": 9627, "loss": 1.7967, "learning_rate": 5.312259004665426e-05, "epoch": 0.4801080295003636, "percentage": 48.01, "elapsed_time": "1 day, 10:47:36", "remaining_time": "1 day, 13:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4623, "total_steps": 9627, "loss": 1.4864, "learning_rate": 5.310630515955297e-05, "epoch": 0.4802119040199439, "percentage": 48.02, "elapsed_time": "1 day, 10:48:06", "remaining_time": "1 day, 13:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4624, "total_steps": 9627, "loss": 1.7526, "learning_rate": 5.309001994165442e-05, "epoch": 0.48031577853952423, "percentage": 48.03, "elapsed_time": "1 day, 10:48:33", "remaining_time": "1 day, 13:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4625, "total_steps": 9627, "loss": 1.5733, "learning_rate": 5.307373439469283e-05, "epoch": 0.4804196530591046, "percentage": 48.04, "elapsed_time": "1 day, 10:49:02", "remaining_time": "1 day, 13:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4626, "total_steps": 9627, "loss": 1.541, "learning_rate": 5.305744852040253e-05, "epoch": 0.48052352757868494, "percentage": 48.05, "elapsed_time": "1 day, 10:49:30", "remaining_time": "1 day, 13:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4627, "total_steps": 9627, "loss": 1.6238, "learning_rate": 5.304116232051779e-05, "epoch": 0.4806274020982653, "percentage": 48.06, "elapsed_time": "1 day, 10:50:00", "remaining_time": "1 day, 13:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4628, "total_steps": 9627, "loss": 1.9604, "learning_rate": 5.3024875796773e-05, "epoch": 0.48073127661784565, "percentage": 48.07, "elapsed_time": "1 day, 10:50:28", "remaining_time": "1 day, 13:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4629, "total_steps": 9627, "loss": 1.4643, "learning_rate": 5.3008588950902524e-05, "epoch": 0.480835151137426, "percentage": 48.08, "elapsed_time": "1 day, 10:50:56", "remaining_time": "1 day, 13:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4630, "total_steps": 9627, "loss": 1.6453, "learning_rate": 5.2992301784640785e-05, "epoch": 0.48093902565700636, "percentage": 48.09, "elapsed_time": "1 day, 10:51:25", "remaining_time": "1 day, 13:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4631, "total_steps": 9627, "loss": 1.6807, "learning_rate": 5.2976014299722263e-05, "epoch": 0.4810429001765867, "percentage": 48.1, "elapsed_time": "1 day, 10:51:53", "remaining_time": "1 day, 13:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4632, "total_steps": 9627, "loss": 1.7978, "learning_rate": 5.2959726497881425e-05, "epoch": 0.481146774696167, "percentage": 48.11, "elapsed_time": "1 day, 10:52:22", "remaining_time": "1 day, 13:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4633, "total_steps": 9627, "loss": 1.7011, "learning_rate": 5.29434383808528e-05, "epoch": 0.4812506492157474, "percentage": 48.13, "elapsed_time": "1 day, 10:52:50", "remaining_time": "1 day, 13:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4634, "total_steps": 9627, "loss": 1.6109, "learning_rate": 5.292714995037096e-05, "epoch": 0.4813545237353277, "percentage": 48.14, "elapsed_time": "1 day, 10:53:19", "remaining_time": "1 day, 13:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4635, "total_steps": 9627, "loss": 1.6175, "learning_rate": 5.291086120817047e-05, "epoch": 0.48145839825490805, "percentage": 48.15, "elapsed_time": "1 day, 10:53:48", "remaining_time": "1 day, 13:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4636, "total_steps": 9627, "loss": 1.5225, "learning_rate": 5.289457215598595e-05, "epoch": 0.48156227277448843, "percentage": 48.16, "elapsed_time": "1 day, 10:54:16", "remaining_time": "1 day, 13:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4637, "total_steps": 9627, "loss": 1.7701, "learning_rate": 5.28782827955521e-05, "epoch": 0.48166614729406876, "percentage": 48.17, "elapsed_time": "1 day, 10:54:45", "remaining_time": "1 day, 13:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4638, "total_steps": 9627, "loss": 1.6871, "learning_rate": 5.286199312860358e-05, "epoch": 0.4817700218136491, "percentage": 48.18, "elapsed_time": "1 day, 10:55:13", "remaining_time": "1 day, 13:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4639, "total_steps": 9627, "loss": 1.7912, "learning_rate": 5.2845703156875106e-05, "epoch": 0.48187389633322947, "percentage": 48.19, "elapsed_time": "1 day, 10:55:42", "remaining_time": "1 day, 13:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4640, "total_steps": 9627, "loss": 1.6757, "learning_rate": 5.282941288210146e-05, "epoch": 0.4819777708528098, "percentage": 48.2, "elapsed_time": "1 day, 10:56:10", "remaining_time": "1 day, 13:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4641, "total_steps": 9627, "loss": 1.8312, "learning_rate": 5.2813122306017396e-05, "epoch": 0.4820816453723902, "percentage": 48.21, "elapsed_time": "1 day, 10:56:38", "remaining_time": "1 day, 13:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4642, "total_steps": 9627, "loss": 1.6572, "learning_rate": 5.279683143035775e-05, "epoch": 0.4821855198919705, "percentage": 48.22, "elapsed_time": "1 day, 10:57:07", "remaining_time": "1 day, 13:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4643, "total_steps": 9627, "loss": 1.6622, "learning_rate": 5.278054025685739e-05, "epoch": 0.48228939441155083, "percentage": 48.23, "elapsed_time": "1 day, 10:57:35", "remaining_time": "1 day, 13:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4644, "total_steps": 9627, "loss": 1.578, "learning_rate": 5.276424878725116e-05, "epoch": 0.4823932689311312, "percentage": 48.24, "elapsed_time": "1 day, 10:58:04", "remaining_time": "1 day, 13:31:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4645, "total_steps": 9627, "loss": 1.6593, "learning_rate": 5.2747957023274005e-05, "epoch": 0.48249714345071154, "percentage": 48.25, "elapsed_time": "1 day, 10:58:31", "remaining_time": "1 day, 13:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4646, "total_steps": 9627, "loss": 1.6828, "learning_rate": 5.2731664966660864e-05, "epoch": 0.48260101797029187, "percentage": 48.26, "elapsed_time": "1 day, 10:59:01", "remaining_time": "1 day, 13:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4647, "total_steps": 9627, "loss": 1.8237, "learning_rate": 5.271537261914672e-05, "epoch": 0.48270489248987225, "percentage": 48.27, "elapsed_time": "1 day, 10:59:29", "remaining_time": "1 day, 13:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4648, "total_steps": 9627, "loss": 1.6222, "learning_rate": 5.269907998246656e-05, "epoch": 0.4828087670094526, "percentage": 48.28, "elapsed_time": "1 day, 10:59:59", "remaining_time": "1 day, 13:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4649, "total_steps": 9627, "loss": 1.6672, "learning_rate": 5.268278705835544e-05, "epoch": 0.4829126415290329, "percentage": 48.29, "elapsed_time": "1 day, 11:00:26", "remaining_time": "1 day, 13:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4650, "total_steps": 9627, "loss": 1.7731, "learning_rate": 5.266649384854841e-05, "epoch": 0.4830165160486133, "percentage": 48.3, "elapsed_time": "1 day, 11:00:55", "remaining_time": "1 day, 13:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4651, "total_steps": 9627, "loss": 1.7711, "learning_rate": 5.265020035478061e-05, "epoch": 0.4831203905681936, "percentage": 48.31, "elapsed_time": "1 day, 11:01:23", "remaining_time": "1 day, 13:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4652, "total_steps": 9627, "loss": 1.4701, "learning_rate": 5.263390657878712e-05, "epoch": 0.483224265087774, "percentage": 48.32, "elapsed_time": "1 day, 11:01:51", "remaining_time": "1 day, 13:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4653, "total_steps": 9627, "loss": 1.6486, "learning_rate": 5.2617612522303136e-05, "epoch": 0.4833281396073543, "percentage": 48.33, "elapsed_time": "1 day, 11:02:20", "remaining_time": "1 day, 13:27:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4654, "total_steps": 9627, "loss": 1.6641, "learning_rate": 5.2601318187063855e-05, "epoch": 0.48343201412693465, "percentage": 48.34, "elapsed_time": "1 day, 11:02:49", "remaining_time": "1 day, 13:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4655, "total_steps": 9627, "loss": 1.5608, "learning_rate": 5.258502357480445e-05, "epoch": 0.48353588864651503, "percentage": 48.35, "elapsed_time": "1 day, 11:03:16", "remaining_time": "1 day, 13:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4656, "total_steps": 9627, "loss": 1.6617, "learning_rate": 5.256872868726021e-05, "epoch": 0.48363976316609536, "percentage": 48.36, "elapsed_time": "1 day, 11:03:46", "remaining_time": "1 day, 13:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4657, "total_steps": 9627, "loss": 1.8598, "learning_rate": 5.255243352616641e-05, "epoch": 0.4837436376856757, "percentage": 48.37, "elapsed_time": "1 day, 11:04:14", "remaining_time": "1 day, 13:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4658, "total_steps": 9627, "loss": 1.8134, "learning_rate": 5.253613809325834e-05, "epoch": 0.48384751220525607, "percentage": 48.38, "elapsed_time": "1 day, 11:04:42", "remaining_time": "1 day, 13:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4659, "total_steps": 9627, "loss": 1.5018, "learning_rate": 5.251984239027133e-05, "epoch": 0.4839513867248364, "percentage": 48.4, "elapsed_time": "1 day, 11:05:10", "remaining_time": "1 day, 13:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4660, "total_steps": 9627, "loss": 1.7079, "learning_rate": 5.2503546418940784e-05, "epoch": 0.4840552612444167, "percentage": 48.41, "elapsed_time": "1 day, 11:05:39", "remaining_time": "1 day, 13:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4661, "total_steps": 9627, "loss": 1.7178, "learning_rate": 5.248725018100207e-05, "epoch": 0.4841591357639971, "percentage": 48.42, "elapsed_time": "1 day, 11:06:06", "remaining_time": "1 day, 13:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4662, "total_steps": 9627, "loss": 1.455, "learning_rate": 5.2470953678190615e-05, "epoch": 0.48426301028357743, "percentage": 48.43, "elapsed_time": "1 day, 11:06:37", "remaining_time": "1 day, 13:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4663, "total_steps": 9627, "loss": 1.8562, "learning_rate": 5.2454656912241864e-05, "epoch": 0.48436688480315776, "percentage": 48.44, "elapsed_time": "1 day, 11:07:05", "remaining_time": "1 day, 13:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4664, "total_steps": 9627, "loss": 1.5738, "learning_rate": 5.2438359884891285e-05, "epoch": 0.48447075932273814, "percentage": 48.45, "elapsed_time": "1 day, 11:07:33", "remaining_time": "1 day, 13:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4665, "total_steps": 9627, "loss": 1.69, "learning_rate": 5.242206259787441e-05, "epoch": 0.48457463384231847, "percentage": 48.46, "elapsed_time": "1 day, 11:08:00", "remaining_time": "1 day, 13:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4666, "total_steps": 9627, "loss": 1.7648, "learning_rate": 5.2405765052926755e-05, "epoch": 0.48467850836189885, "percentage": 48.47, "elapsed_time": "1 day, 11:08:30", "remaining_time": "1 day, 13:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4667, "total_steps": 9627, "loss": 1.6886, "learning_rate": 5.23894672517839e-05, "epoch": 0.4847823828814792, "percentage": 48.48, "elapsed_time": "1 day, 11:08:57", "remaining_time": "1 day, 13:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4668, "total_steps": 9627, "loss": 1.6023, "learning_rate": 5.237316919618143e-05, "epoch": 0.4848862574010595, "percentage": 48.49, "elapsed_time": "1 day, 11:09:27", "remaining_time": "1 day, 13:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4669, "total_steps": 9627, "loss": 1.7436, "learning_rate": 5.2356870887854926e-05, "epoch": 0.4849901319206399, "percentage": 48.5, "elapsed_time": "1 day, 11:09:55", "remaining_time": "1 day, 13:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4670, "total_steps": 9627, "loss": 1.7422, "learning_rate": 5.234057232854006e-05, "epoch": 0.4850940064402202, "percentage": 48.51, "elapsed_time": "1 day, 11:10:23", "remaining_time": "1 day, 13:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4671, "total_steps": 9627, "loss": 1.6793, "learning_rate": 5.232427351997251e-05, "epoch": 0.48519788095980054, "percentage": 48.52, "elapsed_time": "1 day, 11:10:52", "remaining_time": "1 day, 13:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4672, "total_steps": 9627, "loss": 1.6998, "learning_rate": 5.2307974463887944e-05, "epoch": 0.4853017554793809, "percentage": 48.53, "elapsed_time": "1 day, 11:11:20", "remaining_time": "1 day, 13:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4673, "total_steps": 9627, "loss": 1.7607, "learning_rate": 5.229167516202211e-05, "epoch": 0.48540562999896125, "percentage": 48.54, "elapsed_time": "1 day, 11:11:48", "remaining_time": "1 day, 13:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4674, "total_steps": 9627, "loss": 1.707, "learning_rate": 5.2275375616110755e-05, "epoch": 0.4855095045185416, "percentage": 48.55, "elapsed_time": "1 day, 11:12:16", "remaining_time": "1 day, 13:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4675, "total_steps": 9627, "loss": 1.765, "learning_rate": 5.2259075827889644e-05, "epoch": 0.48561337903812196, "percentage": 48.56, "elapsed_time": "1 day, 11:12:46", "remaining_time": "1 day, 13:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4676, "total_steps": 9627, "loss": 1.6677, "learning_rate": 5.224277579909458e-05, "epoch": 0.4857172535577023, "percentage": 48.57, "elapsed_time": "1 day, 11:13:14", "remaining_time": "1 day, 13:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4677, "total_steps": 9627, "loss": 1.5869, "learning_rate": 5.222647553146138e-05, "epoch": 0.4858211280772826, "percentage": 48.58, "elapsed_time": "1 day, 11:13:42", "remaining_time": "1 day, 13:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4678, "total_steps": 9627, "loss": 1.6596, "learning_rate": 5.221017502672589e-05, "epoch": 0.485925002596863, "percentage": 48.59, "elapsed_time": "1 day, 11:14:11", "remaining_time": "1 day, 13:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4679, "total_steps": 9627, "loss": 1.75, "learning_rate": 5.219387428662402e-05, "epoch": 0.4860288771164433, "percentage": 48.6, "elapsed_time": "1 day, 11:14:40", "remaining_time": "1 day, 13:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4680, "total_steps": 9627, "loss": 1.5169, "learning_rate": 5.2177573312891646e-05, "epoch": 0.4861327516360237, "percentage": 48.61, "elapsed_time": "1 day, 11:15:08", "remaining_time": "1 day, 13:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4681, "total_steps": 9627, "loss": 1.8167, "learning_rate": 5.21612721072647e-05, "epoch": 0.48623662615560403, "percentage": 48.62, "elapsed_time": "1 day, 11:15:36", "remaining_time": "1 day, 13:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4682, "total_steps": 9627, "loss": 1.6114, "learning_rate": 5.214497067147914e-05, "epoch": 0.48634050067518436, "percentage": 48.63, "elapsed_time": "1 day, 11:16:05", "remaining_time": "1 day, 13:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4683, "total_steps": 9627, "loss": 1.6924, "learning_rate": 5.212866900727093e-05, "epoch": 0.48644437519476474, "percentage": 48.64, "elapsed_time": "1 day, 11:16:33", "remaining_time": "1 day, 13:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4684, "total_steps": 9627, "loss": 1.6505, "learning_rate": 5.211236711637607e-05, "epoch": 0.48654824971434507, "percentage": 48.65, "elapsed_time": "1 day, 11:17:03", "remaining_time": "1 day, 13:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4685, "total_steps": 9627, "loss": 1.9258, "learning_rate": 5.209606500053059e-05, "epoch": 0.4866521242339254, "percentage": 48.67, "elapsed_time": "1 day, 11:17:30", "remaining_time": "1 day, 13:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4686, "total_steps": 9627, "loss": 1.7348, "learning_rate": 5.207976266147053e-05, "epoch": 0.4867559987535058, "percentage": 48.68, "elapsed_time": "1 day, 11:17:59", "remaining_time": "1 day, 13:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4687, "total_steps": 9627, "loss": 1.6395, "learning_rate": 5.206346010093198e-05, "epoch": 0.4868598732730861, "percentage": 48.69, "elapsed_time": "1 day, 11:18:27", "remaining_time": "1 day, 13:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4688, "total_steps": 9627, "loss": 1.846, "learning_rate": 5.204715732065103e-05, "epoch": 0.48696374779266643, "percentage": 48.7, "elapsed_time": "1 day, 11:18:56", "remaining_time": "1 day, 13:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4689, "total_steps": 9627, "loss": 1.4251, "learning_rate": 5.203085432236379e-05, "epoch": 0.4870676223122468, "percentage": 48.71, "elapsed_time": "1 day, 11:19:25", "remaining_time": "1 day, 13:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4690, "total_steps": 9627, "loss": 1.6869, "learning_rate": 5.201455110780641e-05, "epoch": 0.48717149683182714, "percentage": 48.72, "elapsed_time": "1 day, 11:19:54", "remaining_time": "1 day, 13:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4691, "total_steps": 9627, "loss": 1.8586, "learning_rate": 5.199824767871503e-05, "epoch": 0.4872753713514075, "percentage": 48.73, "elapsed_time": "1 day, 11:20:22", "remaining_time": "1 day, 13:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4692, "total_steps": 9627, "loss": 1.6928, "learning_rate": 5.198194403682588e-05, "epoch": 0.48737924587098785, "percentage": 48.74, "elapsed_time": "1 day, 11:20:51", "remaining_time": "1 day, 13:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4693, "total_steps": 9627, "loss": 1.8182, "learning_rate": 5.1965640183875144e-05, "epoch": 0.4874831203905682, "percentage": 48.75, "elapsed_time": "1 day, 11:21:19", "remaining_time": "1 day, 13:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4694, "total_steps": 9627, "loss": 1.8115, "learning_rate": 5.194933612159906e-05, "epoch": 0.48758699491014856, "percentage": 48.76, "elapsed_time": "1 day, 11:21:48", "remaining_time": "1 day, 13:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4695, "total_steps": 9627, "loss": 1.7725, "learning_rate": 5.193303185173388e-05, "epoch": 0.4876908694297289, "percentage": 48.77, "elapsed_time": "1 day, 11:22:16", "remaining_time": "1 day, 13:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4696, "total_steps": 9627, "loss": 1.823, "learning_rate": 5.191672737601591e-05, "epoch": 0.4877947439493092, "percentage": 48.78, "elapsed_time": "1 day, 11:22:46", "remaining_time": "1 day, 13:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4697, "total_steps": 9627, "loss": 1.5653, "learning_rate": 5.1900422696181396e-05, "epoch": 0.4878986184688896, "percentage": 48.79, "elapsed_time": "1 day, 11:23:13", "remaining_time": "1 day, 13:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4698, "total_steps": 9627, "loss": 1.7653, "learning_rate": 5.1884117813966705e-05, "epoch": 0.4880024929884699, "percentage": 48.8, "elapsed_time": "1 day, 11:23:41", "remaining_time": "1 day, 13:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4699, "total_steps": 9627, "loss": 1.7976, "learning_rate": 5.186781273110816e-05, "epoch": 0.48810636750805025, "percentage": 48.81, "elapsed_time": "1 day, 11:24:10", "remaining_time": "1 day, 13:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4700, "total_steps": 9627, "loss": 1.6952, "learning_rate": 5.1851507449342104e-05, "epoch": 0.48821024202763064, "percentage": 48.82, "elapsed_time": "1 day, 11:24:39", "remaining_time": "1 day, 13:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4701, "total_steps": 9627, "loss": 1.6622, "learning_rate": 5.183520197040498e-05, "epoch": 0.48831411654721096, "percentage": 48.83, "elapsed_time": "1 day, 11:25:07", "remaining_time": "1 day, 13:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4702, "total_steps": 9627, "loss": 1.7436, "learning_rate": 5.1818896296033145e-05, "epoch": 0.4884179910667913, "percentage": 48.84, "elapsed_time": "1 day, 11:25:36", "remaining_time": "1 day, 13:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4703, "total_steps": 9627, "loss": 1.6381, "learning_rate": 5.180259042796306e-05, "epoch": 0.4885218655863717, "percentage": 48.85, "elapsed_time": "1 day, 11:26:04", "remaining_time": "1 day, 13:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4704, "total_steps": 9627, "loss": 1.8482, "learning_rate": 5.178628436793115e-05, "epoch": 0.488625740105952, "percentage": 48.86, "elapsed_time": "1 day, 11:26:34", "remaining_time": "1 day, 13:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4705, "total_steps": 9627, "loss": 1.7622, "learning_rate": 5.176997811767387e-05, "epoch": 0.4887296146255324, "percentage": 48.87, "elapsed_time": "1 day, 11:27:02", "remaining_time": "1 day, 13:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4706, "total_steps": 9627, "loss": 1.7822, "learning_rate": 5.175367167892774e-05, "epoch": 0.4888334891451127, "percentage": 48.88, "elapsed_time": "1 day, 11:27:31", "remaining_time": "1 day, 13:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4707, "total_steps": 9627, "loss": 1.4567, "learning_rate": 5.1737365053429254e-05, "epoch": 0.48893736366469304, "percentage": 48.89, "elapsed_time": "1 day, 11:27:59", "remaining_time": "1 day, 13:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4708, "total_steps": 9627, "loss": 1.7415, "learning_rate": 5.1721058242914935e-05, "epoch": 0.4890412381842734, "percentage": 48.9, "elapsed_time": "1 day, 11:28:28", "remaining_time": "1 day, 13:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4709, "total_steps": 9627, "loss": 1.6306, "learning_rate": 5.170475124912134e-05, "epoch": 0.48914511270385375, "percentage": 48.91, "elapsed_time": "1 day, 11:28:57", "remaining_time": "1 day, 13:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4710, "total_steps": 9627, "loss": 1.6247, "learning_rate": 5.168844407378506e-05, "epoch": 0.4892489872234341, "percentage": 48.92, "elapsed_time": "1 day, 11:29:25", "remaining_time": "1 day, 13:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4711, "total_steps": 9627, "loss": 1.6903, "learning_rate": 5.167213671864263e-05, "epoch": 0.48935286174301446, "percentage": 48.94, "elapsed_time": "1 day, 11:29:52", "remaining_time": "1 day, 13:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4712, "total_steps": 9627, "loss": 1.6055, "learning_rate": 5.1655829185430685e-05, "epoch": 0.4894567362625948, "percentage": 48.95, "elapsed_time": "1 day, 11:30:22", "remaining_time": "1 day, 13:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4713, "total_steps": 9627, "loss": 1.6719, "learning_rate": 5.1639521475885854e-05, "epoch": 0.4895606107821751, "percentage": 48.96, "elapsed_time": "1 day, 11:30:50", "remaining_time": "1 day, 13:01:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4714, "total_steps": 9627, "loss": 1.7133, "learning_rate": 5.162321359174476e-05, "epoch": 0.4896644853017555, "percentage": 48.97, "elapsed_time": "1 day, 11:31:19", "remaining_time": "1 day, 13:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4715, "total_steps": 9627, "loss": 1.805, "learning_rate": 5.16069055347441e-05, "epoch": 0.4897683598213358, "percentage": 48.98, "elapsed_time": "1 day, 11:31:47", "remaining_time": "1 day, 13:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4716, "total_steps": 9627, "loss": 1.5628, "learning_rate": 5.1590597306620525e-05, "epoch": 0.48987223434091615, "percentage": 48.99, "elapsed_time": "1 day, 11:32:16", "remaining_time": "1 day, 13:00:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4717, "total_steps": 9627, "loss": 1.5699, "learning_rate": 5.1574288909110744e-05, "epoch": 0.48997610886049653, "percentage": 49.0, "elapsed_time": "1 day, 11:32:44", "remaining_time": "1 day, 13:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4718, "total_steps": 9627, "loss": 1.7159, "learning_rate": 5.155798034395147e-05, "epoch": 0.49007998338007686, "percentage": 49.01, "elapsed_time": "1 day, 11:33:13", "remaining_time": "1 day, 12:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4719, "total_steps": 9627, "loss": 1.8649, "learning_rate": 5.154167161287945e-05, "epoch": 0.49018385789965724, "percentage": 49.02, "elapsed_time": "1 day, 11:33:40", "remaining_time": "1 day, 12:59:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4720, "total_steps": 9627, "loss": 1.7603, "learning_rate": 5.152536271763143e-05, "epoch": 0.49028773241923757, "percentage": 49.03, "elapsed_time": "1 day, 11:34:10", "remaining_time": "1 day, 12:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4721, "total_steps": 9627, "loss": 1.664, "learning_rate": 5.1509053659944175e-05, "epoch": 0.4903916069388179, "percentage": 49.04, "elapsed_time": "1 day, 11:34:38", "remaining_time": "1 day, 12:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4722, "total_steps": 9627, "loss": 1.5613, "learning_rate": 5.149274444155446e-05, "epoch": 0.4904954814583983, "percentage": 49.05, "elapsed_time": "1 day, 11:35:07", "remaining_time": "1 day, 12:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4723, "total_steps": 9627, "loss": 1.7978, "learning_rate": 5.147643506419914e-05, "epoch": 0.4905993559779786, "percentage": 49.06, "elapsed_time": "1 day, 11:35:34", "remaining_time": "1 day, 12:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4724, "total_steps": 9627, "loss": 1.736, "learning_rate": 5.146012552961499e-05, "epoch": 0.49070323049755893, "percentage": 49.07, "elapsed_time": "1 day, 11:36:04", "remaining_time": "1 day, 12:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4725, "total_steps": 9627, "loss": 1.7367, "learning_rate": 5.1443815839538845e-05, "epoch": 0.4908071050171393, "percentage": 49.08, "elapsed_time": "1 day, 11:36:31", "remaining_time": "1 day, 12:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4726, "total_steps": 9627, "loss": 1.4424, "learning_rate": 5.1427505995707594e-05, "epoch": 0.49091097953671964, "percentage": 49.09, "elapsed_time": "1 day, 11:37:01", "remaining_time": "1 day, 12:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4727, "total_steps": 9627, "loss": 1.8207, "learning_rate": 5.1411195999858074e-05, "epoch": 0.49101485405629997, "percentage": 49.1, "elapsed_time": "1 day, 11:37:29", "remaining_time": "1 day, 12:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4728, "total_steps": 9627, "loss": 1.756, "learning_rate": 5.1394885853727195e-05, "epoch": 0.49111872857588035, "percentage": 49.11, "elapsed_time": "1 day, 11:37:57", "remaining_time": "1 day, 12:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4729, "total_steps": 9627, "loss": 1.5362, "learning_rate": 5.137857555905184e-05, "epoch": 0.4912226030954607, "percentage": 49.12, "elapsed_time": "1 day, 11:38:25", "remaining_time": "1 day, 12:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4730, "total_steps": 9627, "loss": 1.6924, "learning_rate": 5.1362265117568965e-05, "epoch": 0.49132647761504106, "percentage": 49.13, "elapsed_time": "1 day, 11:38:54", "remaining_time": "1 day, 12:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4731, "total_steps": 9627, "loss": 1.7965, "learning_rate": 5.134595453101547e-05, "epoch": 0.4914303521346214, "percentage": 49.14, "elapsed_time": "1 day, 11:39:22", "remaining_time": "1 day, 12:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4732, "total_steps": 9627, "loss": 1.5735, "learning_rate": 5.1329643801128324e-05, "epoch": 0.4915342266542017, "percentage": 49.15, "elapsed_time": "1 day, 11:39:51", "remaining_time": "1 day, 12:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4733, "total_steps": 9627, "loss": 1.7203, "learning_rate": 5.131333292964447e-05, "epoch": 0.4916381011737821, "percentage": 49.16, "elapsed_time": "1 day, 11:40:20", "remaining_time": "1 day, 12:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4734, "total_steps": 9627, "loss": 1.7932, "learning_rate": 5.12970219183009e-05, "epoch": 0.4917419756933624, "percentage": 49.17, "elapsed_time": "1 day, 11:40:48", "remaining_time": "1 day, 12:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4735, "total_steps": 9627, "loss": 1.8202, "learning_rate": 5.128071076883463e-05, "epoch": 0.49184585021294275, "percentage": 49.18, "elapsed_time": "1 day, 11:41:17", "remaining_time": "1 day, 12:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4736, "total_steps": 9627, "loss": 1.6721, "learning_rate": 5.126439948298264e-05, "epoch": 0.49194972473252313, "percentage": 49.19, "elapsed_time": "1 day, 11:41:46", "remaining_time": "1 day, 12:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4737, "total_steps": 9627, "loss": 1.6901, "learning_rate": 5.124808806248199e-05, "epoch": 0.49205359925210346, "percentage": 49.21, "elapsed_time": "1 day, 11:42:14", "remaining_time": "1 day, 12:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4738, "total_steps": 9627, "loss": 1.745, "learning_rate": 5.123177650906968e-05, "epoch": 0.4921574737716838, "percentage": 49.22, "elapsed_time": "1 day, 11:42:41", "remaining_time": "1 day, 12:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4739, "total_steps": 9627, "loss": 1.7013, "learning_rate": 5.1215464824482775e-05, "epoch": 0.49226134829126417, "percentage": 49.23, "elapsed_time": "1 day, 11:43:11", "remaining_time": "1 day, 12:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4740, "total_steps": 9627, "loss": 1.5359, "learning_rate": 5.119915301045836e-05, "epoch": 0.4923652228108445, "percentage": 49.24, "elapsed_time": "1 day, 11:43:39", "remaining_time": "1 day, 12:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4741, "total_steps": 9627, "loss": 1.6351, "learning_rate": 5.118284106873349e-05, "epoch": 0.4924690973304248, "percentage": 49.25, "elapsed_time": "1 day, 11:44:07", "remaining_time": "1 day, 12:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4742, "total_steps": 9627, "loss": 1.9368, "learning_rate": 5.116652900104527e-05, "epoch": 0.4925729718500052, "percentage": 49.26, "elapsed_time": "1 day, 11:44:37", "remaining_time": "1 day, 12:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4743, "total_steps": 9627, "loss": 1.6977, "learning_rate": 5.1150216809130826e-05, "epoch": 0.49267684636958553, "percentage": 49.27, "elapsed_time": "1 day, 11:45:05", "remaining_time": "1 day, 12:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4744, "total_steps": 9627, "loss": 1.8549, "learning_rate": 5.113390449472726e-05, "epoch": 0.4927807208891659, "percentage": 49.28, "elapsed_time": "1 day, 11:45:34", "remaining_time": "1 day, 12:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4745, "total_steps": 9627, "loss": 1.7991, "learning_rate": 5.11175920595717e-05, "epoch": 0.49288459540874624, "percentage": 49.29, "elapsed_time": "1 day, 11:46:01", "remaining_time": "1 day, 12:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4746, "total_steps": 9627, "loss": 1.7089, "learning_rate": 5.1101279505401325e-05, "epoch": 0.49298846992832657, "percentage": 49.3, "elapsed_time": "1 day, 11:46:30", "remaining_time": "1 day, 12:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4747, "total_steps": 9627, "loss": 1.6423, "learning_rate": 5.108496683395324e-05, "epoch": 0.49309234444790695, "percentage": 49.31, "elapsed_time": "1 day, 11:46:58", "remaining_time": "1 day, 12:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4748, "total_steps": 9627, "loss": 1.6201, "learning_rate": 5.106865404696468e-05, "epoch": 0.4931962189674873, "percentage": 49.32, "elapsed_time": "1 day, 11:47:28", "remaining_time": "1 day, 12:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4749, "total_steps": 9627, "loss": 1.7299, "learning_rate": 5.1052341146172785e-05, "epoch": 0.4933000934870676, "percentage": 49.33, "elapsed_time": "1 day, 11:47:55", "remaining_time": "1 day, 12:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4750, "total_steps": 9627, "loss": 1.7541, "learning_rate": 5.103602813331476e-05, "epoch": 0.493403968006648, "percentage": 49.34, "elapsed_time": "1 day, 11:48:25", "remaining_time": "1 day, 12:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4751, "total_steps": 9627, "loss": 1.3569, "learning_rate": 5.101971501012785e-05, "epoch": 0.4935078425262283, "percentage": 49.35, "elapsed_time": "1 day, 11:48:53", "remaining_time": "1 day, 12:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4752, "total_steps": 9627, "loss": 1.8115, "learning_rate": 5.1003401778349224e-05, "epoch": 0.49361171704580864, "percentage": 49.36, "elapsed_time": "1 day, 11:49:21", "remaining_time": "1 day, 12:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4753, "total_steps": 9627, "loss": 1.6486, "learning_rate": 5.0987088439716134e-05, "epoch": 0.493715591565389, "percentage": 49.37, "elapsed_time": "1 day, 11:49:51", "remaining_time": "1 day, 12:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4754, "total_steps": 9627, "loss": 1.8906, "learning_rate": 5.097077499596583e-05, "epoch": 0.49381946608496935, "percentage": 49.38, "elapsed_time": "1 day, 11:50:18", "remaining_time": "1 day, 12:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4755, "total_steps": 9627, "loss": 1.5989, "learning_rate": 5.095446144883556e-05, "epoch": 0.4939233406045497, "percentage": 49.39, "elapsed_time": "1 day, 11:50:47", "remaining_time": "1 day, 12:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4756, "total_steps": 9627, "loss": 1.5584, "learning_rate": 5.0938147800062586e-05, "epoch": 0.49402721512413006, "percentage": 49.4, "elapsed_time": "1 day, 11:51:16", "remaining_time": "1 day, 12:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4757, "total_steps": 9627, "loss": 1.6068, "learning_rate": 5.092183405138419e-05, "epoch": 0.4941310896437104, "percentage": 49.41, "elapsed_time": "1 day, 11:51:43", "remaining_time": "1 day, 12:42:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4758, "total_steps": 9627, "loss": 1.8445, "learning_rate": 5.090552020453766e-05, "epoch": 0.49423496416329077, "percentage": 49.42, "elapsed_time": "1 day, 11:52:13", "remaining_time": "1 day, 12:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4759, "total_steps": 9627, "loss": 1.8761, "learning_rate": 5.08892062612603e-05, "epoch": 0.4943388386828711, "percentage": 49.43, "elapsed_time": "1 day, 11:52:42", "remaining_time": "1 day, 12:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4760, "total_steps": 9627, "loss": 1.5639, "learning_rate": 5.08728922232894e-05, "epoch": 0.4944427132024514, "percentage": 49.44, "elapsed_time": "1 day, 11:53:10", "remaining_time": "1 day, 12:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4761, "total_steps": 9627, "loss": 1.7764, "learning_rate": 5.0856578092362285e-05, "epoch": 0.4945465877220318, "percentage": 49.45, "elapsed_time": "1 day, 11:53:39", "remaining_time": "1 day, 12:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4762, "total_steps": 9627, "loss": 1.6924, "learning_rate": 5.084026387021629e-05, "epoch": 0.49465046224161213, "percentage": 49.47, "elapsed_time": "1 day, 11:54:08", "remaining_time": "1 day, 12:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4763, "total_steps": 9627, "loss": 1.7549, "learning_rate": 5.0823949558588746e-05, "epoch": 0.49475433676119246, "percentage": 49.48, "elapsed_time": "1 day, 11:54:37", "remaining_time": "1 day, 12:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4764, "total_steps": 9627, "loss": 1.5389, "learning_rate": 5.0807635159216993e-05, "epoch": 0.49485821128077284, "percentage": 49.49, "elapsed_time": "1 day, 11:55:05", "remaining_time": "1 day, 12:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4765, "total_steps": 9627, "loss": 1.7683, "learning_rate": 5.079132067383842e-05, "epoch": 0.49496208580035317, "percentage": 49.5, "elapsed_time": "1 day, 11:55:34", "remaining_time": "1 day, 12:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4766, "total_steps": 9627, "loss": 1.7123, "learning_rate": 5.077500610419036e-05, "epoch": 0.4950659603199335, "percentage": 49.51, "elapsed_time": "1 day, 11:56:02", "remaining_time": "1 day, 12:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4767, "total_steps": 9627, "loss": 1.7361, "learning_rate": 5.0758691452010175e-05, "epoch": 0.4951698348395139, "percentage": 49.52, "elapsed_time": "1 day, 11:56:31", "remaining_time": "1 day, 12:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4768, "total_steps": 9627, "loss": 1.8205, "learning_rate": 5.0742376719035276e-05, "epoch": 0.4952737093590942, "percentage": 49.53, "elapsed_time": "1 day, 11:56:59", "remaining_time": "1 day, 12:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4769, "total_steps": 9627, "loss": 1.6695, "learning_rate": 5.0726061907003045e-05, "epoch": 0.4953775838786746, "percentage": 49.54, "elapsed_time": "1 day, 11:57:28", "remaining_time": "1 day, 12:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4770, "total_steps": 9627, "loss": 1.6963, "learning_rate": 5.070974701765089e-05, "epoch": 0.4954814583982549, "percentage": 49.55, "elapsed_time": "1 day, 11:57:57", "remaining_time": "1 day, 12:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4771, "total_steps": 9627, "loss": 1.5213, "learning_rate": 5.069343205271622e-05, "epoch": 0.49558533291783524, "percentage": 49.56, "elapsed_time": "1 day, 11:58:25", "remaining_time": "1 day, 12:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4772, "total_steps": 9627, "loss": 1.5632, "learning_rate": 5.067711701393644e-05, "epoch": 0.4956892074374156, "percentage": 49.57, "elapsed_time": "1 day, 11:58:54", "remaining_time": "1 day, 12:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4773, "total_steps": 9627, "loss": 1.717, "learning_rate": 5.066080190304898e-05, "epoch": 0.49579308195699595, "percentage": 49.58, "elapsed_time": "1 day, 11:59:21", "remaining_time": "1 day, 12:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4774, "total_steps": 9627, "loss": 1.7107, "learning_rate": 5.0644486721791273e-05, "epoch": 0.4958969564765763, "percentage": 49.59, "elapsed_time": "1 day, 11:59:51", "remaining_time": "1 day, 12:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4775, "total_steps": 9627, "loss": 1.8646, "learning_rate": 5.0628171471900756e-05, "epoch": 0.49600083099615666, "percentage": 49.6, "elapsed_time": "1 day, 12:00:19", "remaining_time": "1 day, 12:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4776, "total_steps": 9627, "loss": 1.6334, "learning_rate": 5.0611856155114876e-05, "epoch": 0.496104705515737, "percentage": 49.61, "elapsed_time": "1 day, 12:00:48", "remaining_time": "1 day, 12:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4777, "total_steps": 9627, "loss": 1.7811, "learning_rate": 5.059554077317109e-05, "epoch": 0.4962085800353173, "percentage": 49.62, "elapsed_time": "1 day, 12:01:16", "remaining_time": "1 day, 12:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4778, "total_steps": 9627, "loss": 1.6125, "learning_rate": 5.0579225327806847e-05, "epoch": 0.4963124545548977, "percentage": 49.63, "elapsed_time": "1 day, 12:01:45", "remaining_time": "1 day, 12:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4779, "total_steps": 9627, "loss": 1.554, "learning_rate": 5.0562909820759654e-05, "epoch": 0.496416329074478, "percentage": 49.64, "elapsed_time": "1 day, 12:02:13", "remaining_time": "1 day, 12:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4780, "total_steps": 9627, "loss": 1.6951, "learning_rate": 5.054659425376693e-05, "epoch": 0.49652020359405835, "percentage": 49.65, "elapsed_time": "1 day, 12:02:43", "remaining_time": "1 day, 12:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4781, "total_steps": 9627, "loss": 1.7489, "learning_rate": 5.0530278628566175e-05, "epoch": 0.49662407811363873, "percentage": 49.66, "elapsed_time": "1 day, 12:03:11", "remaining_time": "1 day, 12:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4782, "total_steps": 9627, "loss": 1.7431, "learning_rate": 5.05139629468949e-05, "epoch": 0.49672795263321906, "percentage": 49.67, "elapsed_time": "1 day, 12:03:40", "remaining_time": "1 day, 12:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4783, "total_steps": 9627, "loss": 1.5739, "learning_rate": 5.0497647210490565e-05, "epoch": 0.49683182715279944, "percentage": 49.68, "elapsed_time": "1 day, 12:04:08", "remaining_time": "1 day, 12:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4784, "total_steps": 9627, "loss": 1.6096, "learning_rate": 5.048133142109069e-05, "epoch": 0.49693570167237977, "percentage": 49.69, "elapsed_time": "1 day, 12:04:37", "remaining_time": "1 day, 12:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4785, "total_steps": 9627, "loss": 1.8216, "learning_rate": 5.046501558043278e-05, "epoch": 0.4970395761919601, "percentage": 49.7, "elapsed_time": "1 day, 12:05:05", "remaining_time": "1 day, 12:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4786, "total_steps": 9627, "loss": 1.6871, "learning_rate": 5.044869969025434e-05, "epoch": 0.4971434507115405, "percentage": 49.71, "elapsed_time": "1 day, 12:05:34", "remaining_time": "1 day, 12:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4787, "total_steps": 9627, "loss": 1.6358, "learning_rate": 5.043238375229289e-05, "epoch": 0.4972473252311208, "percentage": 49.72, "elapsed_time": "1 day, 12:06:02", "remaining_time": "1 day, 12:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4788, "total_steps": 9627, "loss": 1.6841, "learning_rate": 5.0416067768285924e-05, "epoch": 0.49735119975070113, "percentage": 49.74, "elapsed_time": "1 day, 12:06:31", "remaining_time": "1 day, 12:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4789, "total_steps": 9627, "loss": 1.4662, "learning_rate": 5.039975173997099e-05, "epoch": 0.4974550742702815, "percentage": 49.75, "elapsed_time": "1 day, 12:06:59", "remaining_time": "1 day, 12:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4790, "total_steps": 9627, "loss": 1.8741, "learning_rate": 5.038343566908562e-05, "epoch": 0.49755894878986184, "percentage": 49.76, "elapsed_time": "1 day, 12:07:28", "remaining_time": "1 day, 12:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4791, "total_steps": 9627, "loss": 1.6235, "learning_rate": 5.036711955736734e-05, "epoch": 0.49766282330944217, "percentage": 49.77, "elapsed_time": "1 day, 12:07:56", "remaining_time": "1 day, 12:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4792, "total_steps": 9627, "loss": 1.4756, "learning_rate": 5.0350803406553684e-05, "epoch": 0.49776669782902255, "percentage": 49.78, "elapsed_time": "1 day, 12:08:25", "remaining_time": "1 day, 12:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4793, "total_steps": 9627, "loss": 1.6785, "learning_rate": 5.033448721838222e-05, "epoch": 0.4978705723486029, "percentage": 49.79, "elapsed_time": "1 day, 12:08:53", "remaining_time": "1 day, 12:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4794, "total_steps": 9627, "loss": 1.6019, "learning_rate": 5.0318170994590464e-05, "epoch": 0.4979744468681832, "percentage": 49.8, "elapsed_time": "1 day, 12:09:21", "remaining_time": "1 day, 12:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4795, "total_steps": 9627, "loss": 1.8253, "learning_rate": 5.030185473691597e-05, "epoch": 0.4980783213877636, "percentage": 49.81, "elapsed_time": "1 day, 12:09:51", "remaining_time": "1 day, 12:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4796, "total_steps": 9627, "loss": 1.6124, "learning_rate": 5.0285538447096315e-05, "epoch": 0.4981821959073439, "percentage": 49.82, "elapsed_time": "1 day, 12:10:19", "remaining_time": "1 day, 12:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4797, "total_steps": 9627, "loss": 1.67, "learning_rate": 5.026922212686902e-05, "epoch": 0.4982860704269243, "percentage": 49.83, "elapsed_time": "1 day, 12:10:48", "remaining_time": "1 day, 12:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4798, "total_steps": 9627, "loss": 1.6923, "learning_rate": 5.025290577797169e-05, "epoch": 0.4983899449465046, "percentage": 49.84, "elapsed_time": "1 day, 12:11:16", "remaining_time": "1 day, 12:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4799, "total_steps": 9627, "loss": 1.585, "learning_rate": 5.0236589402141864e-05, "epoch": 0.49849381946608495, "percentage": 49.85, "elapsed_time": "1 day, 12:11:45", "remaining_time": "1 day, 12:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4800, "total_steps": 9627, "loss": 1.4631, "learning_rate": 5.022027300111711e-05, "epoch": 0.49859769398566534, "percentage": 49.86, "elapsed_time": "1 day, 12:12:14", "remaining_time": "1 day, 12:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4801, "total_steps": 9627, "loss": 1.6969, "learning_rate": 5.0203956576635015e-05, "epoch": 0.49870156850524566, "percentage": 49.87, "elapsed_time": "1 day, 12:12:42", "remaining_time": "1 day, 12:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4802, "total_steps": 9627, "loss": 1.8514, "learning_rate": 5.018764013043312e-05, "epoch": 0.498805443024826, "percentage": 49.88, "elapsed_time": "1 day, 12:13:11", "remaining_time": "1 day, 12:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4803, "total_steps": 9627, "loss": 1.7264, "learning_rate": 5.0171323664249005e-05, "epoch": 0.49890931754440637, "percentage": 49.89, "elapsed_time": "1 day, 12:13:39", "remaining_time": "1 day, 12:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4804, "total_steps": 9627, "loss": 1.6963, "learning_rate": 5.0155007179820266e-05, "epoch": 0.4990131920639867, "percentage": 49.9, "elapsed_time": "1 day, 12:14:07", "remaining_time": "1 day, 12:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4805, "total_steps": 9627, "loss": 1.7839, "learning_rate": 5.013869067888448e-05, "epoch": 0.499117066583567, "percentage": 49.91, "elapsed_time": "1 day, 12:14:37", "remaining_time": "1 day, 12:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4806, "total_steps": 9627, "loss": 1.6467, "learning_rate": 5.01223741631792e-05, "epoch": 0.4992209411031474, "percentage": 49.92, "elapsed_time": "1 day, 12:15:05", "remaining_time": "1 day, 12:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4807, "total_steps": 9627, "loss": 1.8405, "learning_rate": 5.010605763444205e-05, "epoch": 0.49932481562272774, "percentage": 49.93, "elapsed_time": "1 day, 12:15:34", "remaining_time": "1 day, 12:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4808, "total_steps": 9627, "loss": 1.6736, "learning_rate": 5.008974109441057e-05, "epoch": 0.4994286901423081, "percentage": 49.94, "elapsed_time": "1 day, 12:16:02", "remaining_time": "1 day, 12:21:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4809, "total_steps": 9627, "loss": 1.6041, "learning_rate": 5.007342454482238e-05, "epoch": 0.49953256466188845, "percentage": 49.95, "elapsed_time": "1 day, 12:16:32", "remaining_time": "1 day, 12:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4810, "total_steps": 9627, "loss": 1.7678, "learning_rate": 5.005710798741503e-05, "epoch": 0.49963643918146877, "percentage": 49.96, "elapsed_time": "1 day, 12:17:00", "remaining_time": "1 day, 12:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4811, "total_steps": 9627, "loss": 1.5475, "learning_rate": 5.0040791423926125e-05, "epoch": 0.49974031370104915, "percentage": 49.97, "elapsed_time": "1 day, 12:17:29", "remaining_time": "1 day, 12:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4812, "total_steps": 9627, "loss": 1.4978, "learning_rate": 5.002447485609327e-05, "epoch": 0.4998441882206295, "percentage": 49.98, "elapsed_time": "1 day, 12:17:57", "remaining_time": "1 day, 12:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4813, "total_steps": 9627, "loss": 1.7025, "learning_rate": 5.0008158285654027e-05, "epoch": 0.4999480627402098, "percentage": 49.99, "elapsed_time": "1 day, 12:18:26", "remaining_time": "1 day, 12:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4814, "total_steps": 9627, "loss": 1.7601, "learning_rate": 4.9991841714345985e-05, "epoch": 0.5000519372597901, "percentage": 50.01, "elapsed_time": "1 day, 12:18:55", "remaining_time": "1 day, 12:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4815, "total_steps": 9627, "loss": 1.5614, "learning_rate": 4.997552514390674e-05, "epoch": 0.5001558117793705, "percentage": 50.02, "elapsed_time": "1 day, 12:19:24", "remaining_time": "1 day, 12:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4816, "total_steps": 9627, "loss": 1.7504, "learning_rate": 4.9959208576073866e-05, "epoch": 0.5002596862989509, "percentage": 50.03, "elapsed_time": "1 day, 12:19:52", "remaining_time": "1 day, 12:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4817, "total_steps": 9627, "loss": 1.6628, "learning_rate": 4.994289201258498e-05, "epoch": 0.5003635608185312, "percentage": 50.04, "elapsed_time": "1 day, 12:20:21", "remaining_time": "1 day, 12:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4818, "total_steps": 9627, "loss": 1.7745, "learning_rate": 4.992657545517764e-05, "epoch": 0.5004674353381116, "percentage": 50.05, "elapsed_time": "1 day, 12:20:50", "remaining_time": "1 day, 12:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4819, "total_steps": 9627, "loss": 1.6339, "learning_rate": 4.9910258905589427e-05, "epoch": 0.5005713098576919, "percentage": 50.06, "elapsed_time": "1 day, 12:21:19", "remaining_time": "1 day, 12:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4820, "total_steps": 9627, "loss": 1.6569, "learning_rate": 4.989394236555797e-05, "epoch": 0.5006751843772722, "percentage": 50.07, "elapsed_time": "1 day, 12:21:47", "remaining_time": "1 day, 12:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4821, "total_steps": 9627, "loss": 1.602, "learning_rate": 4.9877625836820806e-05, "epoch": 0.5007790588968526, "percentage": 50.08, "elapsed_time": "1 day, 12:22:15", "remaining_time": "1 day, 12:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4822, "total_steps": 9627, "loss": 1.6783, "learning_rate": 4.986130932111553e-05, "epoch": 0.500882933416433, "percentage": 50.09, "elapsed_time": "1 day, 12:22:45", "remaining_time": "1 day, 12:15:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4823, "total_steps": 9627, "loss": 1.6118, "learning_rate": 4.984499282017975e-05, "epoch": 0.5009868079360132, "percentage": 50.1, "elapsed_time": "1 day, 12:23:13", "remaining_time": "1 day, 12:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4824, "total_steps": 9627, "loss": 1.8231, "learning_rate": 4.9828676335751006e-05, "epoch": 0.5010906824555936, "percentage": 50.11, "elapsed_time": "1 day, 12:23:42", "remaining_time": "1 day, 12:14:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4825, "total_steps": 9627, "loss": 1.667, "learning_rate": 4.9812359869566896e-05, "epoch": 0.501194556975174, "percentage": 50.12, "elapsed_time": "1 day, 12:24:11", "remaining_time": "1 day, 12:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4826, "total_steps": 9627, "loss": 1.6415, "learning_rate": 4.979604342336501e-05, "epoch": 0.5012984314947543, "percentage": 50.13, "elapsed_time": "1 day, 12:24:40", "remaining_time": "1 day, 12:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4827, "total_steps": 9627, "loss": 1.7066, "learning_rate": 4.977972699888289e-05, "epoch": 0.5014023060143347, "percentage": 50.14, "elapsed_time": "1 day, 12:25:09", "remaining_time": "1 day, 12:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4828, "total_steps": 9627, "loss": 1.6469, "learning_rate": 4.976341059785815e-05, "epoch": 0.501506180533915, "percentage": 50.15, "elapsed_time": "1 day, 12:25:36", "remaining_time": "1 day, 12:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4829, "total_steps": 9627, "loss": 1.9436, "learning_rate": 4.974709422202831e-05, "epoch": 0.5016100550534954, "percentage": 50.16, "elapsed_time": "1 day, 12:26:06", "remaining_time": "1 day, 12:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4830, "total_steps": 9627, "loss": 1.5765, "learning_rate": 4.973077787313099e-05, "epoch": 0.5017139295730757, "percentage": 50.17, "elapsed_time": "1 day, 12:26:34", "remaining_time": "1 day, 12:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4831, "total_steps": 9627, "loss": 1.8306, "learning_rate": 4.9714461552903704e-05, "epoch": 0.5018178040926561, "percentage": 50.18, "elapsed_time": "1 day, 12:27:04", "remaining_time": "1 day, 12:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4832, "total_steps": 9627, "loss": 1.7797, "learning_rate": 4.9698145263084036e-05, "epoch": 0.5019216786122365, "percentage": 50.19, "elapsed_time": "1 day, 12:27:31", "remaining_time": "1 day, 12:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4833, "total_steps": 9627, "loss": 1.646, "learning_rate": 4.968182900540956e-05, "epoch": 0.5020255531318167, "percentage": 50.2, "elapsed_time": "1 day, 12:28:00", "remaining_time": "1 day, 12:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4834, "total_steps": 9627, "loss": 1.6855, "learning_rate": 4.966551278161779e-05, "epoch": 0.5021294276513971, "percentage": 50.21, "elapsed_time": "1 day, 12:28:29", "remaining_time": "1 day, 12:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4835, "total_steps": 9627, "loss": 1.678, "learning_rate": 4.964919659344632e-05, "epoch": 0.5022333021709775, "percentage": 50.22, "elapsed_time": "1 day, 12:28:57", "remaining_time": "1 day, 12:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4836, "total_steps": 9627, "loss": 1.6203, "learning_rate": 4.963288044263268e-05, "epoch": 0.5023371766905578, "percentage": 50.23, "elapsed_time": "1 day, 12:29:25", "remaining_time": "1 day, 12:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4837, "total_steps": 9627, "loss": 1.772, "learning_rate": 4.96165643309144e-05, "epoch": 0.5024410512101382, "percentage": 50.24, "elapsed_time": "1 day, 12:29:54", "remaining_time": "1 day, 12:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4838, "total_steps": 9627, "loss": 1.8326, "learning_rate": 4.9600248260029016e-05, "epoch": 0.5025449257297185, "percentage": 50.25, "elapsed_time": "1 day, 12:30:22", "remaining_time": "1 day, 12:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4839, "total_steps": 9627, "loss": 1.5652, "learning_rate": 4.9583932231714095e-05, "epoch": 0.5026488002492988, "percentage": 50.26, "elapsed_time": "1 day, 12:30:51", "remaining_time": "1 day, 12:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4840, "total_steps": 9627, "loss": 1.8814, "learning_rate": 4.956761624770713e-05, "epoch": 0.5027526747688792, "percentage": 50.28, "elapsed_time": "1 day, 12:31:19", "remaining_time": "1 day, 12:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4841, "total_steps": 9627, "loss": 1.748, "learning_rate": 4.9551300309745666e-05, "epoch": 0.5028565492884596, "percentage": 50.29, "elapsed_time": "1 day, 12:31:48", "remaining_time": "1 day, 12:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4842, "total_steps": 9627, "loss": 1.6055, "learning_rate": 4.953498441956723e-05, "epoch": 0.5029604238080398, "percentage": 50.3, "elapsed_time": "1 day, 12:32:17", "remaining_time": "1 day, 12:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4843, "total_steps": 9627, "loss": 1.7516, "learning_rate": 4.951866857890931e-05, "epoch": 0.5030642983276202, "percentage": 50.31, "elapsed_time": "1 day, 12:32:46", "remaining_time": "1 day, 12:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4844, "total_steps": 9627, "loss": 1.521, "learning_rate": 4.950235278950943e-05, "epoch": 0.5031681728472006, "percentage": 50.32, "elapsed_time": "1 day, 12:33:14", "remaining_time": "1 day, 12:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4845, "total_steps": 9627, "loss": 1.7387, "learning_rate": 4.9486037053105125e-05, "epoch": 0.5032720473667809, "percentage": 50.33, "elapsed_time": "1 day, 12:33:43", "remaining_time": "1 day, 12:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4846, "total_steps": 9627, "loss": 1.6565, "learning_rate": 4.946972137143383e-05, "epoch": 0.5033759218863613, "percentage": 50.34, "elapsed_time": "1 day, 12:34:12", "remaining_time": "1 day, 12:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4847, "total_steps": 9627, "loss": 1.7404, "learning_rate": 4.9453405746233076e-05, "epoch": 0.5034797964059416, "percentage": 50.35, "elapsed_time": "1 day, 12:34:41", "remaining_time": "1 day, 12:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4848, "total_steps": 9627, "loss": 1.7237, "learning_rate": 4.943709017924038e-05, "epoch": 0.5035836709255219, "percentage": 50.36, "elapsed_time": "1 day, 12:35:09", "remaining_time": "1 day, 12:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4849, "total_steps": 9627, "loss": 1.4753, "learning_rate": 4.9420774672193165e-05, "epoch": 0.5036875454451023, "percentage": 50.37, "elapsed_time": "1 day, 12:35:37", "remaining_time": "1 day, 12:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4850, "total_steps": 9627, "loss": 1.9151, "learning_rate": 4.940445922682892e-05, "epoch": 0.5037914199646827, "percentage": 50.38, "elapsed_time": "1 day, 12:36:06", "remaining_time": "1 day, 12:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4851, "total_steps": 9627, "loss": 1.707, "learning_rate": 4.938814384488515e-05, "epoch": 0.503895294484263, "percentage": 50.39, "elapsed_time": "1 day, 12:36:33", "remaining_time": "1 day, 12:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4852, "total_steps": 9627, "loss": 1.658, "learning_rate": 4.937182852809926e-05, "epoch": 0.5039991690038433, "percentage": 50.4, "elapsed_time": "1 day, 12:37:04", "remaining_time": "1 day, 12:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4853, "total_steps": 9627, "loss": 1.8472, "learning_rate": 4.935551327820873e-05, "epoch": 0.5041030435234237, "percentage": 50.41, "elapsed_time": "1 day, 12:37:32", "remaining_time": "1 day, 12:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4854, "total_steps": 9627, "loss": 1.7557, "learning_rate": 4.933919809695103e-05, "epoch": 0.5042069180430041, "percentage": 50.42, "elapsed_time": "1 day, 12:38:01", "remaining_time": "1 day, 12:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4855, "total_steps": 9627, "loss": 1.7145, "learning_rate": 4.9322882986063566e-05, "epoch": 0.5043107925625844, "percentage": 50.43, "elapsed_time": "1 day, 12:38:30", "remaining_time": "1 day, 12:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4856, "total_steps": 9627, "loss": 1.5709, "learning_rate": 4.9306567947283785e-05, "epoch": 0.5044146670821648, "percentage": 50.44, "elapsed_time": "1 day, 12:38:57", "remaining_time": "1 day, 12:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4857, "total_steps": 9627, "loss": 1.6956, "learning_rate": 4.92902529823491e-05, "epoch": 0.5045185416017451, "percentage": 50.45, "elapsed_time": "1 day, 12:39:27", "remaining_time": "1 day, 12:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4858, "total_steps": 9627, "loss": 1.6442, "learning_rate": 4.927393809299696e-05, "epoch": 0.5046224161213254, "percentage": 50.46, "elapsed_time": "1 day, 12:39:55", "remaining_time": "1 day, 11:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4859, "total_steps": 9627, "loss": 1.7561, "learning_rate": 4.925762328096473e-05, "epoch": 0.5047262906409058, "percentage": 50.47, "elapsed_time": "1 day, 12:40:23", "remaining_time": "1 day, 11:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4860, "total_steps": 9627, "loss": 1.6888, "learning_rate": 4.924130854798983e-05, "epoch": 0.5048301651604862, "percentage": 50.48, "elapsed_time": "1 day, 12:40:52", "remaining_time": "1 day, 11:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4861, "total_steps": 9627, "loss": 1.8061, "learning_rate": 4.922499389580967e-05, "epoch": 0.5049340396800664, "percentage": 50.49, "elapsed_time": "1 day, 12:41:22", "remaining_time": "1 day, 11:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4862, "total_steps": 9627, "loss": 1.7401, "learning_rate": 4.920867932616159e-05, "epoch": 0.5050379141996468, "percentage": 50.5, "elapsed_time": "1 day, 12:41:50", "remaining_time": "1 day, 11:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4863, "total_steps": 9627, "loss": 1.5993, "learning_rate": 4.9192364840783e-05, "epoch": 0.5051417887192272, "percentage": 50.51, "elapsed_time": "1 day, 12:42:18", "remaining_time": "1 day, 11:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4864, "total_steps": 9627, "loss": 1.7359, "learning_rate": 4.917605044141127e-05, "epoch": 0.5052456632388075, "percentage": 50.52, "elapsed_time": "1 day, 12:42:48", "remaining_time": "1 day, 11:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4865, "total_steps": 9627, "loss": 1.6507, "learning_rate": 4.915973612978372e-05, "epoch": 0.5053495377583879, "percentage": 50.53, "elapsed_time": "1 day, 12:43:17", "remaining_time": "1 day, 11:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4866, "total_steps": 9627, "loss": 1.6881, "learning_rate": 4.914342190763771e-05, "epoch": 0.5054534122779683, "percentage": 50.55, "elapsed_time": "1 day, 12:43:46", "remaining_time": "1 day, 11:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4867, "total_steps": 9627, "loss": 1.5866, "learning_rate": 4.912710777671062e-05, "epoch": 0.5055572867975485, "percentage": 50.56, "elapsed_time": "1 day, 12:44:14", "remaining_time": "1 day, 11:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4868, "total_steps": 9627, "loss": 1.7478, "learning_rate": 4.9110793738739715e-05, "epoch": 0.5056611613171289, "percentage": 50.57, "elapsed_time": "1 day, 12:44:42", "remaining_time": "1 day, 11:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4869, "total_steps": 9627, "loss": 1.6304, "learning_rate": 4.909447979546235e-05, "epoch": 0.5057650358367093, "percentage": 50.58, "elapsed_time": "1 day, 12:45:12", "remaining_time": "1 day, 11:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4870, "total_steps": 9627, "loss": 1.6151, "learning_rate": 4.907816594861582e-05, "epoch": 0.5058689103562896, "percentage": 50.59, "elapsed_time": "1 day, 12:45:39", "remaining_time": "1 day, 11:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4871, "total_steps": 9627, "loss": 1.7042, "learning_rate": 4.906185219993743e-05, "epoch": 0.5059727848758699, "percentage": 50.6, "elapsed_time": "1 day, 12:46:09", "remaining_time": "1 day, 11:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4872, "total_steps": 9627, "loss": 1.7608, "learning_rate": 4.904553855116445e-05, "epoch": 0.5060766593954503, "percentage": 50.61, "elapsed_time": "1 day, 12:46:37", "remaining_time": "1 day, 11:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4873, "total_steps": 9627, "loss": 1.7, "learning_rate": 4.90292250040342e-05, "epoch": 0.5061805339150306, "percentage": 50.62, "elapsed_time": "1 day, 12:47:06", "remaining_time": "1 day, 11:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4874, "total_steps": 9627, "loss": 1.5532, "learning_rate": 4.901291156028388e-05, "epoch": 0.506284408434611, "percentage": 50.63, "elapsed_time": "1 day, 12:47:34", "remaining_time": "1 day, 11:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4875, "total_steps": 9627, "loss": 1.7019, "learning_rate": 4.899659822165079e-05, "epoch": 0.5063882829541914, "percentage": 50.64, "elapsed_time": "1 day, 12:48:03", "remaining_time": "1 day, 11:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4876, "total_steps": 9627, "loss": 1.7414, "learning_rate": 4.898028498987217e-05, "epoch": 0.5064921574737716, "percentage": 50.65, "elapsed_time": "1 day, 12:48:31", "remaining_time": "1 day, 11:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4877, "total_steps": 9627, "loss": 1.7377, "learning_rate": 4.8963971866685245e-05, "epoch": 0.506596031993352, "percentage": 50.66, "elapsed_time": "1 day, 12:49:00", "remaining_time": "1 day, 11:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4878, "total_steps": 9627, "loss": 1.6698, "learning_rate": 4.894765885382722e-05, "epoch": 0.5066999065129324, "percentage": 50.67, "elapsed_time": "1 day, 12:49:28", "remaining_time": "1 day, 11:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4879, "total_steps": 9627, "loss": 1.5029, "learning_rate": 4.8931345953035326e-05, "epoch": 0.5068037810325128, "percentage": 50.68, "elapsed_time": "1 day, 12:49:58", "remaining_time": "1 day, 11:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4880, "total_steps": 9627, "loss": 1.7055, "learning_rate": 4.891503316604677e-05, "epoch": 0.506907655552093, "percentage": 50.69, "elapsed_time": "1 day, 12:50:26", "remaining_time": "1 day, 11:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4881, "total_steps": 9627, "loss": 1.6002, "learning_rate": 4.889872049459869e-05, "epoch": 0.5070115300716734, "percentage": 50.7, "elapsed_time": "1 day, 12:50:55", "remaining_time": "1 day, 11:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4882, "total_steps": 9627, "loss": 1.6086, "learning_rate": 4.88824079404283e-05, "epoch": 0.5071154045912538, "percentage": 50.71, "elapsed_time": "1 day, 12:51:24", "remaining_time": "1 day, 11:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4883, "total_steps": 9627, "loss": 1.4958, "learning_rate": 4.8866095505272754e-05, "epoch": 0.5072192791108341, "percentage": 50.72, "elapsed_time": "1 day, 12:51:52", "remaining_time": "1 day, 11:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4884, "total_steps": 9627, "loss": 1.6549, "learning_rate": 4.8849783190869186e-05, "epoch": 0.5073231536304145, "percentage": 50.73, "elapsed_time": "1 day, 12:52:21", "remaining_time": "1 day, 11:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4885, "total_steps": 9627, "loss": 1.9594, "learning_rate": 4.883347099895473e-05, "epoch": 0.5074270281499949, "percentage": 50.74, "elapsed_time": "1 day, 12:52:50", "remaining_time": "1 day, 11:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4886, "total_steps": 9627, "loss": 1.5258, "learning_rate": 4.8817158931266534e-05, "epoch": 0.5075309026695751, "percentage": 50.75, "elapsed_time": "1 day, 12:53:19", "remaining_time": "1 day, 11:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4887, "total_steps": 9627, "loss": 1.5779, "learning_rate": 4.880084698954166e-05, "epoch": 0.5076347771891555, "percentage": 50.76, "elapsed_time": "1 day, 12:53:47", "remaining_time": "1 day, 11:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4888, "total_steps": 9627, "loss": 1.874, "learning_rate": 4.878453517551722e-05, "epoch": 0.5077386517087359, "percentage": 50.77, "elapsed_time": "1 day, 12:54:15", "remaining_time": "1 day, 11:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4889, "total_steps": 9627, "loss": 1.4991, "learning_rate": 4.876822349093034e-05, "epoch": 0.5078425262283162, "percentage": 50.78, "elapsed_time": "1 day, 12:54:44", "remaining_time": "1 day, 11:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4890, "total_steps": 9627, "loss": 1.5891, "learning_rate": 4.875191193751802e-05, "epoch": 0.5079464007478965, "percentage": 50.79, "elapsed_time": "1 day, 12:55:12", "remaining_time": "1 day, 11:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4891, "total_steps": 9627, "loss": 1.8611, "learning_rate": 4.873560051701736e-05, "epoch": 0.5080502752674769, "percentage": 50.81, "elapsed_time": "1 day, 12:55:42", "remaining_time": "1 day, 11:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4892, "total_steps": 9627, "loss": 1.5606, "learning_rate": 4.871928923116539e-05, "epoch": 0.5081541497870572, "percentage": 50.82, "elapsed_time": "1 day, 12:56:10", "remaining_time": "1 day, 11:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4893, "total_steps": 9627, "loss": 1.7001, "learning_rate": 4.8702978081699104e-05, "epoch": 0.5082580243066376, "percentage": 50.83, "elapsed_time": "1 day, 12:56:39", "remaining_time": "1 day, 11:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4894, "total_steps": 9627, "loss": 1.8272, "learning_rate": 4.868666707035554e-05, "epoch": 0.508361898826218, "percentage": 50.84, "elapsed_time": "1 day, 12:57:07", "remaining_time": "1 day, 11:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4895, "total_steps": 9627, "loss": 1.8023, "learning_rate": 4.86703561988717e-05, "epoch": 0.5084657733457982, "percentage": 50.85, "elapsed_time": "1 day, 12:57:36", "remaining_time": "1 day, 11:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4896, "total_steps": 9627, "loss": 1.6024, "learning_rate": 4.865404546898454e-05, "epoch": 0.5085696478653786, "percentage": 50.86, "elapsed_time": "1 day, 12:58:05", "remaining_time": "1 day, 11:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4897, "total_steps": 9627, "loss": 1.6815, "learning_rate": 4.863773488243105e-05, "epoch": 0.508673522384959, "percentage": 50.87, "elapsed_time": "1 day, 12:58:34", "remaining_time": "1 day, 11:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4898, "total_steps": 9627, "loss": 1.8893, "learning_rate": 4.862142444094816e-05, "epoch": 0.5087773969045393, "percentage": 50.88, "elapsed_time": "1 day, 12:59:01", "remaining_time": "1 day, 11:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4899, "total_steps": 9627, "loss": 1.6191, "learning_rate": 4.8605114146272824e-05, "epoch": 0.5088812714241197, "percentage": 50.89, "elapsed_time": "1 day, 12:59:31", "remaining_time": "1 day, 11:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4900, "total_steps": 9627, "loss": 1.9152, "learning_rate": 4.858880400014194e-05, "epoch": 0.5089851459437, "percentage": 50.9, "elapsed_time": "1 day, 12:59:59", "remaining_time": "1 day, 11:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4901, "total_steps": 9627, "loss": 1.787, "learning_rate": 4.857249400429244e-05, "epoch": 0.5090890204632803, "percentage": 50.91, "elapsed_time": "1 day, 13:00:28", "remaining_time": "1 day, 11:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4902, "total_steps": 9627, "loss": 1.6278, "learning_rate": 4.8556184160461167e-05, "epoch": 0.5091928949828607, "percentage": 50.92, "elapsed_time": "1 day, 13:00:56", "remaining_time": "1 day, 11:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4903, "total_steps": 9627, "loss": 1.8381, "learning_rate": 4.8539874470385024e-05, "epoch": 0.5092967695024411, "percentage": 50.93, "elapsed_time": "1 day, 13:01:25", "remaining_time": "1 day, 11:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4904, "total_steps": 9627, "loss": 1.7702, "learning_rate": 4.852356493580088e-05, "epoch": 0.5094006440220213, "percentage": 50.94, "elapsed_time": "1 day, 13:01:54", "remaining_time": "1 day, 11:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4905, "total_steps": 9627, "loss": 1.8187, "learning_rate": 4.850725555844555e-05, "epoch": 0.5095045185416017, "percentage": 50.95, "elapsed_time": "1 day, 13:02:22", "remaining_time": "1 day, 11:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4906, "total_steps": 9627, "loss": 1.7612, "learning_rate": 4.8490946340055837e-05, "epoch": 0.5096083930611821, "percentage": 50.96, "elapsed_time": "1 day, 13:02:51", "remaining_time": "1 day, 11:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4907, "total_steps": 9627, "loss": 1.6873, "learning_rate": 4.8474637282368577e-05, "epoch": 0.5097122675807625, "percentage": 50.97, "elapsed_time": "1 day, 13:03:20", "remaining_time": "1 day, 11:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4908, "total_steps": 9627, "loss": 2.1091, "learning_rate": 4.8458328387120565e-05, "epoch": 0.5098161421003428, "percentage": 50.98, "elapsed_time": "1 day, 13:03:48", "remaining_time": "1 day, 11:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4909, "total_steps": 9627, "loss": 1.6583, "learning_rate": 4.844201965604853e-05, "epoch": 0.5099200166199231, "percentage": 50.99, "elapsed_time": "1 day, 13:04:16", "remaining_time": "1 day, 11:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4910, "total_steps": 9627, "loss": 1.5176, "learning_rate": 4.842571109088927e-05, "epoch": 0.5100238911395035, "percentage": 51.0, "elapsed_time": "1 day, 13:04:46", "remaining_time": "1 day, 11:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4911, "total_steps": 9627, "loss": 1.5699, "learning_rate": 4.840940269337949e-05, "epoch": 0.5101277656590838, "percentage": 51.01, "elapsed_time": "1 day, 13:05:14", "remaining_time": "1 day, 11:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4912, "total_steps": 9627, "loss": 1.6266, "learning_rate": 4.839309446525592e-05, "epoch": 0.5102316401786642, "percentage": 51.02, "elapsed_time": "1 day, 13:05:43", "remaining_time": "1 day, 11:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4913, "total_steps": 9627, "loss": 1.6759, "learning_rate": 4.837678640825524e-05, "epoch": 0.5103355146982446, "percentage": 51.03, "elapsed_time": "1 day, 13:06:12", "remaining_time": "1 day, 11:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4914, "total_steps": 9627, "loss": 1.7818, "learning_rate": 4.836047852411417e-05, "epoch": 0.5104393892178248, "percentage": 51.04, "elapsed_time": "1 day, 13:06:40", "remaining_time": "1 day, 11:35:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4915, "total_steps": 9627, "loss": 1.7876, "learning_rate": 4.834417081456933e-05, "epoch": 0.5105432637374052, "percentage": 51.05, "elapsed_time": "1 day, 13:07:09", "remaining_time": "1 day, 11:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4916, "total_steps": 9627, "loss": 1.9106, "learning_rate": 4.8327863281357376e-05, "epoch": 0.5106471382569856, "percentage": 51.06, "elapsed_time": "1 day, 13:07:37", "remaining_time": "1 day, 11:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4917, "total_steps": 9627, "loss": 1.6729, "learning_rate": 4.8311555926214966e-05, "epoch": 0.5107510127765659, "percentage": 51.08, "elapsed_time": "1 day, 13:08:06", "remaining_time": "1 day, 11:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4918, "total_steps": 9627, "loss": 1.7575, "learning_rate": 4.829524875087867e-05, "epoch": 0.5108548872961463, "percentage": 51.09, "elapsed_time": "1 day, 13:08:35", "remaining_time": "1 day, 11:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4919, "total_steps": 9627, "loss": 1.5132, "learning_rate": 4.8278941757085063e-05, "epoch": 0.5109587618157266, "percentage": 51.1, "elapsed_time": "1 day, 13:09:04", "remaining_time": "1 day, 11:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4920, "total_steps": 9627, "loss": 1.6706, "learning_rate": 4.8262634946570764e-05, "epoch": 0.5110626363353069, "percentage": 51.11, "elapsed_time": "1 day, 13:09:33", "remaining_time": "1 day, 11:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4921, "total_steps": 9627, "loss": 1.7722, "learning_rate": 4.824632832107227e-05, "epoch": 0.5111665108548873, "percentage": 51.12, "elapsed_time": "1 day, 13:10:01", "remaining_time": "1 day, 11:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4922, "total_steps": 9627, "loss": 1.7226, "learning_rate": 4.8230021882326135e-05, "epoch": 0.5112703853744677, "percentage": 51.13, "elapsed_time": "1 day, 13:10:30", "remaining_time": "1 day, 11:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4923, "total_steps": 9627, "loss": 1.7858, "learning_rate": 4.821371563206888e-05, "epoch": 0.5113742598940479, "percentage": 51.14, "elapsed_time": "1 day, 13:10:59", "remaining_time": "1 day, 11:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4924, "total_steps": 9627, "loss": 1.4821, "learning_rate": 4.819740957203696e-05, "epoch": 0.5114781344136283, "percentage": 51.15, "elapsed_time": "1 day, 13:11:28", "remaining_time": "1 day, 11:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4925, "total_steps": 9627, "loss": 1.6467, "learning_rate": 4.818110370396686e-05, "epoch": 0.5115820089332087, "percentage": 51.16, "elapsed_time": "1 day, 13:11:56", "remaining_time": "1 day, 11:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4926, "total_steps": 9627, "loss": 1.6146, "learning_rate": 4.816479802959503e-05, "epoch": 0.511685883452789, "percentage": 51.17, "elapsed_time": "1 day, 13:12:24", "remaining_time": "1 day, 11:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4927, "total_steps": 9627, "loss": 1.6783, "learning_rate": 4.81484925506579e-05, "epoch": 0.5117897579723694, "percentage": 51.18, "elapsed_time": "1 day, 13:12:54", "remaining_time": "1 day, 11:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4928, "total_steps": 9627, "loss": 1.749, "learning_rate": 4.813218726889186e-05, "epoch": 0.5118936324919497, "percentage": 51.19, "elapsed_time": "1 day, 13:13:22", "remaining_time": "1 day, 11:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4929, "total_steps": 9627, "loss": 1.5492, "learning_rate": 4.8115882186033326e-05, "epoch": 0.51199750701153, "percentage": 51.2, "elapsed_time": "1 day, 13:13:52", "remaining_time": "1 day, 11:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4930, "total_steps": 9627, "loss": 1.7461, "learning_rate": 4.8099577303818616e-05, "epoch": 0.5121013815311104, "percentage": 51.21, "elapsed_time": "1 day, 13:14:20", "remaining_time": "1 day, 11:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4931, "total_steps": 9627, "loss": 1.9981, "learning_rate": 4.8083272623984104e-05, "epoch": 0.5122052560506908, "percentage": 51.22, "elapsed_time": "1 day, 13:14:49", "remaining_time": "1 day, 11:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4932, "total_steps": 9627, "loss": 1.7219, "learning_rate": 4.8066968148266116e-05, "epoch": 0.5123091305702712, "percentage": 51.23, "elapsed_time": "1 day, 13:15:18", "remaining_time": "1 day, 11:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4933, "total_steps": 9627, "loss": 1.6126, "learning_rate": 4.805066387840096e-05, "epoch": 0.5124130050898514, "percentage": 51.24, "elapsed_time": "1 day, 13:15:45", "remaining_time": "1 day, 11:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4934, "total_steps": 9627, "loss": 1.7436, "learning_rate": 4.803435981612486e-05, "epoch": 0.5125168796094318, "percentage": 51.25, "elapsed_time": "1 day, 13:16:13", "remaining_time": "1 day, 11:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4935, "total_steps": 9627, "loss": 1.6401, "learning_rate": 4.801805596317412e-05, "epoch": 0.5126207541290122, "percentage": 51.26, "elapsed_time": "1 day, 13:16:44", "remaining_time": "1 day, 11:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4936, "total_steps": 9627, "loss": 1.6504, "learning_rate": 4.800175232128498e-05, "epoch": 0.5127246286485925, "percentage": 51.27, "elapsed_time": "1 day, 13:17:12", "remaining_time": "1 day, 11:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4937, "total_steps": 9627, "loss": 1.6495, "learning_rate": 4.79854488921936e-05, "epoch": 0.5128285031681729, "percentage": 51.28, "elapsed_time": "1 day, 13:17:41", "remaining_time": "1 day, 11:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4938, "total_steps": 9627, "loss": 1.6088, "learning_rate": 4.7969145677636215e-05, "epoch": 0.5129323776877532, "percentage": 51.29, "elapsed_time": "1 day, 13:18:09", "remaining_time": "1 day, 11:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4939, "total_steps": 9627, "loss": 1.8945, "learning_rate": 4.795284267934898e-05, "epoch": 0.5130362522073335, "percentage": 51.3, "elapsed_time": "1 day, 13:18:38", "remaining_time": "1 day, 11:24:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4940, "total_steps": 9627, "loss": 1.8459, "learning_rate": 4.793653989906802e-05, "epoch": 0.5131401267269139, "percentage": 51.31, "elapsed_time": "1 day, 13:19:07", "remaining_time": "1 day, 11:24:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4941, "total_steps": 9627, "loss": 1.6314, "learning_rate": 4.792023733852947e-05, "epoch": 0.5132440012464943, "percentage": 51.32, "elapsed_time": "1 day, 13:19:36", "remaining_time": "1 day, 11:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4942, "total_steps": 9627, "loss": 1.6349, "learning_rate": 4.790393499946943e-05, "epoch": 0.5133478757660745, "percentage": 51.33, "elapsed_time": "1 day, 13:20:03", "remaining_time": "1 day, 11:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4943, "total_steps": 9627, "loss": 1.7195, "learning_rate": 4.788763288362394e-05, "epoch": 0.5134517502856549, "percentage": 51.35, "elapsed_time": "1 day, 13:20:32", "remaining_time": "1 day, 11:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4944, "total_steps": 9627, "loss": 1.5917, "learning_rate": 4.787133099272908e-05, "epoch": 0.5135556248052353, "percentage": 51.36, "elapsed_time": "1 day, 13:21:01", "remaining_time": "1 day, 11:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4945, "total_steps": 9627, "loss": 1.6664, "learning_rate": 4.7855029328520876e-05, "epoch": 0.5136594993248156, "percentage": 51.37, "elapsed_time": "1 day, 13:21:30", "remaining_time": "1 day, 11:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4946, "total_steps": 9627, "loss": 1.6255, "learning_rate": 4.7838727892735315e-05, "epoch": 0.513763373844396, "percentage": 51.38, "elapsed_time": "1 day, 13:21:58", "remaining_time": "1 day, 11:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4947, "total_steps": 9627, "loss": 1.7316, "learning_rate": 4.782242668710836e-05, "epoch": 0.5138672483639763, "percentage": 51.39, "elapsed_time": "1 day, 13:22:27", "remaining_time": "1 day, 11:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4948, "total_steps": 9627, "loss": 1.6513, "learning_rate": 4.7806125713376e-05, "epoch": 0.5139711228835566, "percentage": 51.4, "elapsed_time": "1 day, 13:22:56", "remaining_time": "1 day, 11:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4949, "total_steps": 9627, "loss": 1.6415, "learning_rate": 4.7789824973274114e-05, "epoch": 0.514074997403137, "percentage": 51.41, "elapsed_time": "1 day, 13:23:25", "remaining_time": "1 day, 11:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4950, "total_steps": 9627, "loss": 1.8161, "learning_rate": 4.7773524468538624e-05, "epoch": 0.5141788719227174, "percentage": 51.42, "elapsed_time": "1 day, 13:23:53", "remaining_time": "1 day, 11:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4951, "total_steps": 9627, "loss": 1.7179, "learning_rate": 4.7757224200905444e-05, "epoch": 0.5142827464422977, "percentage": 51.43, "elapsed_time": "1 day, 13:24:21", "remaining_time": "1 day, 11:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4952, "total_steps": 9627, "loss": 1.6069, "learning_rate": 4.774092417211037e-05, "epoch": 0.514386620961878, "percentage": 51.44, "elapsed_time": "1 day, 13:24:50", "remaining_time": "1 day, 11:19:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4953, "total_steps": 9627, "loss": 1.7158, "learning_rate": 4.7724624383889256e-05, "epoch": 0.5144904954814584, "percentage": 51.45, "elapsed_time": "1 day, 13:25:19", "remaining_time": "1 day, 11:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4954, "total_steps": 9627, "loss": 1.6917, "learning_rate": 4.770832483797789e-05, "epoch": 0.5145943700010387, "percentage": 51.46, "elapsed_time": "1 day, 13:25:48", "remaining_time": "1 day, 11:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4955, "total_steps": 9627, "loss": 1.817, "learning_rate": 4.769202553611206e-05, "epoch": 0.5146982445206191, "percentage": 51.47, "elapsed_time": "1 day, 13:26:15", "remaining_time": "1 day, 11:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4956, "total_steps": 9627, "loss": 1.7038, "learning_rate": 4.76757264800275e-05, "epoch": 0.5148021190401995, "percentage": 51.48, "elapsed_time": "1 day, 13:26:43", "remaining_time": "1 day, 11:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4957, "total_steps": 9627, "loss": 1.6663, "learning_rate": 4.765942767145994e-05, "epoch": 0.5149059935597798, "percentage": 51.49, "elapsed_time": "1 day, 13:27:12", "remaining_time": "1 day, 11:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4958, "total_steps": 9627, "loss": 1.5594, "learning_rate": 4.764312911214509e-05, "epoch": 0.5150098680793601, "percentage": 51.5, "elapsed_time": "1 day, 13:27:41", "remaining_time": "1 day, 11:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4959, "total_steps": 9627, "loss": 1.7743, "learning_rate": 4.762683080381859e-05, "epoch": 0.5151137425989405, "percentage": 51.51, "elapsed_time": "1 day, 13:28:10", "remaining_time": "1 day, 11:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4960, "total_steps": 9627, "loss": 1.6531, "learning_rate": 4.761053274821611e-05, "epoch": 0.5152176171185209, "percentage": 51.52, "elapsed_time": "1 day, 13:28:38", "remaining_time": "1 day, 11:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4961, "total_steps": 9627, "loss": 1.8683, "learning_rate": 4.7594234947073256e-05, "epoch": 0.5153214916381011, "percentage": 51.53, "elapsed_time": "1 day, 13:29:07", "remaining_time": "1 day, 11:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4962, "total_steps": 9627, "loss": 1.5823, "learning_rate": 4.75779374021256e-05, "epoch": 0.5154253661576815, "percentage": 51.54, "elapsed_time": "1 day, 13:29:36", "remaining_time": "1 day, 11:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4963, "total_steps": 9627, "loss": 1.802, "learning_rate": 4.756164011510871e-05, "epoch": 0.5155292406772619, "percentage": 51.55, "elapsed_time": "1 day, 13:30:04", "remaining_time": "1 day, 11:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4964, "total_steps": 9627, "loss": 1.7046, "learning_rate": 4.754534308775816e-05, "epoch": 0.5156331151968422, "percentage": 51.56, "elapsed_time": "1 day, 13:30:33", "remaining_time": "1 day, 11:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4965, "total_steps": 9627, "loss": 1.5606, "learning_rate": 4.75290463218094e-05, "epoch": 0.5157369897164226, "percentage": 51.57, "elapsed_time": "1 day, 13:31:01", "remaining_time": "1 day, 11:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4966, "total_steps": 9627, "loss": 1.6814, "learning_rate": 4.7512749818997936e-05, "epoch": 0.515840864236003, "percentage": 51.58, "elapsed_time": "1 day, 13:31:29", "remaining_time": "1 day, 11:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4967, "total_steps": 9627, "loss": 1.6354, "learning_rate": 4.749645358105923e-05, "epoch": 0.5159447387555832, "percentage": 51.59, "elapsed_time": "1 day, 13:31:59", "remaining_time": "1 day, 11:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4968, "total_steps": 9627, "loss": 1.6332, "learning_rate": 4.748015760972867e-05, "epoch": 0.5160486132751636, "percentage": 51.6, "elapsed_time": "1 day, 13:32:27", "remaining_time": "1 day, 11:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4969, "total_steps": 9627, "loss": 1.3089, "learning_rate": 4.7463861906741666e-05, "epoch": 0.516152487794744, "percentage": 51.62, "elapsed_time": "1 day, 13:32:56", "remaining_time": "1 day, 11:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4970, "total_steps": 9627, "loss": 1.5917, "learning_rate": 4.7447566473833615e-05, "epoch": 0.5162563623143243, "percentage": 51.63, "elapsed_time": "1 day, 13:33:24", "remaining_time": "1 day, 11:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4971, "total_steps": 9627, "loss": 1.7515, "learning_rate": 4.743127131273979e-05, "epoch": 0.5163602368339046, "percentage": 51.64, "elapsed_time": "1 day, 13:33:52", "remaining_time": "1 day, 11:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4972, "total_steps": 9627, "loss": 1.5085, "learning_rate": 4.7414976425195544e-05, "epoch": 0.516464111353485, "percentage": 51.65, "elapsed_time": "1 day, 13:34:22", "remaining_time": "1 day, 11:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4973, "total_steps": 9627, "loss": 1.8201, "learning_rate": 4.739868181293616e-05, "epoch": 0.5165679858730653, "percentage": 51.66, "elapsed_time": "1 day, 13:34:49", "remaining_time": "1 day, 11:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4974, "total_steps": 9627, "loss": 1.7515, "learning_rate": 4.738238747769687e-05, "epoch": 0.5166718603926457, "percentage": 51.67, "elapsed_time": "1 day, 13:35:18", "remaining_time": "1 day, 11:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4975, "total_steps": 9627, "loss": 1.6677, "learning_rate": 4.7366093421212884e-05, "epoch": 0.5167757349122261, "percentage": 51.68, "elapsed_time": "1 day, 13:35:48", "remaining_time": "1 day, 11:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4976, "total_steps": 9627, "loss": 1.7249, "learning_rate": 4.7349799645219415e-05, "epoch": 0.5168796094318063, "percentage": 51.69, "elapsed_time": "1 day, 13:36:15", "remaining_time": "1 day, 11:08:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4977, "total_steps": 9627, "loss": 1.6639, "learning_rate": 4.73335061514516e-05, "epoch": 0.5169834839513867, "percentage": 51.7, "elapsed_time": "1 day, 13:36:45", "remaining_time": "1 day, 11:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4978, "total_steps": 9627, "loss": 1.6422, "learning_rate": 4.731721294164457e-05, "epoch": 0.5170873584709671, "percentage": 51.71, "elapsed_time": "1 day, 13:37:13", "remaining_time": "1 day, 11:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4979, "total_steps": 9627, "loss": 1.8851, "learning_rate": 4.730092001753346e-05, "epoch": 0.5171912329905474, "percentage": 51.72, "elapsed_time": "1 day, 13:37:41", "remaining_time": "1 day, 11:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4980, "total_steps": 9627, "loss": 1.6397, "learning_rate": 4.72846273808533e-05, "epoch": 0.5172951075101277, "percentage": 51.73, "elapsed_time": "1 day, 13:38:10", "remaining_time": "1 day, 11:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4981, "total_steps": 9627, "loss": 1.4696, "learning_rate": 4.726833503333915e-05, "epoch": 0.5173989820297081, "percentage": 51.74, "elapsed_time": "1 day, 13:38:38", "remaining_time": "1 day, 11:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4982, "total_steps": 9627, "loss": 1.814, "learning_rate": 4.7252042976726e-05, "epoch": 0.5175028565492885, "percentage": 51.75, "elapsed_time": "1 day, 13:39:07", "remaining_time": "1 day, 11:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4983, "total_steps": 9627, "loss": 1.6521, "learning_rate": 4.723575121274885e-05, "epoch": 0.5176067310688688, "percentage": 51.76, "elapsed_time": "1 day, 13:39:35", "remaining_time": "1 day, 11:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4984, "total_steps": 9627, "loss": 1.6085, "learning_rate": 4.721945974314263e-05, "epoch": 0.5177106055884492, "percentage": 51.77, "elapsed_time": "1 day, 13:40:04", "remaining_time": "1 day, 11:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4985, "total_steps": 9627, "loss": 1.6189, "learning_rate": 4.720316856964224e-05, "epoch": 0.5178144801080296, "percentage": 51.78, "elapsed_time": "1 day, 13:40:33", "remaining_time": "1 day, 11:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4986, "total_steps": 9627, "loss": 1.7474, "learning_rate": 4.7186877693982616e-05, "epoch": 0.5179183546276098, "percentage": 51.79, "elapsed_time": "1 day, 13:41:00", "remaining_time": "1 day, 11:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4987, "total_steps": 9627, "loss": 1.5625, "learning_rate": 4.717058711789855e-05, "epoch": 0.5180222291471902, "percentage": 51.8, "elapsed_time": "1 day, 13:41:30", "remaining_time": "1 day, 11:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4988, "total_steps": 9627, "loss": 1.6004, "learning_rate": 4.715429684312489e-05, "epoch": 0.5181261036667706, "percentage": 51.81, "elapsed_time": "1 day, 13:41:57", "remaining_time": "1 day, 11:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4989, "total_steps": 9627, "loss": 1.6596, "learning_rate": 4.713800687139644e-05, "epoch": 0.5182299781863509, "percentage": 51.82, "elapsed_time": "1 day, 13:42:27", "remaining_time": "1 day, 11:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4990, "total_steps": 9627, "loss": 1.8412, "learning_rate": 4.712171720444791e-05, "epoch": 0.5183338527059312, "percentage": 51.83, "elapsed_time": "1 day, 13:42:56", "remaining_time": "1 day, 11:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4991, "total_steps": 9627, "loss": 1.8457, "learning_rate": 4.7105427844014046e-05, "epoch": 0.5184377272255116, "percentage": 51.84, "elapsed_time": "1 day, 13:43:24", "remaining_time": "1 day, 11:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4992, "total_steps": 9627, "loss": 1.6451, "learning_rate": 4.7089138791829554e-05, "epoch": 0.5185416017450919, "percentage": 51.85, "elapsed_time": "1 day, 13:43:54", "remaining_time": "1 day, 11:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4993, "total_steps": 9627, "loss": 1.8016, "learning_rate": 4.707285004962906e-05, "epoch": 0.5186454762646723, "percentage": 51.86, "elapsed_time": "1 day, 13:44:21", "remaining_time": "1 day, 11:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4994, "total_steps": 9627, "loss": 1.5526, "learning_rate": 4.70565616191472e-05, "epoch": 0.5187493507842527, "percentage": 51.87, "elapsed_time": "1 day, 13:44:50", "remaining_time": "1 day, 11:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4995, "total_steps": 9627, "loss": 1.6518, "learning_rate": 4.704027350211859e-05, "epoch": 0.5188532253038329, "percentage": 51.89, "elapsed_time": "1 day, 13:45:19", "remaining_time": "1 day, 11:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4996, "total_steps": 9627, "loss": 1.5955, "learning_rate": 4.702398570027775e-05, "epoch": 0.5189570998234133, "percentage": 51.9, "elapsed_time": "1 day, 13:45:48", "remaining_time": "1 day, 11:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4997, "total_steps": 9627, "loss": 1.7202, "learning_rate": 4.700769821535921e-05, "epoch": 0.5190609743429937, "percentage": 51.91, "elapsed_time": "1 day, 13:46:16", "remaining_time": "1 day, 10:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4998, "total_steps": 9627, "loss": 1.6186, "learning_rate": 4.6991411049097494e-05, "epoch": 0.519164848862574, "percentage": 51.92, "elapsed_time": "1 day, 13:46:46", "remaining_time": "1 day, 10:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4999, "total_steps": 9627, "loss": 1.7077, "learning_rate": 4.697512420322701e-05, "epoch": 0.5192687233821544, "percentage": 51.93, "elapsed_time": "1 day, 13:47:14", "remaining_time": "1 day, 10:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5000, "total_steps": 9627, "loss": 1.5771, "learning_rate": 4.69588376794822e-05, "epoch": 0.5193725979017347, "percentage": 51.94, "elapsed_time": "1 day, 13:47:42", "remaining_time": "1 day, 10:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5001, "total_steps": 9627, "loss": 1.6497, "learning_rate": 4.694255147959749e-05, "epoch": 0.519476472421315, "percentage": 51.95, "elapsed_time": "1 day, 13:48:12", "remaining_time": "1 day, 10:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5002, "total_steps": 9627, "loss": 1.6801, "learning_rate": 4.6926265605307175e-05, "epoch": 0.5195803469408954, "percentage": 51.96, "elapsed_time": "1 day, 13:48:41", "remaining_time": "1 day, 10:57:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5003, "total_steps": 9627, "loss": 1.5736, "learning_rate": 4.690998005834559e-05, "epoch": 0.5196842214604758, "percentage": 51.97, "elapsed_time": "1 day, 13:49:09", "remaining_time": "1 day, 10:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5004, "total_steps": 9627, "loss": 1.7306, "learning_rate": 4.689369484044705e-05, "epoch": 0.519788095980056, "percentage": 51.98, "elapsed_time": "1 day, 13:49:39", "remaining_time": "1 day, 10:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5005, "total_steps": 9627, "loss": 1.7073, "learning_rate": 4.687740995334575e-05, "epoch": 0.5198919704996364, "percentage": 51.99, "elapsed_time": "1 day, 13:50:06", "remaining_time": "1 day, 10:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5006, "total_steps": 9627, "loss": 1.7753, "learning_rate": 4.686112539877594e-05, "epoch": 0.5199958450192168, "percentage": 52.0, "elapsed_time": "1 day, 13:50:36", "remaining_time": "1 day, 10:55:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5007, "total_steps": 9627, "loss": 1.5766, "learning_rate": 4.684484117847181e-05, "epoch": 0.5200997195387971, "percentage": 52.01, "elapsed_time": "1 day, 13:51:04", "remaining_time": "1 day, 10:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5008, "total_steps": 9627, "loss": 1.6717, "learning_rate": 4.6828557294167465e-05, "epoch": 0.5202035940583775, "percentage": 52.02, "elapsed_time": "1 day, 13:51:33", "remaining_time": "1 day, 10:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5009, "total_steps": 9627, "loss": 1.7227, "learning_rate": 4.681227374759704e-05, "epoch": 0.5203074685779578, "percentage": 52.03, "elapsed_time": "1 day, 13:52:01", "remaining_time": "1 day, 10:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5010, "total_steps": 9627, "loss": 1.6448, "learning_rate": 4.679599054049458e-05, "epoch": 0.5204113430975382, "percentage": 52.04, "elapsed_time": "1 day, 13:52:31", "remaining_time": "1 day, 10:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5011, "total_steps": 9627, "loss": 1.7294, "learning_rate": 4.677970767459416e-05, "epoch": 0.5205152176171185, "percentage": 52.05, "elapsed_time": "1 day, 13:52:59", "remaining_time": "1 day, 10:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5012, "total_steps": 9627, "loss": 1.6219, "learning_rate": 4.676342515162973e-05, "epoch": 0.5206190921366989, "percentage": 52.06, "elapsed_time": "1 day, 13:53:27", "remaining_time": "1 day, 10:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5013, "total_steps": 9627, "loss": 1.99, "learning_rate": 4.674714297333527e-05, "epoch": 0.5207229666562793, "percentage": 52.07, "elapsed_time": "1 day, 13:53:55", "remaining_time": "1 day, 10:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5014, "total_steps": 9627, "loss": 1.5943, "learning_rate": 4.673086114144474e-05, "epoch": 0.5208268411758595, "percentage": 52.08, "elapsed_time": "1 day, 13:54:24", "remaining_time": "1 day, 10:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5015, "total_steps": 9627, "loss": 1.6115, "learning_rate": 4.671457965769198e-05, "epoch": 0.5209307156954399, "percentage": 52.09, "elapsed_time": "1 day, 13:54:52", "remaining_time": "1 day, 10:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5016, "total_steps": 9627, "loss": 1.6077, "learning_rate": 4.6698298523810854e-05, "epoch": 0.5210345902150203, "percentage": 52.1, "elapsed_time": "1 day, 13:55:21", "remaining_time": "1 day, 10:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5017, "total_steps": 9627, "loss": 1.5769, "learning_rate": 4.668201774153521e-05, "epoch": 0.5211384647346006, "percentage": 52.11, "elapsed_time": "1 day, 13:55:49", "remaining_time": "1 day, 10:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5018, "total_steps": 9627, "loss": 1.6872, "learning_rate": 4.666573731259877e-05, "epoch": 0.521242339254181, "percentage": 52.12, "elapsed_time": "1 day, 13:56:19", "remaining_time": "1 day, 10:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5019, "total_steps": 9627, "loss": 1.6696, "learning_rate": 4.664945723873529e-05, "epoch": 0.5213462137737613, "percentage": 52.13, "elapsed_time": "1 day, 13:56:47", "remaining_time": "1 day, 10:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5020, "total_steps": 9627, "loss": 1.716, "learning_rate": 4.66331775216785e-05, "epoch": 0.5214500882933416, "percentage": 52.15, "elapsed_time": "1 day, 13:57:16", "remaining_time": "1 day, 10:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5021, "total_steps": 9627, "loss": 1.6107, "learning_rate": 4.6616898163162024e-05, "epoch": 0.521553962812922, "percentage": 52.16, "elapsed_time": "1 day, 13:57:43", "remaining_time": "1 day, 10:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5022, "total_steps": 9627, "loss": 1.6419, "learning_rate": 4.660061916491952e-05, "epoch": 0.5216578373325024, "percentage": 52.17, "elapsed_time": "1 day, 13:58:13", "remaining_time": "1 day, 10:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5023, "total_steps": 9627, "loss": 1.8734, "learning_rate": 4.658434052868455e-05, "epoch": 0.5217617118520826, "percentage": 52.18, "elapsed_time": "1 day, 13:58:41", "remaining_time": "1 day, 10:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5024, "total_steps": 9627, "loss": 1.8781, "learning_rate": 4.656806225619067e-05, "epoch": 0.521865586371663, "percentage": 52.19, "elapsed_time": "1 day, 13:59:09", "remaining_time": "1 day, 10:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5025, "total_steps": 9627, "loss": 1.7415, "learning_rate": 4.655178434917139e-05, "epoch": 0.5219694608912434, "percentage": 52.2, "elapsed_time": "1 day, 13:59:39", "remaining_time": "1 day, 10:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5026, "total_steps": 9627, "loss": 1.6995, "learning_rate": 4.65355068093602e-05, "epoch": 0.5220733354108237, "percentage": 52.21, "elapsed_time": "1 day, 14:00:06", "remaining_time": "1 day, 10:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5027, "total_steps": 9627, "loss": 1.7536, "learning_rate": 4.651922963849048e-05, "epoch": 0.5221772099304041, "percentage": 52.22, "elapsed_time": "1 day, 14:00:35", "remaining_time": "1 day, 10:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5028, "total_steps": 9627, "loss": 1.6309, "learning_rate": 4.6502952838295654e-05, "epoch": 0.5222810844499844, "percentage": 52.23, "elapsed_time": "1 day, 14:01:03", "remaining_time": "1 day, 10:46:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5029, "total_steps": 9627, "loss": 1.6537, "learning_rate": 4.64866764105091e-05, "epoch": 0.5223849589695647, "percentage": 52.24, "elapsed_time": "1 day, 14:01:32", "remaining_time": "1 day, 10:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5030, "total_steps": 9627, "loss": 1.3474, "learning_rate": 4.647040035686409e-05, "epoch": 0.5224888334891451, "percentage": 52.25, "elapsed_time": "1 day, 14:02:01", "remaining_time": "1 day, 10:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5031, "total_steps": 9627, "loss": 1.6824, "learning_rate": 4.64541246790939e-05, "epoch": 0.5225927080087255, "percentage": 52.26, "elapsed_time": "1 day, 14:02:29", "remaining_time": "1 day, 10:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5032, "total_steps": 9627, "loss": 1.6969, "learning_rate": 4.643784937893179e-05, "epoch": 0.5226965825283058, "percentage": 52.27, "elapsed_time": "1 day, 14:02:57", "remaining_time": "1 day, 10:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5033, "total_steps": 9627, "loss": 1.614, "learning_rate": 4.642157445811092e-05, "epoch": 0.5228004570478861, "percentage": 52.28, "elapsed_time": "1 day, 14:03:26", "remaining_time": "1 day, 10:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5034, "total_steps": 9627, "loss": 1.7664, "learning_rate": 4.6405299918364456e-05, "epoch": 0.5229043315674665, "percentage": 52.29, "elapsed_time": "1 day, 14:03:55", "remaining_time": "1 day, 10:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5035, "total_steps": 9627, "loss": 1.4807, "learning_rate": 4.638902576142552e-05, "epoch": 0.5230082060870469, "percentage": 52.3, "elapsed_time": "1 day, 14:04:24", "remaining_time": "1 day, 10:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5036, "total_steps": 9627, "loss": 1.4604, "learning_rate": 4.637275198902717e-05, "epoch": 0.5231120806066272, "percentage": 52.31, "elapsed_time": "1 day, 14:04:51", "remaining_time": "1 day, 10:42:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5037, "total_steps": 9627, "loss": 1.7642, "learning_rate": 4.635647860290244e-05, "epoch": 0.5232159551262076, "percentage": 52.32, "elapsed_time": "1 day, 14:05:21", "remaining_time": "1 day, 10:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5038, "total_steps": 9627, "loss": 1.7285, "learning_rate": 4.634020560478431e-05, "epoch": 0.5233198296457879, "percentage": 52.33, "elapsed_time": "1 day, 14:05:48", "remaining_time": "1 day, 10:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5039, "total_steps": 9627, "loss": 1.665, "learning_rate": 4.6323932996405764e-05, "epoch": 0.5234237041653682, "percentage": 52.34, "elapsed_time": "1 day, 14:06:18", "remaining_time": "1 day, 10:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5040, "total_steps": 9627, "loss": 1.731, "learning_rate": 4.630766077949965e-05, "epoch": 0.5235275786849486, "percentage": 52.35, "elapsed_time": "1 day, 14:06:47", "remaining_time": "1 day, 10:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5041, "total_steps": 9627, "loss": 1.541, "learning_rate": 4.629138895579886e-05, "epoch": 0.523631453204529, "percentage": 52.36, "elapsed_time": "1 day, 14:07:14", "remaining_time": "1 day, 10:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5042, "total_steps": 9627, "loss": 1.6621, "learning_rate": 4.6275117527036246e-05, "epoch": 0.5237353277241092, "percentage": 52.37, "elapsed_time": "1 day, 14:07:43", "remaining_time": "1 day, 10:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5043, "total_steps": 9627, "loss": 1.5298, "learning_rate": 4.625884649494453e-05, "epoch": 0.5238392022436896, "percentage": 52.38, "elapsed_time": "1 day, 14:08:11", "remaining_time": "1 day, 10:39:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5044, "total_steps": 9627, "loss": 1.8429, "learning_rate": 4.6242575861256496e-05, "epoch": 0.52394307676327, "percentage": 52.39, "elapsed_time": "1 day, 14:08:39", "remaining_time": "1 day, 10:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5045, "total_steps": 9627, "loss": 1.589, "learning_rate": 4.622630562770483e-05, "epoch": 0.5240469512828503, "percentage": 52.4, "elapsed_time": "1 day, 14:09:09", "remaining_time": "1 day, 10:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5046, "total_steps": 9627, "loss": 1.6403, "learning_rate": 4.6210035796022166e-05, "epoch": 0.5241508258024307, "percentage": 52.42, "elapsed_time": "1 day, 14:09:37", "remaining_time": "1 day, 10:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5047, "total_steps": 9627, "loss": 1.6255, "learning_rate": 4.619376636794113e-05, "epoch": 0.524254700322011, "percentage": 52.43, "elapsed_time": "1 day, 14:10:06", "remaining_time": "1 day, 10:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5048, "total_steps": 9627, "loss": 1.627, "learning_rate": 4.61774973451943e-05, "epoch": 0.5243585748415913, "percentage": 52.44, "elapsed_time": "1 day, 14:10:33", "remaining_time": "1 day, 10:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5049, "total_steps": 9627, "loss": 1.5215, "learning_rate": 4.6161228729514164e-05, "epoch": 0.5244624493611717, "percentage": 52.45, "elapsed_time": "1 day, 14:11:03", "remaining_time": "1 day, 10:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5050, "total_steps": 9627, "loss": 1.615, "learning_rate": 4.614496052263324e-05, "epoch": 0.5245663238807521, "percentage": 52.46, "elapsed_time": "1 day, 14:11:32", "remaining_time": "1 day, 10:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5051, "total_steps": 9627, "loss": 1.8979, "learning_rate": 4.612869272628394e-05, "epoch": 0.5246701984003324, "percentage": 52.47, "elapsed_time": "1 day, 14:12:00", "remaining_time": "1 day, 10:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5052, "total_steps": 9627, "loss": 1.7807, "learning_rate": 4.611242534219867e-05, "epoch": 0.5247740729199127, "percentage": 52.48, "elapsed_time": "1 day, 14:12:29", "remaining_time": "1 day, 10:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5053, "total_steps": 9627, "loss": 1.6944, "learning_rate": 4.609615837210977e-05, "epoch": 0.5248779474394931, "percentage": 52.49, "elapsed_time": "1 day, 14:12:58", "remaining_time": "1 day, 10:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5054, "total_steps": 9627, "loss": 1.5408, "learning_rate": 4.6079891817749576e-05, "epoch": 0.5249818219590734, "percentage": 52.5, "elapsed_time": "1 day, 14:13:26", "remaining_time": "1 day, 10:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5055, "total_steps": 9627, "loss": 1.8648, "learning_rate": 4.6063625680850306e-05, "epoch": 0.5250856964786538, "percentage": 52.51, "elapsed_time": "1 day, 14:13:54", "remaining_time": "1 day, 10:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5056, "total_steps": 9627, "loss": 1.5844, "learning_rate": 4.6047359963144187e-05, "epoch": 0.5251895709982342, "percentage": 52.52, "elapsed_time": "1 day, 14:14:23", "remaining_time": "1 day, 10:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5057, "total_steps": 9627, "loss": 1.9145, "learning_rate": 4.6031094666363426e-05, "epoch": 0.5252934455178144, "percentage": 52.53, "elapsed_time": "1 day, 14:14:51", "remaining_time": "1 day, 10:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5058, "total_steps": 9627, "loss": 1.9522, "learning_rate": 4.601482979224012e-05, "epoch": 0.5253973200373948, "percentage": 52.54, "elapsed_time": "1 day, 14:15:19", "remaining_time": "1 day, 10:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5059, "total_steps": 9627, "loss": 1.7487, "learning_rate": 4.599856534250633e-05, "epoch": 0.5255011945569752, "percentage": 52.55, "elapsed_time": "1 day, 14:15:49", "remaining_time": "1 day, 10:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5060, "total_steps": 9627, "loss": 1.7626, "learning_rate": 4.5982301318894126e-05, "epoch": 0.5256050690765556, "percentage": 52.56, "elapsed_time": "1 day, 14:16:16", "remaining_time": "1 day, 10:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5061, "total_steps": 9627, "loss": 1.9035, "learning_rate": 4.596603772313552e-05, "epoch": 0.5257089435961358, "percentage": 52.57, "elapsed_time": "1 day, 14:16:44", "remaining_time": "1 day, 10:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5062, "total_steps": 9627, "loss": 1.654, "learning_rate": 4.59497745569624e-05, "epoch": 0.5258128181157162, "percentage": 52.58, "elapsed_time": "1 day, 14:17:14", "remaining_time": "1 day, 10:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5063, "total_steps": 9627, "loss": 1.6587, "learning_rate": 4.593351182210671e-05, "epoch": 0.5259166926352966, "percentage": 52.59, "elapsed_time": "1 day, 14:17:42", "remaining_time": "1 day, 10:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5064, "total_steps": 9627, "loss": 1.7732, "learning_rate": 4.59172495203003e-05, "epoch": 0.5260205671548769, "percentage": 52.6, "elapsed_time": "1 day, 14:18:12", "remaining_time": "1 day, 10:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5065, "total_steps": 9627, "loss": 1.7154, "learning_rate": 4.590098765327496e-05, "epoch": 0.5261244416744573, "percentage": 52.61, "elapsed_time": "1 day, 14:18:39", "remaining_time": "1 day, 10:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5066, "total_steps": 9627, "loss": 1.7209, "learning_rate": 4.588472622276245e-05, "epoch": 0.5262283161940376, "percentage": 52.62, "elapsed_time": "1 day, 14:19:08", "remaining_time": "1 day, 10:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5067, "total_steps": 9627, "loss": 1.7113, "learning_rate": 4.5868465230494525e-05, "epoch": 0.5263321907136179, "percentage": 52.63, "elapsed_time": "1 day, 14:19:38", "remaining_time": "1 day, 10:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5068, "total_steps": 9627, "loss": 1.7318, "learning_rate": 4.58522046782028e-05, "epoch": 0.5264360652331983, "percentage": 52.64, "elapsed_time": "1 day, 14:20:06", "remaining_time": "1 day, 10:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5069, "total_steps": 9627, "loss": 1.721, "learning_rate": 4.5835944567618916e-05, "epoch": 0.5265399397527787, "percentage": 52.65, "elapsed_time": "1 day, 14:20:34", "remaining_time": "1 day, 10:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5070, "total_steps": 9627, "loss": 1.7771, "learning_rate": 4.5819684900474486e-05, "epoch": 0.526643814272359, "percentage": 52.66, "elapsed_time": "1 day, 14:21:03", "remaining_time": "1 day, 10:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5071, "total_steps": 9627, "loss": 1.6757, "learning_rate": 4.580342567850098e-05, "epoch": 0.5267476887919393, "percentage": 52.67, "elapsed_time": "1 day, 14:21:31", "remaining_time": "1 day, 10:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5072, "total_steps": 9627, "loss": 1.597, "learning_rate": 4.578716690342992e-05, "epoch": 0.5268515633115197, "percentage": 52.69, "elapsed_time": "1 day, 14:22:00", "remaining_time": "1 day, 10:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5073, "total_steps": 9627, "loss": 1.4776, "learning_rate": 4.577090857699273e-05, "epoch": 0.5269554378311, "percentage": 52.7, "elapsed_time": "1 day, 14:22:29", "remaining_time": "1 day, 10:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5074, "total_steps": 9627, "loss": 1.7005, "learning_rate": 4.575465070092077e-05, "epoch": 0.5270593123506804, "percentage": 52.71, "elapsed_time": "1 day, 14:22:57", "remaining_time": "1 day, 10:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5075, "total_steps": 9627, "loss": 1.7374, "learning_rate": 4.573839327694539e-05, "epoch": 0.5271631868702608, "percentage": 52.72, "elapsed_time": "1 day, 14:23:26", "remaining_time": "1 day, 10:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5076, "total_steps": 9627, "loss": 1.7146, "learning_rate": 4.5722136306797914e-05, "epoch": 0.527267061389841, "percentage": 52.73, "elapsed_time": "1 day, 14:23:55", "remaining_time": "1 day, 10:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5077, "total_steps": 9627, "loss": 1.7662, "learning_rate": 4.570587979220953e-05, "epoch": 0.5273709359094214, "percentage": 52.74, "elapsed_time": "1 day, 14:24:24", "remaining_time": "1 day, 10:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5078, "total_steps": 9627, "loss": 1.5801, "learning_rate": 4.568962373491146e-05, "epoch": 0.5274748104290018, "percentage": 52.75, "elapsed_time": "1 day, 14:24:52", "remaining_time": "1 day, 10:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5079, "total_steps": 9627, "loss": 1.6804, "learning_rate": 4.567336813663484e-05, "epoch": 0.5275786849485821, "percentage": 52.76, "elapsed_time": "1 day, 14:25:21", "remaining_time": "1 day, 10:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5080, "total_steps": 9627, "loss": 1.6895, "learning_rate": 4.565711299911076e-05, "epoch": 0.5276825594681624, "percentage": 52.77, "elapsed_time": "1 day, 14:25:49", "remaining_time": "1 day, 10:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5081, "total_steps": 9627, "loss": 1.9221, "learning_rate": 4.564085832407026e-05, "epoch": 0.5277864339877428, "percentage": 52.78, "elapsed_time": "1 day, 14:26:18", "remaining_time": "1 day, 10:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5082, "total_steps": 9627, "loss": 1.6225, "learning_rate": 4.5624604113244376e-05, "epoch": 0.5278903085073231, "percentage": 52.79, "elapsed_time": "1 day, 14:26:47", "remaining_time": "1 day, 10:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5083, "total_steps": 9627, "loss": 1.4058, "learning_rate": 4.5608350368363995e-05, "epoch": 0.5279941830269035, "percentage": 52.8, "elapsed_time": "1 day, 14:27:16", "remaining_time": "1 day, 10:22:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5084, "total_steps": 9627, "loss": 1.4616, "learning_rate": 4.559209709116005e-05, "epoch": 0.5280980575464839, "percentage": 52.81, "elapsed_time": "1 day, 14:27:44", "remaining_time": "1 day, 10:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5085, "total_steps": 9627, "loss": 1.7984, "learning_rate": 4.557584428336339e-05, "epoch": 0.5282019320660641, "percentage": 52.82, "elapsed_time": "1 day, 14:28:13", "remaining_time": "1 day, 10:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5086, "total_steps": 9627, "loss": 1.6124, "learning_rate": 4.555959194670481e-05, "epoch": 0.5283058065856445, "percentage": 52.83, "elapsed_time": "1 day, 14:28:42", "remaining_time": "1 day, 10:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5087, "total_steps": 9627, "loss": 1.629, "learning_rate": 4.554334008291503e-05, "epoch": 0.5284096811052249, "percentage": 52.84, "elapsed_time": "1 day, 14:29:10", "remaining_time": "1 day, 10:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5088, "total_steps": 9627, "loss": 1.6488, "learning_rate": 4.5527088693724775e-05, "epoch": 0.5285135556248053, "percentage": 52.85, "elapsed_time": "1 day, 14:29:39", "remaining_time": "1 day, 10:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5089, "total_steps": 9627, "loss": 1.8, "learning_rate": 4.5510837780864705e-05, "epoch": 0.5286174301443856, "percentage": 52.86, "elapsed_time": "1 day, 14:30:08", "remaining_time": "1 day, 10:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5090, "total_steps": 9627, "loss": 1.6027, "learning_rate": 4.549458734606537e-05, "epoch": 0.5287213046639659, "percentage": 52.87, "elapsed_time": "1 day, 14:30:37", "remaining_time": "1 day, 10:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5091, "total_steps": 9627, "loss": 1.4691, "learning_rate": 4.547833739105735e-05, "epoch": 0.5288251791835463, "percentage": 52.88, "elapsed_time": "1 day, 14:31:05", "remaining_time": "1 day, 10:19:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5092, "total_steps": 9627, "loss": 1.7615, "learning_rate": 4.5462087917571124e-05, "epoch": 0.5289290537031266, "percentage": 52.89, "elapsed_time": "1 day, 14:31:34", "remaining_time": "1 day, 10:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5093, "total_steps": 9627, "loss": 1.6093, "learning_rate": 4.544583892733714e-05, "epoch": 0.529032928222707, "percentage": 52.9, "elapsed_time": "1 day, 14:32:02", "remaining_time": "1 day, 10:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5094, "total_steps": 9627, "loss": 1.7545, "learning_rate": 4.5429590422085776e-05, "epoch": 0.5291368027422874, "percentage": 52.91, "elapsed_time": "1 day, 14:32:31", "remaining_time": "1 day, 10:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5095, "total_steps": 9627, "loss": 1.6709, "learning_rate": 4.5413342403547403e-05, "epoch": 0.5292406772618676, "percentage": 52.92, "elapsed_time": "1 day, 14:32:59", "remaining_time": "1 day, 10:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5096, "total_steps": 9627, "loss": 1.4997, "learning_rate": 4.539709487345227e-05, "epoch": 0.529344551781448, "percentage": 52.93, "elapsed_time": "1 day, 14:33:29", "remaining_time": "1 day, 10:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5097, "total_steps": 9627, "loss": 1.803, "learning_rate": 4.5380847833530625e-05, "epoch": 0.5294484263010284, "percentage": 52.94, "elapsed_time": "1 day, 14:33:56", "remaining_time": "1 day, 10:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5098, "total_steps": 9627, "loss": 1.589, "learning_rate": 4.5364601285512674e-05, "epoch": 0.5295523008206087, "percentage": 52.96, "elapsed_time": "1 day, 14:34:25", "remaining_time": "1 day, 10:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5099, "total_steps": 9627, "loss": 1.6351, "learning_rate": 4.534835523112852e-05, "epoch": 0.529656175340189, "percentage": 52.97, "elapsed_time": "1 day, 14:34:53", "remaining_time": "1 day, 10:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5100, "total_steps": 9627, "loss": 1.7417, "learning_rate": 4.533210967210824e-05, "epoch": 0.5297600498597694, "percentage": 52.98, "elapsed_time": "1 day, 14:35:21", "remaining_time": "1 day, 10:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5101, "total_steps": 9627, "loss": 1.9393, "learning_rate": 4.5315864610181894e-05, "epoch": 0.5298639243793497, "percentage": 52.99, "elapsed_time": "1 day, 14:35:51", "remaining_time": "1 day, 10:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5102, "total_steps": 9627, "loss": 1.5193, "learning_rate": 4.52996200470794e-05, "epoch": 0.5299677988989301, "percentage": 53.0, "elapsed_time": "1 day, 14:36:20", "remaining_time": "1 day, 10:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5103, "total_steps": 9627, "loss": 1.6073, "learning_rate": 4.528337598453071e-05, "epoch": 0.5300716734185105, "percentage": 53.01, "elapsed_time": "1 day, 14:36:49", "remaining_time": "1 day, 10:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5104, "total_steps": 9627, "loss": 1.6722, "learning_rate": 4.5267132424265705e-05, "epoch": 0.5301755479380907, "percentage": 53.02, "elapsed_time": "1 day, 14:37:17", "remaining_time": "1 day, 10:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5105, "total_steps": 9627, "loss": 1.684, "learning_rate": 4.5250889368014166e-05, "epoch": 0.5302794224576711, "percentage": 53.03, "elapsed_time": "1 day, 14:37:46", "remaining_time": "1 day, 10:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5106, "total_steps": 9627, "loss": 1.5668, "learning_rate": 4.523464681750587e-05, "epoch": 0.5303832969772515, "percentage": 53.04, "elapsed_time": "1 day, 14:38:14", "remaining_time": "1 day, 10:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5107, "total_steps": 9627, "loss": 1.8714, "learning_rate": 4.521840477447051e-05, "epoch": 0.5304871714968318, "percentage": 53.05, "elapsed_time": "1 day, 14:38:42", "remaining_time": "1 day, 10:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5108, "total_steps": 9627, "loss": 1.6501, "learning_rate": 4.5202163240637755e-05, "epoch": 0.5305910460164122, "percentage": 53.06, "elapsed_time": "1 day, 14:39:10", "remaining_time": "1 day, 10:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5109, "total_steps": 9627, "loss": 1.5287, "learning_rate": 4.5185922217737175e-05, "epoch": 0.5306949205359925, "percentage": 53.07, "elapsed_time": "1 day, 14:39:39", "remaining_time": "1 day, 10:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5110, "total_steps": 9627, "loss": 1.7683, "learning_rate": 4.5169681707498354e-05, "epoch": 0.5307987950555728, "percentage": 53.08, "elapsed_time": "1 day, 14:40:09", "remaining_time": "1 day, 10:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5111, "total_steps": 9627, "loss": 1.4853, "learning_rate": 4.515344171165072e-05, "epoch": 0.5309026695751532, "percentage": 53.09, "elapsed_time": "1 day, 14:40:37", "remaining_time": "1 day, 10:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5112, "total_steps": 9627, "loss": 1.7049, "learning_rate": 4.5137202231923744e-05, "epoch": 0.5310065440947336, "percentage": 53.1, "elapsed_time": "1 day, 14:41:06", "remaining_time": "1 day, 10:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5113, "total_steps": 9627, "loss": 1.822, "learning_rate": 4.512096327004682e-05, "epoch": 0.531110418614314, "percentage": 53.11, "elapsed_time": "1 day, 14:41:34", "remaining_time": "1 day, 10:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5114, "total_steps": 9627, "loss": 1.8201, "learning_rate": 4.5104724827749254e-05, "epoch": 0.5312142931338942, "percentage": 53.12, "elapsed_time": "1 day, 14:42:03", "remaining_time": "1 day, 10:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5115, "total_steps": 9627, "loss": 1.8475, "learning_rate": 4.508848690676028e-05, "epoch": 0.5313181676534746, "percentage": 53.13, "elapsed_time": "1 day, 14:42:31", "remaining_time": "1 day, 10:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5116, "total_steps": 9627, "loss": 1.8352, "learning_rate": 4.507224950880915e-05, "epoch": 0.531422042173055, "percentage": 53.14, "elapsed_time": "1 day, 14:43:02", "remaining_time": "1 day, 10:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5117, "total_steps": 9627, "loss": 1.7358, "learning_rate": 4.505601263562502e-05, "epoch": 0.5315259166926353, "percentage": 53.15, "elapsed_time": "1 day, 14:43:29", "remaining_time": "1 day, 10:07:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5118, "total_steps": 9627, "loss": 1.7055, "learning_rate": 4.503977628893697e-05, "epoch": 0.5316297912122157, "percentage": 53.16, "elapsed_time": "1 day, 14:43:59", "remaining_time": "1 day, 10:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5119, "total_steps": 9627, "loss": 1.6146, "learning_rate": 4.502354047047406e-05, "epoch": 0.531733665731796, "percentage": 53.17, "elapsed_time": "1 day, 14:44:27", "remaining_time": "1 day, 10:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5120, "total_steps": 9627, "loss": 1.6813, "learning_rate": 4.500730518196527e-05, "epoch": 0.5318375402513763, "percentage": 53.18, "elapsed_time": "1 day, 14:44:55", "remaining_time": "1 day, 10:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5121, "total_steps": 9627, "loss": 1.566, "learning_rate": 4.499107042513953e-05, "epoch": 0.5319414147709567, "percentage": 53.19, "elapsed_time": "1 day, 14:45:25", "remaining_time": "1 day, 10:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5122, "total_steps": 9627, "loss": 1.5526, "learning_rate": 4.4974836201725715e-05, "epoch": 0.5320452892905371, "percentage": 53.2, "elapsed_time": "1 day, 14:45:53", "remaining_time": "1 day, 10:05:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5123, "total_steps": 9627, "loss": 1.6931, "learning_rate": 4.495860251345266e-05, "epoch": 0.5321491638101173, "percentage": 53.21, "elapsed_time": "1 day, 14:46:22", "remaining_time": "1 day, 10:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5124, "total_steps": 9627, "loss": 1.5507, "learning_rate": 4.49423693620491e-05, "epoch": 0.5322530383296977, "percentage": 53.23, "elapsed_time": "1 day, 14:46:51", "remaining_time": "1 day, 10:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5125, "total_steps": 9627, "loss": 1.7912, "learning_rate": 4.4926136749243754e-05, "epoch": 0.5323569128492781, "percentage": 53.24, "elapsed_time": "1 day, 14:47:18", "remaining_time": "1 day, 10:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5126, "total_steps": 9627, "loss": 1.7354, "learning_rate": 4.490990467676528e-05, "epoch": 0.5324607873688584, "percentage": 53.25, "elapsed_time": "1 day, 14:47:48", "remaining_time": "1 day, 10:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5127, "total_steps": 9627, "loss": 1.5337, "learning_rate": 4.489367314634225e-05, "epoch": 0.5325646618884388, "percentage": 53.26, "elapsed_time": "1 day, 14:48:15", "remaining_time": "1 day, 10:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5128, "total_steps": 9627, "loss": 1.7209, "learning_rate": 4.487744215970318e-05, "epoch": 0.5326685364080191, "percentage": 53.27, "elapsed_time": "1 day, 14:48:46", "remaining_time": "1 day, 10:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5129, "total_steps": 9627, "loss": 1.7835, "learning_rate": 4.486121171857659e-05, "epoch": 0.5327724109275994, "percentage": 53.28, "elapsed_time": "1 day, 14:49:13", "remaining_time": "1 day, 10:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5130, "total_steps": 9627, "loss": 1.7334, "learning_rate": 4.4844981824690844e-05, "epoch": 0.5328762854471798, "percentage": 53.29, "elapsed_time": "1 day, 14:49:42", "remaining_time": "1 day, 10:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5131, "total_steps": 9627, "loss": 1.5904, "learning_rate": 4.4828752479774324e-05, "epoch": 0.5329801599667602, "percentage": 53.3, "elapsed_time": "1 day, 14:50:10", "remaining_time": "1 day, 10:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5132, "total_steps": 9627, "loss": 1.6793, "learning_rate": 4.481252368555535e-05, "epoch": 0.5330840344863405, "percentage": 53.31, "elapsed_time": "1 day, 14:50:40", "remaining_time": "1 day, 10:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5133, "total_steps": 9627, "loss": 1.7484, "learning_rate": 4.4796295443762116e-05, "epoch": 0.5331879090059208, "percentage": 53.32, "elapsed_time": "1 day, 14:51:08", "remaining_time": "1 day, 10:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5134, "total_steps": 9627, "loss": 1.6216, "learning_rate": 4.478006775612284e-05, "epoch": 0.5332917835255012, "percentage": 53.33, "elapsed_time": "1 day, 14:51:36", "remaining_time": "1 day, 10:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5135, "total_steps": 9627, "loss": 1.8178, "learning_rate": 4.476384062436563e-05, "epoch": 0.5333956580450815, "percentage": 53.34, "elapsed_time": "1 day, 14:52:05", "remaining_time": "1 day, 10:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5136, "total_steps": 9627, "loss": 1.8414, "learning_rate": 4.474761405021855e-05, "epoch": 0.5334995325646619, "percentage": 53.35, "elapsed_time": "1 day, 14:52:33", "remaining_time": "1 day, 9:59:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5137, "total_steps": 9627, "loss": 1.7848, "learning_rate": 4.4731388035409586e-05, "epoch": 0.5336034070842423, "percentage": 53.36, "elapsed_time": "1 day, 14:53:02", "remaining_time": "1 day, 9:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5138, "total_steps": 9627, "loss": 1.8443, "learning_rate": 4.471516258166671e-05, "epoch": 0.5337072816038226, "percentage": 53.37, "elapsed_time": "1 day, 14:53:31", "remaining_time": "1 day, 9:58:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5139, "total_steps": 9627, "loss": 1.6394, "learning_rate": 4.4698937690717816e-05, "epoch": 0.5338111561234029, "percentage": 53.38, "elapsed_time": "1 day, 14:53:59", "remaining_time": "1 day, 9:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5140, "total_steps": 9627, "loss": 1.5261, "learning_rate": 4.468271336429068e-05, "epoch": 0.5339150306429833, "percentage": 53.39, "elapsed_time": "1 day, 14:54:28", "remaining_time": "1 day, 9:57:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5141, "total_steps": 9627, "loss": 1.512, "learning_rate": 4.466648960411311e-05, "epoch": 0.5340189051625637, "percentage": 53.4, "elapsed_time": "1 day, 14:54:57", "remaining_time": "1 day, 9:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5142, "total_steps": 9627, "loss": 1.8027, "learning_rate": 4.46502664119128e-05, "epoch": 0.5341227796821439, "percentage": 53.41, "elapsed_time": "1 day, 14:55:25", "remaining_time": "1 day, 9:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5143, "total_steps": 9627, "loss": 1.8224, "learning_rate": 4.463404378941737e-05, "epoch": 0.5342266542017243, "percentage": 53.42, "elapsed_time": "1 day, 14:55:54", "remaining_time": "1 day, 9:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5144, "total_steps": 9627, "loss": 1.6209, "learning_rate": 4.461782173835442e-05, "epoch": 0.5343305287213047, "percentage": 53.43, "elapsed_time": "1 day, 14:56:21", "remaining_time": "1 day, 9:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5145, "total_steps": 9627, "loss": 1.8086, "learning_rate": 4.4601600260451494e-05, "epoch": 0.534434403240885, "percentage": 53.44, "elapsed_time": "1 day, 14:56:51", "remaining_time": "1 day, 9:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5146, "total_steps": 9627, "loss": 1.7298, "learning_rate": 4.458537935743601e-05, "epoch": 0.5345382777604654, "percentage": 53.45, "elapsed_time": "1 day, 14:57:19", "remaining_time": "1 day, 9:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5147, "total_steps": 9627, "loss": 1.6128, "learning_rate": 4.45691590310354e-05, "epoch": 0.5346421522800457, "percentage": 53.46, "elapsed_time": "1 day, 14:57:48", "remaining_time": "1 day, 9:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5148, "total_steps": 9627, "loss": 1.8353, "learning_rate": 4.455293928297698e-05, "epoch": 0.534746026799626, "percentage": 53.47, "elapsed_time": "1 day, 14:58:16", "remaining_time": "1 day, 9:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5149, "total_steps": 9627, "loss": 1.5159, "learning_rate": 4.453672011498805e-05, "epoch": 0.5348499013192064, "percentage": 53.48, "elapsed_time": "1 day, 14:58:45", "remaining_time": "1 day, 9:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5150, "total_steps": 9627, "loss": 1.7056, "learning_rate": 4.45205015287958e-05, "epoch": 0.5349537758387868, "percentage": 53.5, "elapsed_time": "1 day, 14:59:14", "remaining_time": "1 day, 9:53:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5151, "total_steps": 9627, "loss": 1.5728, "learning_rate": 4.450428352612742e-05, "epoch": 0.535057650358367, "percentage": 53.51, "elapsed_time": "1 day, 14:59:43", "remaining_time": "1 day, 9:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5152, "total_steps": 9627, "loss": 1.8235, "learning_rate": 4.448806610870995e-05, "epoch": 0.5351615248779474, "percentage": 53.52, "elapsed_time": "1 day, 15:00:11", "remaining_time": "1 day, 9:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5153, "total_steps": 9627, "loss": 1.6757, "learning_rate": 4.4471849278270446e-05, "epoch": 0.5352653993975278, "percentage": 53.53, "elapsed_time": "1 day, 15:00:40", "remaining_time": "1 day, 9:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5154, "total_steps": 9627, "loss": 1.7759, "learning_rate": 4.445563303653589e-05, "epoch": 0.5353692739171081, "percentage": 53.54, "elapsed_time": "1 day, 15:01:09", "remaining_time": "1 day, 9:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5155, "total_steps": 9627, "loss": 1.6766, "learning_rate": 4.443941738523316e-05, "epoch": 0.5354731484366885, "percentage": 53.55, "elapsed_time": "1 day, 15:01:38", "remaining_time": "1 day, 9:51:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5156, "total_steps": 9627, "loss": 1.5477, "learning_rate": 4.4423202326089095e-05, "epoch": 0.5355770229562689, "percentage": 53.56, "elapsed_time": "1 day, 15:02:07", "remaining_time": "1 day, 9:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5157, "total_steps": 9627, "loss": 1.6997, "learning_rate": 4.4406987860830505e-05, "epoch": 0.5356808974758491, "percentage": 53.57, "elapsed_time": "1 day, 15:02:34", "remaining_time": "1 day, 9:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5158, "total_steps": 9627, "loss": 1.7147, "learning_rate": 4.439077399118405e-05, "epoch": 0.5357847719954295, "percentage": 53.58, "elapsed_time": "1 day, 15:03:03", "remaining_time": "1 day, 9:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5159, "total_steps": 9627, "loss": 1.6825, "learning_rate": 4.4374560718876426e-05, "epoch": 0.5358886465150099, "percentage": 53.59, "elapsed_time": "1 day, 15:03:32", "remaining_time": "1 day, 9:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5160, "total_steps": 9627, "loss": 1.6888, "learning_rate": 4.4358348045634215e-05, "epoch": 0.5359925210345902, "percentage": 53.6, "elapsed_time": "1 day, 15:04:01", "remaining_time": "1 day, 9:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5161, "total_steps": 9627, "loss": 1.7675, "learning_rate": 4.4342135973183915e-05, "epoch": 0.5360963955541705, "percentage": 53.61, "elapsed_time": "1 day, 15:04:29", "remaining_time": "1 day, 9:48:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5162, "total_steps": 9627, "loss": 1.7902, "learning_rate": 4.432592450325201e-05, "epoch": 0.5362002700737509, "percentage": 53.62, "elapsed_time": "1 day, 15:04:57", "remaining_time": "1 day, 9:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5163, "total_steps": 9627, "loss": 1.8162, "learning_rate": 4.430971363756487e-05, "epoch": 0.5363041445933313, "percentage": 53.63, "elapsed_time": "1 day, 15:05:27", "remaining_time": "1 day, 9:47:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5164, "total_steps": 9627, "loss": 1.7314, "learning_rate": 4.429350337784887e-05, "epoch": 0.5364080191129116, "percentage": 53.64, "elapsed_time": "1 day, 15:05:54", "remaining_time": "1 day, 9:47:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5165, "total_steps": 9627, "loss": 1.7803, "learning_rate": 4.427729372583023e-05, "epoch": 0.536511893632492, "percentage": 53.65, "elapsed_time": "1 day, 15:06:24", "remaining_time": "1 day, 9:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5166, "total_steps": 9627, "loss": 1.6121, "learning_rate": 4.426108468323516e-05, "epoch": 0.5366157681520723, "percentage": 53.66, "elapsed_time": "1 day, 15:06:52", "remaining_time": "1 day, 9:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5167, "total_steps": 9627, "loss": 1.6125, "learning_rate": 4.424487625178983e-05, "epoch": 0.5367196426716526, "percentage": 53.67, "elapsed_time": "1 day, 15:07:22", "remaining_time": "1 day, 9:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5168, "total_steps": 9627, "loss": 1.806, "learning_rate": 4.4228668433220264e-05, "epoch": 0.536823517191233, "percentage": 53.68, "elapsed_time": "1 day, 15:07:49", "remaining_time": "1 day, 9:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5169, "total_steps": 9627, "loss": 1.4683, "learning_rate": 4.421246122925251e-05, "epoch": 0.5369273917108134, "percentage": 53.69, "elapsed_time": "1 day, 15:08:19", "remaining_time": "1 day, 9:45:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5170, "total_steps": 9627, "loss": 1.7148, "learning_rate": 4.419625464161249e-05, "epoch": 0.5370312662303937, "percentage": 53.7, "elapsed_time": "1 day, 15:08:46", "remaining_time": "1 day, 9:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5171, "total_steps": 9627, "loss": 1.5598, "learning_rate": 4.4180048672026066e-05, "epoch": 0.537135140749974, "percentage": 53.71, "elapsed_time": "1 day, 15:09:16", "remaining_time": "1 day, 9:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5172, "total_steps": 9627, "loss": 1.6101, "learning_rate": 4.416384332221906e-05, "epoch": 0.5372390152695544, "percentage": 53.72, "elapsed_time": "1 day, 15:09:44", "remaining_time": "1 day, 9:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5173, "total_steps": 9627, "loss": 1.7957, "learning_rate": 4.414763859391724e-05, "epoch": 0.5373428897891347, "percentage": 53.73, "elapsed_time": "1 day, 15:10:13", "remaining_time": "1 day, 9:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5174, "total_steps": 9627, "loss": 1.5504, "learning_rate": 4.4131434488846236e-05, "epoch": 0.5374467643087151, "percentage": 53.74, "elapsed_time": "1 day, 15:10:42", "remaining_time": "1 day, 9:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5175, "total_steps": 9627, "loss": 1.7433, "learning_rate": 4.4115231008731696e-05, "epoch": 0.5375506388282955, "percentage": 53.76, "elapsed_time": "1 day, 15:11:10", "remaining_time": "1 day, 9:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5176, "total_steps": 9627, "loss": 1.7387, "learning_rate": 4.409902815529914e-05, "epoch": 0.5376545133478757, "percentage": 53.77, "elapsed_time": "1 day, 15:11:38", "remaining_time": "1 day, 9:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5177, "total_steps": 9627, "loss": 1.8365, "learning_rate": 4.4082825930274066e-05, "epoch": 0.5377583878674561, "percentage": 53.78, "elapsed_time": "1 day, 15:12:07", "remaining_time": "1 day, 9:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5178, "total_steps": 9627, "loss": 1.6611, "learning_rate": 4.4066624335381864e-05, "epoch": 0.5378622623870365, "percentage": 53.79, "elapsed_time": "1 day, 15:12:35", "remaining_time": "1 day, 9:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5179, "total_steps": 9627, "loss": 1.7386, "learning_rate": 4.40504233723479e-05, "epoch": 0.5379661369066168, "percentage": 53.8, "elapsed_time": "1 day, 15:13:03", "remaining_time": "1 day, 9:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5180, "total_steps": 9627, "loss": 1.7121, "learning_rate": 4.4034223042897423e-05, "epoch": 0.5380700114261971, "percentage": 53.81, "elapsed_time": "1 day, 15:13:33", "remaining_time": "1 day, 9:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5181, "total_steps": 9627, "loss": 1.746, "learning_rate": 4.4018023348755666e-05, "epoch": 0.5381738859457775, "percentage": 53.82, "elapsed_time": "1 day, 15:14:01", "remaining_time": "1 day, 9:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5182, "total_steps": 9627, "loss": 1.5526, "learning_rate": 4.400182429164778e-05, "epoch": 0.5382777604653578, "percentage": 53.83, "elapsed_time": "1 day, 15:14:30", "remaining_time": "1 day, 9:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5183, "total_steps": 9627, "loss": 1.7516, "learning_rate": 4.39856258732988e-05, "epoch": 0.5383816349849382, "percentage": 53.84, "elapsed_time": "1 day, 15:14:57", "remaining_time": "1 day, 9:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5184, "total_steps": 9627, "loss": 1.7992, "learning_rate": 4.396942809543374e-05, "epoch": 0.5384855095045186, "percentage": 53.85, "elapsed_time": "1 day, 15:15:27", "remaining_time": "1 day, 9:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5185, "total_steps": 9627, "loss": 1.6651, "learning_rate": 4.395323095977757e-05, "epoch": 0.5385893840240988, "percentage": 53.86, "elapsed_time": "1 day, 15:15:55", "remaining_time": "1 day, 9:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5186, "total_steps": 9627, "loss": 1.7299, "learning_rate": 4.393703446805512e-05, "epoch": 0.5386932585436792, "percentage": 53.87, "elapsed_time": "1 day, 15:16:24", "remaining_time": "1 day, 9:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5187, "total_steps": 9627, "loss": 1.8707, "learning_rate": 4.39208386219912e-05, "epoch": 0.5387971330632596, "percentage": 53.88, "elapsed_time": "1 day, 15:16:52", "remaining_time": "1 day, 9:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5188, "total_steps": 9627, "loss": 1.6647, "learning_rate": 4.3904643423310574e-05, "epoch": 0.5389010075828399, "percentage": 53.89, "elapsed_time": "1 day, 15:17:21", "remaining_time": "1 day, 9:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5189, "total_steps": 9627, "loss": 1.7202, "learning_rate": 4.388844887373785e-05, "epoch": 0.5390048821024203, "percentage": 53.9, "elapsed_time": "1 day, 15:17:50", "remaining_time": "1 day, 9:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5190, "total_steps": 9627, "loss": 1.7193, "learning_rate": 4.387225497499767e-05, "epoch": 0.5391087566220006, "percentage": 53.91, "elapsed_time": "1 day, 15:18:18", "remaining_time": "1 day, 9:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5191, "total_steps": 9627, "loss": 1.6711, "learning_rate": 4.385606172881452e-05, "epoch": 0.539212631141581, "percentage": 53.92, "elapsed_time": "1 day, 15:18:46", "remaining_time": "1 day, 9:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5192, "total_steps": 9627, "loss": 1.7142, "learning_rate": 4.383986913691289e-05, "epoch": 0.5393165056611613, "percentage": 53.93, "elapsed_time": "1 day, 15:19:16", "remaining_time": "1 day, 9:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5193, "total_steps": 9627, "loss": 1.7295, "learning_rate": 4.382367720101713e-05, "epoch": 0.5394203801807417, "percentage": 53.94, "elapsed_time": "1 day, 15:19:43", "remaining_time": "1 day, 9:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5194, "total_steps": 9627, "loss": 1.574, "learning_rate": 4.3807485922851574e-05, "epoch": 0.5395242547003221, "percentage": 53.95, "elapsed_time": "1 day, 15:20:13", "remaining_time": "1 day, 9:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5195, "total_steps": 9627, "loss": 1.6128, "learning_rate": 4.3791295304140476e-05, "epoch": 0.5396281292199023, "percentage": 53.96, "elapsed_time": "1 day, 15:20:40", "remaining_time": "1 day, 9:33:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5196, "total_steps": 9627, "loss": 1.8546, "learning_rate": 4.3775105346607983e-05, "epoch": 0.5397320037394827, "percentage": 53.97, "elapsed_time": "1 day, 15:21:10", "remaining_time": "1 day, 9:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5197, "total_steps": 9627, "loss": 1.7621, "learning_rate": 4.375891605197822e-05, "epoch": 0.5398358782590631, "percentage": 53.98, "elapsed_time": "1 day, 15:21:38", "remaining_time": "1 day, 9:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5198, "total_steps": 9627, "loss": 1.6286, "learning_rate": 4.3742727421975224e-05, "epoch": 0.5399397527786434, "percentage": 53.99, "elapsed_time": "1 day, 15:22:07", "remaining_time": "1 day, 9:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5199, "total_steps": 9627, "loss": 1.8302, "learning_rate": 4.3726539458322943e-05, "epoch": 0.5400436272982237, "percentage": 54.0, "elapsed_time": "1 day, 15:22:35", "remaining_time": "1 day, 9:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5200, "total_steps": 9627, "loss": 1.7163, "learning_rate": 4.371035216274526e-05, "epoch": 0.5401475018178041, "percentage": 54.01, "elapsed_time": "1 day, 15:23:03", "remaining_time": "1 day, 9:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5201, "total_steps": 9627, "loss": 1.5436, "learning_rate": 4.369416553696604e-05, "epoch": 0.5402513763373844, "percentage": 54.03, "elapsed_time": "1 day, 15:23:33", "remaining_time": "1 day, 9:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5202, "total_steps": 9627, "loss": 1.6028, "learning_rate": 4.367797958270897e-05, "epoch": 0.5403552508569648, "percentage": 54.04, "elapsed_time": "1 day, 15:24:01", "remaining_time": "1 day, 9:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5203, "total_steps": 9627, "loss": 1.6886, "learning_rate": 4.366179430169779e-05, "epoch": 0.5404591253765452, "percentage": 54.05, "elapsed_time": "1 day, 15:24:29", "remaining_time": "1 day, 9:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5204, "total_steps": 9627, "loss": 1.604, "learning_rate": 4.3645609695656056e-05, "epoch": 0.5405629998961254, "percentage": 54.06, "elapsed_time": "1 day, 15:24:59", "remaining_time": "1 day, 9:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5205, "total_steps": 9627, "loss": 1.6635, "learning_rate": 4.3629425766307334e-05, "epoch": 0.5406668744157058, "percentage": 54.07, "elapsed_time": "1 day, 15:25:27", "remaining_time": "1 day, 9:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5206, "total_steps": 9627, "loss": 1.5922, "learning_rate": 4.361324251537506e-05, "epoch": 0.5407707489352862, "percentage": 54.08, "elapsed_time": "1 day, 15:25:55", "remaining_time": "1 day, 9:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5207, "total_steps": 9627, "loss": 1.7722, "learning_rate": 4.359705994458267e-05, "epoch": 0.5408746234548665, "percentage": 54.09, "elapsed_time": "1 day, 15:26:25", "remaining_time": "1 day, 9:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5208, "total_steps": 9627, "loss": 1.6145, "learning_rate": 4.358087805565343e-05, "epoch": 0.5409784979744469, "percentage": 54.1, "elapsed_time": "1 day, 15:26:53", "remaining_time": "1 day, 9:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5209, "total_steps": 9627, "loss": 1.5844, "learning_rate": 4.35646968503106e-05, "epoch": 0.5410823724940272, "percentage": 54.11, "elapsed_time": "1 day, 15:27:21", "remaining_time": "1 day, 9:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5210, "total_steps": 9627, "loss": 1.7365, "learning_rate": 4.354851633027738e-05, "epoch": 0.5411862470136075, "percentage": 54.12, "elapsed_time": "1 day, 15:27:50", "remaining_time": "1 day, 9:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5211, "total_steps": 9627, "loss": 1.7656, "learning_rate": 4.3532336497276836e-05, "epoch": 0.5412901215331879, "percentage": 54.13, "elapsed_time": "1 day, 15:28:18", "remaining_time": "1 day, 9:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5212, "total_steps": 9627, "loss": 1.7024, "learning_rate": 4.351615735303199e-05, "epoch": 0.5413939960527683, "percentage": 54.14, "elapsed_time": "1 day, 15:28:47", "remaining_time": "1 day, 9:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5213, "total_steps": 9627, "loss": 1.9407, "learning_rate": 4.3499978899265844e-05, "epoch": 0.5414978705723485, "percentage": 54.15, "elapsed_time": "1 day, 15:29:15", "remaining_time": "1 day, 9:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5214, "total_steps": 9627, "loss": 1.7781, "learning_rate": 4.348380113770121e-05, "epoch": 0.5416017450919289, "percentage": 54.16, "elapsed_time": "1 day, 15:29:44", "remaining_time": "1 day, 9:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5215, "total_steps": 9627, "loss": 1.6077, "learning_rate": 4.346762407006093e-05, "epoch": 0.5417056196115093, "percentage": 54.17, "elapsed_time": "1 day, 15:30:12", "remaining_time": "1 day, 9:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5216, "total_steps": 9627, "loss": 1.5677, "learning_rate": 4.345144769806775e-05, "epoch": 0.5418094941310897, "percentage": 54.18, "elapsed_time": "1 day, 15:30:42", "remaining_time": "1 day, 9:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5217, "total_steps": 9627, "loss": 1.5191, "learning_rate": 4.3435272023444304e-05, "epoch": 0.54191336865067, "percentage": 54.19, "elapsed_time": "1 day, 15:31:09", "remaining_time": "1 day, 9:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5218, "total_steps": 9627, "loss": 1.5929, "learning_rate": 4.3419097047913175e-05, "epoch": 0.5420172431702504, "percentage": 54.2, "elapsed_time": "1 day, 15:31:39", "remaining_time": "1 day, 9:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5219, "total_steps": 9627, "loss": 1.612, "learning_rate": 4.340292277319687e-05, "epoch": 0.5421211176898307, "percentage": 54.21, "elapsed_time": "1 day, 15:32:07", "remaining_time": "1 day, 9:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5220, "total_steps": 9627, "loss": 1.6542, "learning_rate": 4.3386749201017856e-05, "epoch": 0.542224992209411, "percentage": 54.22, "elapsed_time": "1 day, 15:32:37", "remaining_time": "1 day, 9:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5221, "total_steps": 9627, "loss": 1.6344, "learning_rate": 4.3370576333098446e-05, "epoch": 0.5423288667289914, "percentage": 54.23, "elapsed_time": "1 day, 15:33:04", "remaining_time": "1 day, 9:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5222, "total_steps": 9627, "loss": 1.6036, "learning_rate": 4.335440417116094e-05, "epoch": 0.5424327412485718, "percentage": 54.24, "elapsed_time": "1 day, 15:33:34", "remaining_time": "1 day, 9:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5223, "total_steps": 9627, "loss": 1.6746, "learning_rate": 4.3338232716927574e-05, "epoch": 0.542536615768152, "percentage": 54.25, "elapsed_time": "1 day, 15:34:02", "remaining_time": "1 day, 9:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5224, "total_steps": 9627, "loss": 1.6285, "learning_rate": 4.3322061972120445e-05, "epoch": 0.5426404902877324, "percentage": 54.26, "elapsed_time": "1 day, 15:34:30", "remaining_time": "1 day, 9:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5225, "total_steps": 9627, "loss": 1.5169, "learning_rate": 4.3305891938461626e-05, "epoch": 0.5427443648073128, "percentage": 54.27, "elapsed_time": "1 day, 15:34:59", "remaining_time": "1 day, 9:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5226, "total_steps": 9627, "loss": 1.6436, "learning_rate": 4.3289722617673115e-05, "epoch": 0.5428482393268931, "percentage": 54.28, "elapsed_time": "1 day, 15:35:27", "remaining_time": "1 day, 9:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5227, "total_steps": 9627, "loss": 1.7777, "learning_rate": 4.327355401147679e-05, "epoch": 0.5429521138464735, "percentage": 54.3, "elapsed_time": "1 day, 15:35:57", "remaining_time": "1 day, 9:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5228, "total_steps": 9627, "loss": 1.5837, "learning_rate": 4.3257386121594485e-05, "epoch": 0.5430559883660538, "percentage": 54.31, "elapsed_time": "1 day, 15:36:24", "remaining_time": "1 day, 9:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5229, "total_steps": 9627, "loss": 1.8451, "learning_rate": 4.324121894974799e-05, "epoch": 0.5431598628856341, "percentage": 54.32, "elapsed_time": "1 day, 15:36:54", "remaining_time": "1 day, 9:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5230, "total_steps": 9627, "loss": 1.7015, "learning_rate": 4.322505249765893e-05, "epoch": 0.5432637374052145, "percentage": 54.33, "elapsed_time": "1 day, 15:37:23", "remaining_time": "1 day, 9:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5231, "total_steps": 9627, "loss": 1.7247, "learning_rate": 4.320888676704895e-05, "epoch": 0.5433676119247949, "percentage": 54.34, "elapsed_time": "1 day, 15:37:51", "remaining_time": "1 day, 9:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5232, "total_steps": 9627, "loss": 1.6449, "learning_rate": 4.3192721759639545e-05, "epoch": 0.5434714864443752, "percentage": 54.35, "elapsed_time": "1 day, 15:38:21", "remaining_time": "1 day, 9:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5233, "total_steps": 9627, "loss": 1.5498, "learning_rate": 4.317655747715218e-05, "epoch": 0.5435753609639555, "percentage": 54.36, "elapsed_time": "1 day, 15:38:48", "remaining_time": "1 day, 9:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5234, "total_steps": 9627, "loss": 1.7594, "learning_rate": 4.3160393921308204e-05, "epoch": 0.5436792354835359, "percentage": 54.37, "elapsed_time": "1 day, 15:39:17", "remaining_time": "1 day, 9:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5235, "total_steps": 9627, "loss": 1.8968, "learning_rate": 4.3144231093828954e-05, "epoch": 0.5437831100031162, "percentage": 54.38, "elapsed_time": "1 day, 15:39:46", "remaining_time": "1 day, 9:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5236, "total_steps": 9627, "loss": 1.5737, "learning_rate": 4.312806899643559e-05, "epoch": 0.5438869845226966, "percentage": 54.39, "elapsed_time": "1 day, 15:40:14", "remaining_time": "1 day, 9:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5237, "total_steps": 9627, "loss": 1.6493, "learning_rate": 4.311190763084928e-05, "epoch": 0.543990859042277, "percentage": 54.4, "elapsed_time": "1 day, 15:40:42", "remaining_time": "1 day, 9:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5238, "total_steps": 9627, "loss": 1.7359, "learning_rate": 4.309574699879109e-05, "epoch": 0.5440947335618572, "percentage": 54.41, "elapsed_time": "1 day, 15:41:12", "remaining_time": "1 day, 9:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5239, "total_steps": 9627, "loss": 1.8211, "learning_rate": 4.3079587101981985e-05, "epoch": 0.5441986080814376, "percentage": 54.42, "elapsed_time": "1 day, 15:41:40", "remaining_time": "1 day, 9:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5240, "total_steps": 9627, "loss": 1.4555, "learning_rate": 4.306342794214286e-05, "epoch": 0.544302482601018, "percentage": 54.43, "elapsed_time": "1 day, 15:42:09", "remaining_time": "1 day, 9:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5241, "total_steps": 9627, "loss": 1.6498, "learning_rate": 4.3047269520994555e-05, "epoch": 0.5444063571205984, "percentage": 54.44, "elapsed_time": "1 day, 15:42:38", "remaining_time": "1 day, 9:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5242, "total_steps": 9627, "loss": 1.7542, "learning_rate": 4.3031111840257834e-05, "epoch": 0.5445102316401786, "percentage": 54.45, "elapsed_time": "1 day, 15:43:06", "remaining_time": "1 day, 9:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5243, "total_steps": 9627, "loss": 1.6508, "learning_rate": 4.301495490165331e-05, "epoch": 0.544614106159759, "percentage": 54.46, "elapsed_time": "1 day, 15:43:34", "remaining_time": "1 day, 9:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5244, "total_steps": 9627, "loss": 1.8128, "learning_rate": 4.299879870690162e-05, "epoch": 0.5447179806793394, "percentage": 54.47, "elapsed_time": "1 day, 15:44:03", "remaining_time": "1 day, 9:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5245, "total_steps": 9627, "loss": 1.6395, "learning_rate": 4.298264325772327e-05, "epoch": 0.5448218551989197, "percentage": 54.48, "elapsed_time": "1 day, 15:44:31", "remaining_time": "1 day, 9:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5246, "total_steps": 9627, "loss": 1.6735, "learning_rate": 4.2966488555838656e-05, "epoch": 0.5449257297185001, "percentage": 54.49, "elapsed_time": "1 day, 15:45:00", "remaining_time": "1 day, 9:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5247, "total_steps": 9627, "loss": 1.7222, "learning_rate": 4.295033460296814e-05, "epoch": 0.5450296042380804, "percentage": 54.5, "elapsed_time": "1 day, 15:45:28", "remaining_time": "1 day, 9:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5248, "total_steps": 9627, "loss": 1.6682, "learning_rate": 4.293418140083203e-05, "epoch": 0.5451334787576607, "percentage": 54.51, "elapsed_time": "1 day, 15:45:58", "remaining_time": "1 day, 9:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5249, "total_steps": 9627, "loss": 1.746, "learning_rate": 4.291802895115046e-05, "epoch": 0.5452373532772411, "percentage": 54.52, "elapsed_time": "1 day, 15:46:26", "remaining_time": "1 day, 9:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5250, "total_steps": 9627, "loss": 1.5329, "learning_rate": 4.290187725564356e-05, "epoch": 0.5453412277968215, "percentage": 54.53, "elapsed_time": "1 day, 15:46:55", "remaining_time": "1 day, 9:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5251, "total_steps": 9627, "loss": 1.7031, "learning_rate": 4.28857263160314e-05, "epoch": 0.5454451023164018, "percentage": 54.54, "elapsed_time": "1 day, 15:47:23", "remaining_time": "1 day, 9:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5252, "total_steps": 9627, "loss": 1.5662, "learning_rate": 4.286957613403387e-05, "epoch": 0.5455489768359821, "percentage": 54.55, "elapsed_time": "1 day, 15:47:53", "remaining_time": "1 day, 9:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5253, "total_steps": 9627, "loss": 1.5221, "learning_rate": 4.285342671137086e-05, "epoch": 0.5456528513555625, "percentage": 54.57, "elapsed_time": "1 day, 15:48:21", "remaining_time": "1 day, 9:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5254, "total_steps": 9627, "loss": 1.5841, "learning_rate": 4.283727804976217e-05, "epoch": 0.5457567258751428, "percentage": 54.58, "elapsed_time": "1 day, 15:48:49", "remaining_time": "1 day, 9:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5255, "total_steps": 9627, "loss": 1.6659, "learning_rate": 4.2821130150927486e-05, "epoch": 0.5458606003947232, "percentage": 54.59, "elapsed_time": "1 day, 15:49:18", "remaining_time": "1 day, 9:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5256, "total_steps": 9627, "loss": 1.463, "learning_rate": 4.280498301658644e-05, "epoch": 0.5459644749143036, "percentage": 54.6, "elapsed_time": "1 day, 15:49:46", "remaining_time": "1 day, 9:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5257, "total_steps": 9627, "loss": 1.941, "learning_rate": 4.27888366484586e-05, "epoch": 0.5460683494338838, "percentage": 54.61, "elapsed_time": "1 day, 15:50:15", "remaining_time": "1 day, 9:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5258, "total_steps": 9627, "loss": 1.7727, "learning_rate": 4.277269104826339e-05, "epoch": 0.5461722239534642, "percentage": 54.62, "elapsed_time": "1 day, 15:50:43", "remaining_time": "1 day, 9:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5259, "total_steps": 9627, "loss": 1.6807, "learning_rate": 4.275654621772021e-05, "epoch": 0.5462760984730446, "percentage": 54.63, "elapsed_time": "1 day, 15:51:13", "remaining_time": "1 day, 9:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5260, "total_steps": 9627, "loss": 1.6696, "learning_rate": 4.2740402158548366e-05, "epoch": 0.5463799729926249, "percentage": 54.64, "elapsed_time": "1 day, 15:51:41", "remaining_time": "1 day, 9:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5261, "total_steps": 9627, "loss": 1.7343, "learning_rate": 4.272425887246706e-05, "epoch": 0.5464838475122052, "percentage": 54.65, "elapsed_time": "1 day, 15:52:09", "remaining_time": "1 day, 9:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5262, "total_steps": 9627, "loss": 1.6486, "learning_rate": 4.270811636119542e-05, "epoch": 0.5465877220317856, "percentage": 54.66, "elapsed_time": "1 day, 15:52:39", "remaining_time": "1 day, 9:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5263, "total_steps": 9627, "loss": 1.691, "learning_rate": 4.269197462645253e-05, "epoch": 0.5466915965513659, "percentage": 54.67, "elapsed_time": "1 day, 15:53:06", "remaining_time": "1 day, 9:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5264, "total_steps": 9627, "loss": 1.6651, "learning_rate": 4.267583366995732e-05, "epoch": 0.5467954710709463, "percentage": 54.68, "elapsed_time": "1 day, 15:53:35", "remaining_time": "1 day, 9:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5265, "total_steps": 9627, "loss": 1.8253, "learning_rate": 4.2659693493428684e-05, "epoch": 0.5468993455905267, "percentage": 54.69, "elapsed_time": "1 day, 15:54:05", "remaining_time": "1 day, 9:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5266, "total_steps": 9627, "loss": 1.6397, "learning_rate": 4.264355409858547e-05, "epoch": 0.5470032201101069, "percentage": 54.7, "elapsed_time": "1 day, 15:54:33", "remaining_time": "1 day, 9:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5267, "total_steps": 9627, "loss": 1.5403, "learning_rate": 4.2627415487146346e-05, "epoch": 0.5471070946296873, "percentage": 54.71, "elapsed_time": "1 day, 15:55:01", "remaining_time": "1 day, 9:02:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5268, "total_steps": 9627, "loss": 1.8323, "learning_rate": 4.261127766082995e-05, "epoch": 0.5472109691492677, "percentage": 54.72, "elapsed_time": "1 day, 15:55:30", "remaining_time": "1 day, 9:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5269, "total_steps": 9627, "loss": 1.7435, "learning_rate": 4.2595140621354846e-05, "epoch": 0.5473148436688481, "percentage": 54.73, "elapsed_time": "1 day, 15:55:59", "remaining_time": "1 day, 9:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5270, "total_steps": 9627, "loss": 1.5484, "learning_rate": 4.257900437043954e-05, "epoch": 0.5474187181884284, "percentage": 54.74, "elapsed_time": "1 day, 15:56:28", "remaining_time": "1 day, 9:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5271, "total_steps": 9627, "loss": 1.6659, "learning_rate": 4.256286890980234e-05, "epoch": 0.5475225927080087, "percentage": 54.75, "elapsed_time": "1 day, 15:56:56", "remaining_time": "1 day, 9:00:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5272, "total_steps": 9627, "loss": 1.6907, "learning_rate": 4.254673424116162e-05, "epoch": 0.5476264672275891, "percentage": 54.76, "elapsed_time": "1 day, 15:57:24", "remaining_time": "1 day, 9:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5273, "total_steps": 9627, "loss": 1.7444, "learning_rate": 4.2530600366235554e-05, "epoch": 0.5477303417471694, "percentage": 54.77, "elapsed_time": "1 day, 15:57:54", "remaining_time": "1 day, 8:59:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5274, "total_steps": 9627, "loss": 1.6692, "learning_rate": 4.251446728674229e-05, "epoch": 0.5478342162667498, "percentage": 54.78, "elapsed_time": "1 day, 15:58:22", "remaining_time": "1 day, 8:59:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5275, "total_steps": 9627, "loss": 1.7245, "learning_rate": 4.2498335004399864e-05, "epoch": 0.5479380907863302, "percentage": 54.79, "elapsed_time": "1 day, 15:58:50", "remaining_time": "1 day, 8:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5276, "total_steps": 9627, "loss": 1.6344, "learning_rate": 4.248220352092626e-05, "epoch": 0.5480419653059104, "percentage": 54.8, "elapsed_time": "1 day, 15:59:20", "remaining_time": "1 day, 8:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5277, "total_steps": 9627, "loss": 1.7355, "learning_rate": 4.246607283803932e-05, "epoch": 0.5481458398254908, "percentage": 54.81, "elapsed_time": "1 day, 15:59:48", "remaining_time": "1 day, 8:58:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5278, "total_steps": 9627, "loss": 1.7528, "learning_rate": 4.2449942957456855e-05, "epoch": 0.5482497143450712, "percentage": 54.82, "elapsed_time": "1 day, 16:00:15", "remaining_time": "1 day, 8:57:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5279, "total_steps": 9627, "loss": 1.7903, "learning_rate": 4.24338138808966e-05, "epoch": 0.5483535888646515, "percentage": 54.84, "elapsed_time": "1 day, 16:00:45", "remaining_time": "1 day, 8:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5280, "total_steps": 9627, "loss": 1.6569, "learning_rate": 4.241768561007613e-05, "epoch": 0.5484574633842318, "percentage": 54.85, "elapsed_time": "1 day, 16:01:13", "remaining_time": "1 day, 8:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5281, "total_steps": 9627, "loss": 1.6377, "learning_rate": 4.2401558146712994e-05, "epoch": 0.5485613379038122, "percentage": 54.86, "elapsed_time": "1 day, 16:01:42", "remaining_time": "1 day, 8:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5282, "total_steps": 9627, "loss": 1.5852, "learning_rate": 4.238543149252466e-05, "epoch": 0.5486652124233925, "percentage": 54.87, "elapsed_time": "1 day, 16:02:10", "remaining_time": "1 day, 8:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5283, "total_steps": 9627, "loss": 1.7107, "learning_rate": 4.2369305649228455e-05, "epoch": 0.5487690869429729, "percentage": 54.88, "elapsed_time": "1 day, 16:02:39", "remaining_time": "1 day, 8:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5284, "total_steps": 9627, "loss": 1.7281, "learning_rate": 4.235318061854168e-05, "epoch": 0.5488729614625533, "percentage": 54.89, "elapsed_time": "1 day, 16:03:07", "remaining_time": "1 day, 8:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5285, "total_steps": 9627, "loss": 1.7443, "learning_rate": 4.233705640218154e-05, "epoch": 0.5489768359821335, "percentage": 54.9, "elapsed_time": "1 day, 16:03:37", "remaining_time": "1 day, 8:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5286, "total_steps": 9627, "loss": 1.5151, "learning_rate": 4.2320933001865106e-05, "epoch": 0.5490807105017139, "percentage": 54.91, "elapsed_time": "1 day, 16:04:05", "remaining_time": "1 day, 8:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5287, "total_steps": 9627, "loss": 2.0025, "learning_rate": 4.230481041930941e-05, "epoch": 0.5491845850212943, "percentage": 54.92, "elapsed_time": "1 day, 16:04:34", "remaining_time": "1 day, 8:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5288, "total_steps": 9627, "loss": 1.6324, "learning_rate": 4.2288688656231384e-05, "epoch": 0.5492884595408746, "percentage": 54.93, "elapsed_time": "1 day, 16:05:02", "remaining_time": "1 day, 8:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5289, "total_steps": 9627, "loss": 1.7869, "learning_rate": 4.227256771434787e-05, "epoch": 0.549392334060455, "percentage": 54.94, "elapsed_time": "1 day, 16:05:30", "remaining_time": "1 day, 8:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5290, "total_steps": 9627, "loss": 1.6478, "learning_rate": 4.2256447595375596e-05, "epoch": 0.5494962085800353, "percentage": 54.95, "elapsed_time": "1 day, 16:06:00", "remaining_time": "1 day, 8:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5291, "total_steps": 9627, "loss": 1.7415, "learning_rate": 4.224032830103128e-05, "epoch": 0.5496000830996156, "percentage": 54.96, "elapsed_time": "1 day, 16:06:27", "remaining_time": "1 day, 8:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5292, "total_steps": 9627, "loss": 1.6643, "learning_rate": 4.2224209833031445e-05, "epoch": 0.549703957619196, "percentage": 54.97, "elapsed_time": "1 day, 16:06:57", "remaining_time": "1 day, 8:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5293, "total_steps": 9627, "loss": 1.76, "learning_rate": 4.220809219309262e-05, "epoch": 0.5498078321387764, "percentage": 54.98, "elapsed_time": "1 day, 16:07:25", "remaining_time": "1 day, 8:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5294, "total_steps": 9627, "loss": 1.6642, "learning_rate": 4.21919753829312e-05, "epoch": 0.5499117066583568, "percentage": 54.99, "elapsed_time": "1 day, 16:07:54", "remaining_time": "1 day, 8:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5295, "total_steps": 9627, "loss": 1.7614, "learning_rate": 4.217585940426351e-05, "epoch": 0.550015581177937, "percentage": 55.0, "elapsed_time": "1 day, 16:08:21", "remaining_time": "1 day, 8:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5296, "total_steps": 9627, "loss": 1.8191, "learning_rate": 4.2159744258805736e-05, "epoch": 0.5501194556975174, "percentage": 55.01, "elapsed_time": "1 day, 16:08:51", "remaining_time": "1 day, 8:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5297, "total_steps": 9627, "loss": 1.4622, "learning_rate": 4.214362994827405e-05, "epoch": 0.5502233302170978, "percentage": 55.02, "elapsed_time": "1 day, 16:09:20", "remaining_time": "1 day, 8:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5298, "total_steps": 9627, "loss": 1.9298, "learning_rate": 4.212751647438451e-05, "epoch": 0.5503272047366781, "percentage": 55.03, "elapsed_time": "1 day, 16:09:48", "remaining_time": "1 day, 8:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5299, "total_steps": 9627, "loss": 1.3871, "learning_rate": 4.2111403838853034e-05, "epoch": 0.5504310792562584, "percentage": 55.04, "elapsed_time": "1 day, 16:10:16", "remaining_time": "1 day, 8:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5300, "total_steps": 9627, "loss": 1.5378, "learning_rate": 4.209529204339553e-05, "epoch": 0.5505349537758388, "percentage": 55.05, "elapsed_time": "1 day, 16:10:46", "remaining_time": "1 day, 8:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5301, "total_steps": 9627, "loss": 1.8026, "learning_rate": 4.207918108972776e-05, "epoch": 0.5506388282954191, "percentage": 55.06, "elapsed_time": "1 day, 16:11:13", "remaining_time": "1 day, 8:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5302, "total_steps": 9627, "loss": 1.6863, "learning_rate": 4.2063070979565426e-05, "epoch": 0.5507427028149995, "percentage": 55.07, "elapsed_time": "1 day, 16:11:42", "remaining_time": "1 day, 8:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5303, "total_steps": 9627, "loss": 1.5964, "learning_rate": 4.204696171462411e-05, "epoch": 0.5508465773345799, "percentage": 55.08, "elapsed_time": "1 day, 16:12:11", "remaining_time": "1 day, 8:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5304, "total_steps": 9627, "loss": 1.7334, "learning_rate": 4.203085329661935e-05, "epoch": 0.5509504518541601, "percentage": 55.1, "elapsed_time": "1 day, 16:12:39", "remaining_time": "1 day, 8:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5305, "total_steps": 9627, "loss": 1.7121, "learning_rate": 4.201474572726654e-05, "epoch": 0.5510543263737405, "percentage": 55.11, "elapsed_time": "1 day, 16:13:08", "remaining_time": "1 day, 8:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5306, "total_steps": 9627, "loss": 1.7883, "learning_rate": 4.199863900828102e-05, "epoch": 0.5511582008933209, "percentage": 55.12, "elapsed_time": "1 day, 16:13:36", "remaining_time": "1 day, 8:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5307, "total_steps": 9627, "loss": 1.7145, "learning_rate": 4.1982533141378056e-05, "epoch": 0.5512620754129012, "percentage": 55.13, "elapsed_time": "1 day, 16:14:04", "remaining_time": "1 day, 8:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5308, "total_steps": 9627, "loss": 1.7868, "learning_rate": 4.1966428128272754e-05, "epoch": 0.5513659499324816, "percentage": 55.14, "elapsed_time": "1 day, 16:14:34", "remaining_time": "1 day, 8:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5309, "total_steps": 9627, "loss": 1.5348, "learning_rate": 4.195032397068019e-05, "epoch": 0.5514698244520619, "percentage": 55.15, "elapsed_time": "1 day, 16:15:01", "remaining_time": "1 day, 8:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5310, "total_steps": 9627, "loss": 1.8076, "learning_rate": 4.193422067031535e-05, "epoch": 0.5515736989716422, "percentage": 55.16, "elapsed_time": "1 day, 16:15:31", "remaining_time": "1 day, 8:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5311, "total_steps": 9627, "loss": 1.7471, "learning_rate": 4.191811822889307e-05, "epoch": 0.5516775734912226, "percentage": 55.17, "elapsed_time": "1 day, 16:15:59", "remaining_time": "1 day, 8:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5312, "total_steps": 9627, "loss": 1.6095, "learning_rate": 4.190201664812816e-05, "epoch": 0.551781448010803, "percentage": 55.18, "elapsed_time": "1 day, 16:16:28", "remaining_time": "1 day, 8:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5313, "total_steps": 9627, "loss": 1.7719, "learning_rate": 4.188591592973534e-05, "epoch": 0.5518853225303832, "percentage": 55.19, "elapsed_time": "1 day, 16:16:56", "remaining_time": "1 day, 8:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5314, "total_steps": 9627, "loss": 1.7216, "learning_rate": 4.1869816075429145e-05, "epoch": 0.5519891970499636, "percentage": 55.2, "elapsed_time": "1 day, 16:17:24", "remaining_time": "1 day, 8:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5315, "total_steps": 9627, "loss": 1.7245, "learning_rate": 4.1853717086924136e-05, "epoch": 0.552093071569544, "percentage": 55.21, "elapsed_time": "1 day, 16:17:54", "remaining_time": "1 day, 8:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5316, "total_steps": 9627, "loss": 1.8018, "learning_rate": 4.183761896593472e-05, "epoch": 0.5521969460891243, "percentage": 55.22, "elapsed_time": "1 day, 16:18:22", "remaining_time": "1 day, 8:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5317, "total_steps": 9627, "loss": 1.628, "learning_rate": 4.182152171417521e-05, "epoch": 0.5523008206087047, "percentage": 55.23, "elapsed_time": "1 day, 16:18:51", "remaining_time": "1 day, 8:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5318, "total_steps": 9627, "loss": 1.6717, "learning_rate": 4.180542533335984e-05, "epoch": 0.552404695128285, "percentage": 55.24, "elapsed_time": "1 day, 16:19:19", "remaining_time": "1 day, 8:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5319, "total_steps": 9627, "loss": 1.7005, "learning_rate": 4.1789329825202736e-05, "epoch": 0.5525085696478654, "percentage": 55.25, "elapsed_time": "1 day, 16:19:48", "remaining_time": "1 day, 8:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5320, "total_steps": 9627, "loss": 1.7466, "learning_rate": 4.177323519141799e-05, "epoch": 0.5526124441674457, "percentage": 55.26, "elapsed_time": "1 day, 16:20:16", "remaining_time": "1 day, 8:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5321, "total_steps": 9627, "loss": 1.6648, "learning_rate": 4.1757141433719506e-05, "epoch": 0.5527163186870261, "percentage": 55.27, "elapsed_time": "1 day, 16:20:45", "remaining_time": "1 day, 8:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5322, "total_steps": 9627, "loss": 1.5708, "learning_rate": 4.174104855382117e-05, "epoch": 0.5528201932066065, "percentage": 55.28, "elapsed_time": "1 day, 16:21:13", "remaining_time": "1 day, 8:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5323, "total_steps": 9627, "loss": 1.6883, "learning_rate": 4.1724956553436756e-05, "epoch": 0.5529240677261867, "percentage": 55.29, "elapsed_time": "1 day, 16:21:42", "remaining_time": "1 day, 8:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5324, "total_steps": 9627, "loss": 1.7223, "learning_rate": 4.17088654342799e-05, "epoch": 0.5530279422457671, "percentage": 55.3, "elapsed_time": "1 day, 16:22:11", "remaining_time": "1 day, 8:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5325, "total_steps": 9627, "loss": 1.8179, "learning_rate": 4.1692775198064194e-05, "epoch": 0.5531318167653475, "percentage": 55.31, "elapsed_time": "1 day, 16:22:39", "remaining_time": "1 day, 8:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5326, "total_steps": 9627, "loss": 1.5664, "learning_rate": 4.167668584650316e-05, "epoch": 0.5532356912849278, "percentage": 55.32, "elapsed_time": "1 day, 16:23:07", "remaining_time": "1 day, 8:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5327, "total_steps": 9627, "loss": 1.6096, "learning_rate": 4.166059738131013e-05, "epoch": 0.5533395658045082, "percentage": 55.33, "elapsed_time": "1 day, 16:23:36", "remaining_time": "1 day, 8:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5328, "total_steps": 9627, "loss": 1.8148, "learning_rate": 4.164450980419844e-05, "epoch": 0.5534434403240885, "percentage": 55.34, "elapsed_time": "1 day, 16:24:05", "remaining_time": "1 day, 8:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5329, "total_steps": 9627, "loss": 1.6699, "learning_rate": 4.162842311688129e-05, "epoch": 0.5535473148436688, "percentage": 55.35, "elapsed_time": "1 day, 16:24:33", "remaining_time": "1 day, 8:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5330, "total_steps": 9627, "loss": 1.7729, "learning_rate": 4.161233732107177e-05, "epoch": 0.5536511893632492, "percentage": 55.37, "elapsed_time": "1 day, 16:25:03", "remaining_time": "1 day, 8:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5331, "total_steps": 9627, "loss": 1.963, "learning_rate": 4.1596252418482884e-05, "epoch": 0.5537550638828296, "percentage": 55.38, "elapsed_time": "1 day, 16:25:30", "remaining_time": "1 day, 8:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5332, "total_steps": 9627, "loss": 1.8112, "learning_rate": 4.158016841082759e-05, "epoch": 0.5538589384024099, "percentage": 55.39, "elapsed_time": "1 day, 16:26:00", "remaining_time": "1 day, 8:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5333, "total_steps": 9627, "loss": 1.7265, "learning_rate": 4.1564085299818665e-05, "epoch": 0.5539628129219902, "percentage": 55.4, "elapsed_time": "1 day, 16:26:27", "remaining_time": "1 day, 8:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5334, "total_steps": 9627, "loss": 1.7181, "learning_rate": 4.154800308716885e-05, "epoch": 0.5540666874415706, "percentage": 55.41, "elapsed_time": "1 day, 16:26:55", "remaining_time": "1 day, 8:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5335, "total_steps": 9627, "loss": 1.8835, "learning_rate": 4.15319217745908e-05, "epoch": 0.5541705619611509, "percentage": 55.42, "elapsed_time": "1 day, 16:27:25", "remaining_time": "1 day, 8:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5336, "total_steps": 9627, "loss": 1.6447, "learning_rate": 4.151584136379702e-05, "epoch": 0.5542744364807313, "percentage": 55.43, "elapsed_time": "1 day, 16:27:53", "remaining_time": "1 day, 8:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5337, "total_steps": 9627, "loss": 1.7282, "learning_rate": 4.149976185649994e-05, "epoch": 0.5543783110003117, "percentage": 55.44, "elapsed_time": "1 day, 16:28:22", "remaining_time": "1 day, 8:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5338, "total_steps": 9627, "loss": 1.7406, "learning_rate": 4.148368325441194e-05, "epoch": 0.5544821855198919, "percentage": 55.45, "elapsed_time": "1 day, 16:28:50", "remaining_time": "1 day, 8:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5339, "total_steps": 9627, "loss": 1.7426, "learning_rate": 4.1467605559245226e-05, "epoch": 0.5545860600394723, "percentage": 55.46, "elapsed_time": "1 day, 16:29:18", "remaining_time": "1 day, 8:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5340, "total_steps": 9627, "loss": 1.8979, "learning_rate": 4.145152877271196e-05, "epoch": 0.5546899345590527, "percentage": 55.47, "elapsed_time": "1 day, 16:29:47", "remaining_time": "1 day, 8:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5341, "total_steps": 9627, "loss": 1.7588, "learning_rate": 4.143545289652422e-05, "epoch": 0.554793809078633, "percentage": 55.48, "elapsed_time": "1 day, 16:30:15", "remaining_time": "1 day, 8:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5342, "total_steps": 9627, "loss": 1.6979, "learning_rate": 4.141937793239392e-05, "epoch": 0.5548976835982133, "percentage": 55.49, "elapsed_time": "1 day, 16:30:43", "remaining_time": "1 day, 8:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5343, "total_steps": 9627, "loss": 1.6303, "learning_rate": 4.140330388203295e-05, "epoch": 0.5550015581177937, "percentage": 55.5, "elapsed_time": "1 day, 16:31:13", "remaining_time": "1 day, 8:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5344, "total_steps": 9627, "loss": 1.6592, "learning_rate": 4.138723074715306e-05, "epoch": 0.555105432637374, "percentage": 55.51, "elapsed_time": "1 day, 16:31:40", "remaining_time": "1 day, 8:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5345, "total_steps": 9627, "loss": 1.7364, "learning_rate": 4.1371158529465916e-05, "epoch": 0.5552093071569544, "percentage": 55.52, "elapsed_time": "1 day, 16:32:09", "remaining_time": "1 day, 8:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5346, "total_steps": 9627, "loss": 1.5759, "learning_rate": 4.1355087230683065e-05, "epoch": 0.5553131816765348, "percentage": 55.53, "elapsed_time": "1 day, 16:32:37", "remaining_time": "1 day, 8:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5347, "total_steps": 9627, "loss": 1.544, "learning_rate": 4.1339016852516e-05, "epoch": 0.5554170561961151, "percentage": 55.54, "elapsed_time": "1 day, 16:33:06", "remaining_time": "1 day, 8:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5348, "total_steps": 9627, "loss": 1.8926, "learning_rate": 4.132294739667609e-05, "epoch": 0.5555209307156954, "percentage": 55.55, "elapsed_time": "1 day, 16:33:35", "remaining_time": "1 day, 8:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5349, "total_steps": 9627, "loss": 1.741, "learning_rate": 4.130687886487459e-05, "epoch": 0.5556248052352758, "percentage": 55.56, "elapsed_time": "1 day, 16:34:03", "remaining_time": "1 day, 8:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5350, "total_steps": 9627, "loss": 1.6806, "learning_rate": 4.1290811258822685e-05, "epoch": 0.5557286797548562, "percentage": 55.57, "elapsed_time": "1 day, 16:34:32", "remaining_time": "1 day, 8:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5351, "total_steps": 9627, "loss": 1.9815, "learning_rate": 4.127474458023146e-05, "epoch": 0.5558325542744365, "percentage": 55.58, "elapsed_time": "1 day, 16:35:00", "remaining_time": "1 day, 8:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5352, "total_steps": 9627, "loss": 1.7249, "learning_rate": 4.125867883081186e-05, "epoch": 0.5559364287940168, "percentage": 55.59, "elapsed_time": "1 day, 16:35:28", "remaining_time": "1 day, 8:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5353, "total_steps": 9627, "loss": 1.546, "learning_rate": 4.124261401227477e-05, "epoch": 0.5560403033135972, "percentage": 55.6, "elapsed_time": "1 day, 16:35:57", "remaining_time": "1 day, 8:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5354, "total_steps": 9627, "loss": 1.6632, "learning_rate": 4.122655012633101e-05, "epoch": 0.5561441778331775, "percentage": 55.61, "elapsed_time": "1 day, 16:36:26", "remaining_time": "1 day, 8:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5355, "total_steps": 9627, "loss": 1.6128, "learning_rate": 4.121048717469119e-05, "epoch": 0.5562480523527579, "percentage": 55.62, "elapsed_time": "1 day, 16:36:54", "remaining_time": "1 day, 8:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5356, "total_steps": 9627, "loss": 1.618, "learning_rate": 4.119442515906595e-05, "epoch": 0.5563519268723383, "percentage": 55.64, "elapsed_time": "1 day, 16:37:23", "remaining_time": "1 day, 8:23:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5357, "total_steps": 9627, "loss": 1.787, "learning_rate": 4.117836408116574e-05, "epoch": 0.5564558013919185, "percentage": 55.65, "elapsed_time": "1 day, 16:37:51", "remaining_time": "1 day, 8:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5358, "total_steps": 9627, "loss": 1.6505, "learning_rate": 4.116230394270094e-05, "epoch": 0.5565596759114989, "percentage": 55.66, "elapsed_time": "1 day, 16:38:19", "remaining_time": "1 day, 8:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5359, "total_steps": 9627, "loss": 1.7579, "learning_rate": 4.114624474538183e-05, "epoch": 0.5566635504310793, "percentage": 55.67, "elapsed_time": "1 day, 16:38:48", "remaining_time": "1 day, 8:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5360, "total_steps": 9627, "loss": 1.7672, "learning_rate": 4.113018649091861e-05, "epoch": 0.5567674249506596, "percentage": 55.68, "elapsed_time": "1 day, 16:39:17", "remaining_time": "1 day, 8:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5361, "total_steps": 9627, "loss": 1.8521, "learning_rate": 4.111412918102132e-05, "epoch": 0.5568712994702399, "percentage": 55.69, "elapsed_time": "1 day, 16:39:46", "remaining_time": "1 day, 8:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5362, "total_steps": 9627, "loss": 1.6816, "learning_rate": 4.1098072817399956e-05, "epoch": 0.5569751739898203, "percentage": 55.7, "elapsed_time": "1 day, 16:40:14", "remaining_time": "1 day, 8:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5363, "total_steps": 9627, "loss": 1.7746, "learning_rate": 4.108201740176443e-05, "epoch": 0.5570790485094006, "percentage": 55.71, "elapsed_time": "1 day, 16:40:42", "remaining_time": "1 day, 8:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5364, "total_steps": 9627, "loss": 1.7837, "learning_rate": 4.106596293582446e-05, "epoch": 0.557182923028981, "percentage": 55.72, "elapsed_time": "1 day, 16:41:10", "remaining_time": "1 day, 8:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5365, "total_steps": 9627, "loss": 1.8066, "learning_rate": 4.104990942128976e-05, "epoch": 0.5572867975485614, "percentage": 55.73, "elapsed_time": "1 day, 16:41:39", "remaining_time": "1 day, 8:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5366, "total_steps": 9627, "loss": 1.472, "learning_rate": 4.10338568598699e-05, "epoch": 0.5573906720681416, "percentage": 55.74, "elapsed_time": "1 day, 16:42:08", "remaining_time": "1 day, 8:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5367, "total_steps": 9627, "loss": 1.6328, "learning_rate": 4.1017805253274336e-05, "epoch": 0.557494546587722, "percentage": 55.75, "elapsed_time": "1 day, 16:42:36", "remaining_time": "1 day, 8:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5368, "total_steps": 9627, "loss": 1.5223, "learning_rate": 4.100175460321244e-05, "epoch": 0.5575984211073024, "percentage": 55.76, "elapsed_time": "1 day, 16:43:04", "remaining_time": "1 day, 8:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5369, "total_steps": 9627, "loss": 1.685, "learning_rate": 4.0985704911393506e-05, "epoch": 0.5577022956268827, "percentage": 55.77, "elapsed_time": "1 day, 16:43:33", "remaining_time": "1 day, 8:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5370, "total_steps": 9627, "loss": 1.7821, "learning_rate": 4.096965617952667e-05, "epoch": 0.557806170146463, "percentage": 55.78, "elapsed_time": "1 day, 16:44:02", "remaining_time": "1 day, 8:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5371, "total_steps": 9627, "loss": 1.7831, "learning_rate": 4.0953608409321024e-05, "epoch": 0.5579100446660434, "percentage": 55.79, "elapsed_time": "1 day, 16:44:31", "remaining_time": "1 day, 8:17:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5372, "total_steps": 9627, "loss": 1.6776, "learning_rate": 4.093756160248551e-05, "epoch": 0.5580139191856238, "percentage": 55.8, "elapsed_time": "1 day, 16:44:59", "remaining_time": "1 day, 8:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5373, "total_steps": 9627, "loss": 1.8743, "learning_rate": 4.092151576072901e-05, "epoch": 0.5581177937052041, "percentage": 55.81, "elapsed_time": "1 day, 16:45:27", "remaining_time": "1 day, 8:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5374, "total_steps": 9627, "loss": 1.6113, "learning_rate": 4.0905470885760244e-05, "epoch": 0.5582216682247845, "percentage": 55.82, "elapsed_time": "1 day, 16:45:56", "remaining_time": "1 day, 8:15:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5375, "total_steps": 9627, "loss": 1.842, "learning_rate": 4.088942697928789e-05, "epoch": 0.5583255427443649, "percentage": 55.83, "elapsed_time": "1 day, 16:46:24", "remaining_time": "1 day, 8:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5376, "total_steps": 9627, "loss": 1.7603, "learning_rate": 4.087338404302052e-05, "epoch": 0.5584294172639451, "percentage": 55.84, "elapsed_time": "1 day, 16:46:53", "remaining_time": "1 day, 8:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5377, "total_steps": 9627, "loss": 1.597, "learning_rate": 4.0857342078666546e-05, "epoch": 0.5585332917835255, "percentage": 55.85, "elapsed_time": "1 day, 16:47:21", "remaining_time": "1 day, 8:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5378, "total_steps": 9627, "loss": 1.7326, "learning_rate": 4.0841301087934326e-05, "epoch": 0.5586371663031059, "percentage": 55.86, "elapsed_time": "1 day, 16:47:49", "remaining_time": "1 day, 8:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5379, "total_steps": 9627, "loss": 1.5858, "learning_rate": 4.082526107253212e-05, "epoch": 0.5587410408226862, "percentage": 55.87, "elapsed_time": "1 day, 16:48:19", "remaining_time": "1 day, 8:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5380, "total_steps": 9627, "loss": 1.5894, "learning_rate": 4.080922203416801e-05, "epoch": 0.5588449153422665, "percentage": 55.88, "elapsed_time": "1 day, 16:48:47", "remaining_time": "1 day, 8:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5381, "total_steps": 9627, "loss": 1.6721, "learning_rate": 4.079318397455007e-05, "epoch": 0.5589487898618469, "percentage": 55.89, "elapsed_time": "1 day, 16:49:15", "remaining_time": "1 day, 8:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5382, "total_steps": 9627, "loss": 1.8013, "learning_rate": 4.077714689538624e-05, "epoch": 0.5590526643814272, "percentage": 55.91, "elapsed_time": "1 day, 16:49:43", "remaining_time": "1 day, 8:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5383, "total_steps": 9627, "loss": 1.6274, "learning_rate": 4.076111079838431e-05, "epoch": 0.5591565389010076, "percentage": 55.92, "elapsed_time": "1 day, 16:50:13", "remaining_time": "1 day, 8:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5384, "total_steps": 9627, "loss": 1.7273, "learning_rate": 4.074507568525201e-05, "epoch": 0.559260413420588, "percentage": 55.93, "elapsed_time": "1 day, 16:50:41", "remaining_time": "1 day, 8:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5385, "total_steps": 9627, "loss": 1.6412, "learning_rate": 4.072904155769697e-05, "epoch": 0.5593642879401682, "percentage": 55.94, "elapsed_time": "1 day, 16:51:10", "remaining_time": "1 day, 8:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5386, "total_steps": 9627, "loss": 1.8271, "learning_rate": 4.0713008417426676e-05, "epoch": 0.5594681624597486, "percentage": 55.95, "elapsed_time": "1 day, 16:51:37", "remaining_time": "1 day, 8:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5387, "total_steps": 9627, "loss": 1.7992, "learning_rate": 4.069697626614855e-05, "epoch": 0.559572036979329, "percentage": 55.96, "elapsed_time": "1 day, 16:52:06", "remaining_time": "1 day, 8:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5388, "total_steps": 9627, "loss": 1.4903, "learning_rate": 4.068094510556989e-05, "epoch": 0.5596759114989093, "percentage": 55.97, "elapsed_time": "1 day, 16:52:35", "remaining_time": "1 day, 8:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5389, "total_steps": 9627, "loss": 1.5853, "learning_rate": 4.066491493739788e-05, "epoch": 0.5597797860184897, "percentage": 55.98, "elapsed_time": "1 day, 16:53:04", "remaining_time": "1 day, 8:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5390, "total_steps": 9627, "loss": 1.7506, "learning_rate": 4.064888576333961e-05, "epoch": 0.55988366053807, "percentage": 55.99, "elapsed_time": "1 day, 16:53:32", "remaining_time": "1 day, 8:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5391, "total_steps": 9627, "loss": 1.6431, "learning_rate": 4.063285758510207e-05, "epoch": 0.5599875350576503, "percentage": 56.0, "elapsed_time": "1 day, 16:54:00", "remaining_time": "1 day, 8:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5392, "total_steps": 9627, "loss": 1.7715, "learning_rate": 4.061683040439214e-05, "epoch": 0.5600914095772307, "percentage": 56.01, "elapsed_time": "1 day, 16:54:28", "remaining_time": "1 day, 8:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5393, "total_steps": 9627, "loss": 1.6373, "learning_rate": 4.060080422291656e-05, "epoch": 0.5601952840968111, "percentage": 56.02, "elapsed_time": "1 day, 16:54:57", "remaining_time": "1 day, 8:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5394, "total_steps": 9627, "loss": 1.7707, "learning_rate": 4.058477904238203e-05, "epoch": 0.5602991586163913, "percentage": 56.03, "elapsed_time": "1 day, 16:55:25", "remaining_time": "1 day, 8:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5395, "total_steps": 9627, "loss": 1.8821, "learning_rate": 4.056875486449507e-05, "epoch": 0.5604030331359717, "percentage": 56.04, "elapsed_time": "1 day, 16:55:54", "remaining_time": "1 day, 8:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5396, "total_steps": 9627, "loss": 1.7404, "learning_rate": 4.055273169096216e-05, "epoch": 0.5605069076555521, "percentage": 56.05, "elapsed_time": "1 day, 16:56:22", "remaining_time": "1 day, 8:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5397, "total_steps": 9627, "loss": 1.679, "learning_rate": 4.053670952348964e-05, "epoch": 0.5606107821751325, "percentage": 56.06, "elapsed_time": "1 day, 16:56:51", "remaining_time": "1 day, 8:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5398, "total_steps": 9627, "loss": 1.69, "learning_rate": 4.052068836378374e-05, "epoch": 0.5607146566947128, "percentage": 56.07, "elapsed_time": "1 day, 16:57:19", "remaining_time": "1 day, 8:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5399, "total_steps": 9627, "loss": 1.6595, "learning_rate": 4.050466821355058e-05, "epoch": 0.5608185312142931, "percentage": 56.08, "elapsed_time": "1 day, 16:57:48", "remaining_time": "1 day, 8:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5400, "total_steps": 9627, "loss": 1.7722, "learning_rate": 4.0488649074496186e-05, "epoch": 0.5609224057338735, "percentage": 56.09, "elapsed_time": "1 day, 16:58:16", "remaining_time": "1 day, 8:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5401, "total_steps": 9627, "loss": 1.5485, "learning_rate": 4.04726309483265e-05, "epoch": 0.5610262802534538, "percentage": 56.1, "elapsed_time": "1 day, 16:58:45", "remaining_time": "1 day, 8:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5402, "total_steps": 9627, "loss": 1.6444, "learning_rate": 4.045661383674727e-05, "epoch": 0.5611301547730342, "percentage": 56.11, "elapsed_time": "1 day, 16:59:13", "remaining_time": "1 day, 8:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5403, "total_steps": 9627, "loss": 1.8602, "learning_rate": 4.044059774146423e-05, "epoch": 0.5612340292926146, "percentage": 56.12, "elapsed_time": "1 day, 16:59:42", "remaining_time": "1 day, 8:02:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5404, "total_steps": 9627, "loss": 1.6232, "learning_rate": 4.0424582664182986e-05, "epoch": 0.5613379038121948, "percentage": 56.13, "elapsed_time": "1 day, 17:00:10", "remaining_time": "1 day, 8:02:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5405, "total_steps": 9627, "loss": 1.6325, "learning_rate": 4.040856860660897e-05, "epoch": 0.5614417783317752, "percentage": 56.14, "elapsed_time": "1 day, 17:00:39", "remaining_time": "1 day, 8:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5406, "total_steps": 9627, "loss": 1.6961, "learning_rate": 4.03925555704476e-05, "epoch": 0.5615456528513556, "percentage": 56.15, "elapsed_time": "1 day, 17:01:07", "remaining_time": "1 day, 8:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5407, "total_steps": 9627, "loss": 1.6689, "learning_rate": 4.0376543557404125e-05, "epoch": 0.5616495273709359, "percentage": 56.16, "elapsed_time": "1 day, 17:01:37", "remaining_time": "1 day, 8:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5408, "total_steps": 9627, "loss": 1.5847, "learning_rate": 4.036053256918368e-05, "epoch": 0.5617534018905163, "percentage": 56.18, "elapsed_time": "1 day, 17:02:04", "remaining_time": "1 day, 8:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5409, "total_steps": 9627, "loss": 1.7453, "learning_rate": 4.034452260749132e-05, "epoch": 0.5618572764100966, "percentage": 56.19, "elapsed_time": "1 day, 17:02:34", "remaining_time": "1 day, 8:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5410, "total_steps": 9627, "loss": 1.7059, "learning_rate": 4.032851367403201e-05, "epoch": 0.5619611509296769, "percentage": 56.2, "elapsed_time": "1 day, 17:03:01", "remaining_time": "1 day, 7:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5411, "total_steps": 9627, "loss": 1.6802, "learning_rate": 4.031250577051053e-05, "epoch": 0.5620650254492573, "percentage": 56.21, "elapsed_time": "1 day, 17:03:31", "remaining_time": "1 day, 7:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5412, "total_steps": 9627, "loss": 1.7492, "learning_rate": 4.0296498898631644e-05, "epoch": 0.5621688999688377, "percentage": 56.22, "elapsed_time": "1 day, 17:03:58", "remaining_time": "1 day, 7:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5413, "total_steps": 9627, "loss": 1.7393, "learning_rate": 4.028049306009992e-05, "epoch": 0.562272774488418, "percentage": 56.23, "elapsed_time": "1 day, 17:04:28", "remaining_time": "1 day, 7:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5414, "total_steps": 9627, "loss": 1.7905, "learning_rate": 4.026448825661987e-05, "epoch": 0.5623766490079983, "percentage": 56.24, "elapsed_time": "1 day, 17:04:57", "remaining_time": "1 day, 7:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5415, "total_steps": 9627, "loss": 1.8213, "learning_rate": 4.024848448989588e-05, "epoch": 0.5624805235275787, "percentage": 56.25, "elapsed_time": "1 day, 17:05:24", "remaining_time": "1 day, 7:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5416, "total_steps": 9627, "loss": 1.4981, "learning_rate": 4.023248176163224e-05, "epoch": 0.562584398047159, "percentage": 56.26, "elapsed_time": "1 day, 17:05:54", "remaining_time": "1 day, 7:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5417, "total_steps": 9627, "loss": 1.6849, "learning_rate": 4.021648007353309e-05, "epoch": 0.5626882725667394, "percentage": 56.27, "elapsed_time": "1 day, 17:06:21", "remaining_time": "1 day, 7:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5418, "total_steps": 9627, "loss": 1.5648, "learning_rate": 4.0200479427302486e-05, "epoch": 0.5627921470863197, "percentage": 56.28, "elapsed_time": "1 day, 17:06:50", "remaining_time": "1 day, 7:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5419, "total_steps": 9627, "loss": 1.8176, "learning_rate": 4.0184479824644413e-05, "epoch": 0.5628960216059, "percentage": 56.29, "elapsed_time": "1 day, 17:07:19", "remaining_time": "1 day, 7:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5420, "total_steps": 9627, "loss": 1.6165, "learning_rate": 4.016848126726266e-05, "epoch": 0.5629998961254804, "percentage": 56.3, "elapsed_time": "1 day, 17:07:47", "remaining_time": "1 day, 7:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5421, "total_steps": 9627, "loss": 1.5583, "learning_rate": 4.0152483756860956e-05, "epoch": 0.5631037706450608, "percentage": 56.31, "elapsed_time": "1 day, 17:08:17", "remaining_time": "1 day, 7:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5422, "total_steps": 9627, "loss": 1.7998, "learning_rate": 4.0136487295142913e-05, "epoch": 0.5632076451646412, "percentage": 56.32, "elapsed_time": "1 day, 17:08:44", "remaining_time": "1 day, 7:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5423, "total_steps": 9627, "loss": 2.054, "learning_rate": 4.0120491883812065e-05, "epoch": 0.5633115196842214, "percentage": 56.33, "elapsed_time": "1 day, 17:09:13", "remaining_time": "1 day, 7:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5424, "total_steps": 9627, "loss": 1.7295, "learning_rate": 4.010449752457175e-05, "epoch": 0.5634153942038018, "percentage": 56.34, "elapsed_time": "1 day, 17:09:42", "remaining_time": "1 day, 7:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5425, "total_steps": 9627, "loss": 1.21, "learning_rate": 4.0088504219125253e-05, "epoch": 0.5635192687233822, "percentage": 56.35, "elapsed_time": "1 day, 17:10:10", "remaining_time": "1 day, 7:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5426, "total_steps": 9627, "loss": 1.6524, "learning_rate": 4.007251196917576e-05, "epoch": 0.5636231432429625, "percentage": 56.36, "elapsed_time": "1 day, 17:10:39", "remaining_time": "1 day, 7:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5427, "total_steps": 9627, "loss": 1.6198, "learning_rate": 4.00565207764263e-05, "epoch": 0.5637270177625429, "percentage": 56.37, "elapsed_time": "1 day, 17:11:06", "remaining_time": "1 day, 7:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5428, "total_steps": 9627, "loss": 1.6297, "learning_rate": 4.00405306425798e-05, "epoch": 0.5638308922821232, "percentage": 56.38, "elapsed_time": "1 day, 17:11:36", "remaining_time": "1 day, 7:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5429, "total_steps": 9627, "loss": 1.6958, "learning_rate": 4.0024541569339126e-05, "epoch": 0.5639347668017035, "percentage": 56.39, "elapsed_time": "1 day, 17:12:03", "remaining_time": "1 day, 7:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5430, "total_steps": 9627, "loss": 1.5767, "learning_rate": 4.0008553558406945e-05, "epoch": 0.5640386413212839, "percentage": 56.4, "elapsed_time": "1 day, 17:12:31", "remaining_time": "1 day, 7:51:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5431, "total_steps": 9627, "loss": 1.6399, "learning_rate": 3.9992566611485866e-05, "epoch": 0.5641425158408643, "percentage": 56.41, "elapsed_time": "1 day, 17:13:00", "remaining_time": "1 day, 7:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5432, "total_steps": 9627, "loss": 1.485, "learning_rate": 3.9976580730278405e-05, "epoch": 0.5642463903604445, "percentage": 56.42, "elapsed_time": "1 day, 17:13:29", "remaining_time": "1 day, 7:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5433, "total_steps": 9627, "loss": 1.6078, "learning_rate": 3.99605959164869e-05, "epoch": 0.5643502648800249, "percentage": 56.44, "elapsed_time": "1 day, 17:13:57", "remaining_time": "1 day, 7:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5434, "total_steps": 9627, "loss": 1.7178, "learning_rate": 3.9944612171813616e-05, "epoch": 0.5644541393996053, "percentage": 56.45, "elapsed_time": "1 day, 17:14:25", "remaining_time": "1 day, 7:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5435, "total_steps": 9627, "loss": 1.7114, "learning_rate": 3.992862949796072e-05, "epoch": 0.5645580139191856, "percentage": 56.46, "elapsed_time": "1 day, 17:14:54", "remaining_time": "1 day, 7:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5436, "total_steps": 9627, "loss": 1.5976, "learning_rate": 3.991264789663019e-05, "epoch": 0.564661888438766, "percentage": 56.47, "elapsed_time": "1 day, 17:15:23", "remaining_time": "1 day, 7:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5437, "total_steps": 9627, "loss": 1.7029, "learning_rate": 3.989666736952399e-05, "epoch": 0.5647657629583464, "percentage": 56.48, "elapsed_time": "1 day, 17:15:51", "remaining_time": "1 day, 7:48:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5438, "total_steps": 9627, "loss": 1.5416, "learning_rate": 3.9880687918343916e-05, "epoch": 0.5648696374779266, "percentage": 56.49, "elapsed_time": "1 day, 17:16:18", "remaining_time": "1 day, 7:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5439, "total_steps": 9627, "loss": 1.7622, "learning_rate": 3.986470954479163e-05, "epoch": 0.564973511997507, "percentage": 56.5, "elapsed_time": "1 day, 17:16:48", "remaining_time": "1 day, 7:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5440, "total_steps": 9627, "loss": 1.6935, "learning_rate": 3.984873225056873e-05, "epoch": 0.5650773865170874, "percentage": 56.51, "elapsed_time": "1 day, 17:17:15", "remaining_time": "1 day, 7:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5441, "total_steps": 9627, "loss": 1.6477, "learning_rate": 3.983275603737666e-05, "epoch": 0.5651812610366677, "percentage": 56.52, "elapsed_time": "1 day, 17:17:45", "remaining_time": "1 day, 7:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5442, "total_steps": 9627, "loss": 1.7526, "learning_rate": 3.981678090691676e-05, "epoch": 0.565285135556248, "percentage": 56.53, "elapsed_time": "1 day, 17:18:12", "remaining_time": "1 day, 7:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5443, "total_steps": 9627, "loss": 1.7972, "learning_rate": 3.980080686089026e-05, "epoch": 0.5653890100758284, "percentage": 56.54, "elapsed_time": "1 day, 17:18:42", "remaining_time": "1 day, 7:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5444, "total_steps": 9627, "loss": 1.738, "learning_rate": 3.9784833900998286e-05, "epoch": 0.5654928845954087, "percentage": 56.55, "elapsed_time": "1 day, 17:19:10", "remaining_time": "1 day, 7:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5445, "total_steps": 9627, "loss": 1.6437, "learning_rate": 3.97688620289418e-05, "epoch": 0.5655967591149891, "percentage": 56.56, "elapsed_time": "1 day, 17:19:38", "remaining_time": "1 day, 7:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5446, "total_steps": 9627, "loss": 1.6672, "learning_rate": 3.975289124642171e-05, "epoch": 0.5657006336345695, "percentage": 56.57, "elapsed_time": "1 day, 17:20:06", "remaining_time": "1 day, 7:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5447, "total_steps": 9627, "loss": 1.6666, "learning_rate": 3.9736921555138787e-05, "epoch": 0.5658045081541497, "percentage": 56.58, "elapsed_time": "1 day, 17:20:35", "remaining_time": "1 day, 7:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5448, "total_steps": 9627, "loss": 1.6013, "learning_rate": 3.972095295679365e-05, "epoch": 0.5659083826737301, "percentage": 56.59, "elapsed_time": "1 day, 17:21:04", "remaining_time": "1 day, 7:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5449, "total_steps": 9627, "loss": 1.6795, "learning_rate": 3.9704985453086833e-05, "epoch": 0.5660122571933105, "percentage": 56.6, "elapsed_time": "1 day, 17:21:32", "remaining_time": "1 day, 7:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5450, "total_steps": 9627, "loss": 1.4858, "learning_rate": 3.968901904571877e-05, "epoch": 0.5661161317128909, "percentage": 56.61, "elapsed_time": "1 day, 17:22:01", "remaining_time": "1 day, 7:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5451, "total_steps": 9627, "loss": 1.5509, "learning_rate": 3.967305373638976e-05, "epoch": 0.5662200062324712, "percentage": 56.62, "elapsed_time": "1 day, 17:22:29", "remaining_time": "1 day, 7:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5452, "total_steps": 9627, "loss": 1.6271, "learning_rate": 3.965708952679996e-05, "epoch": 0.5663238807520515, "percentage": 56.63, "elapsed_time": "1 day, 17:22:58", "remaining_time": "1 day, 7:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5453, "total_steps": 9627, "loss": 1.656, "learning_rate": 3.9641126418649456e-05, "epoch": 0.5664277552716319, "percentage": 56.64, "elapsed_time": "1 day, 17:23:26", "remaining_time": "1 day, 7:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5454, "total_steps": 9627, "loss": 1.6666, "learning_rate": 3.962516441363818e-05, "epoch": 0.5665316297912122, "percentage": 56.65, "elapsed_time": "1 day, 17:23:55", "remaining_time": "1 day, 7:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5455, "total_steps": 9627, "loss": 1.5975, "learning_rate": 3.9609203513465974e-05, "epoch": 0.5666355043107926, "percentage": 56.66, "elapsed_time": "1 day, 17:24:23", "remaining_time": "1 day, 7:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5456, "total_steps": 9627, "loss": 1.7687, "learning_rate": 3.9593243719832536e-05, "epoch": 0.566739378830373, "percentage": 56.67, "elapsed_time": "1 day, 17:24:52", "remaining_time": "1 day, 7:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5457, "total_steps": 9627, "loss": 1.6263, "learning_rate": 3.957728503443748e-05, "epoch": 0.5668432533499532, "percentage": 56.68, "elapsed_time": "1 day, 17:25:20", "remaining_time": "1 day, 7:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5458, "total_steps": 9627, "loss": 1.6705, "learning_rate": 3.956132745898025e-05, "epoch": 0.5669471278695336, "percentage": 56.69, "elapsed_time": "1 day, 17:25:49", "remaining_time": "1 day, 7:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5459, "total_steps": 9627, "loss": 1.6423, "learning_rate": 3.954537099516021e-05, "epoch": 0.567051002389114, "percentage": 56.71, "elapsed_time": "1 day, 17:26:17", "remaining_time": "1 day, 7:38:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5460, "total_steps": 9627, "loss": 1.7335, "learning_rate": 3.952941564467665e-05, "epoch": 0.5671548769086943, "percentage": 56.72, "elapsed_time": "1 day, 17:26:45", "remaining_time": "1 day, 7:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5461, "total_steps": 9627, "loss": 1.7162, "learning_rate": 3.951346140922863e-05, "epoch": 0.5672587514282746, "percentage": 56.73, "elapsed_time": "1 day, 17:27:14", "remaining_time": "1 day, 7:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5462, "total_steps": 9627, "loss": 1.7051, "learning_rate": 3.949750829051516e-05, "epoch": 0.567362625947855, "percentage": 56.74, "elapsed_time": "1 day, 17:27:42", "remaining_time": "1 day, 7:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5463, "total_steps": 9627, "loss": 1.5073, "learning_rate": 3.948155629023515e-05, "epoch": 0.5674665004674353, "percentage": 56.75, "elapsed_time": "1 day, 17:28:11", "remaining_time": "1 day, 7:36:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5464, "total_steps": 9627, "loss": 1.7606, "learning_rate": 3.946560541008734e-05, "epoch": 0.5675703749870157, "percentage": 56.76, "elapsed_time": "1 day, 17:28:39", "remaining_time": "1 day, 7:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5465, "total_steps": 9627, "loss": 1.576, "learning_rate": 3.9449655651770365e-05, "epoch": 0.5676742495065961, "percentage": 56.77, "elapsed_time": "1 day, 17:29:07", "remaining_time": "1 day, 7:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5466, "total_steps": 9627, "loss": 1.6677, "learning_rate": 3.943370701698281e-05, "epoch": 0.5677781240261763, "percentage": 56.78, "elapsed_time": "1 day, 17:29:36", "remaining_time": "1 day, 7:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5467, "total_steps": 9627, "loss": 1.7007, "learning_rate": 3.9417759507423004e-05, "epoch": 0.5678819985457567, "percentage": 56.79, "elapsed_time": "1 day, 17:30:05", "remaining_time": "1 day, 7:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5468, "total_steps": 9627, "loss": 1.788, "learning_rate": 3.940181312478928e-05, "epoch": 0.5679858730653371, "percentage": 56.8, "elapsed_time": "1 day, 17:30:32", "remaining_time": "1 day, 7:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5469, "total_steps": 9627, "loss": 1.7881, "learning_rate": 3.938586787077978e-05, "epoch": 0.5680897475849174, "percentage": 56.81, "elapsed_time": "1 day, 17:31:01", "remaining_time": "1 day, 7:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5470, "total_steps": 9627, "loss": 1.8009, "learning_rate": 3.936992374709256e-05, "epoch": 0.5681936221044978, "percentage": 56.82, "elapsed_time": "1 day, 17:31:30", "remaining_time": "1 day, 7:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5471, "total_steps": 9627, "loss": 1.7802, "learning_rate": 3.935398075542554e-05, "epoch": 0.5682974966240781, "percentage": 56.83, "elapsed_time": "1 day, 17:31:59", "remaining_time": "1 day, 7:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5472, "total_steps": 9627, "loss": 1.5211, "learning_rate": 3.933803889747655e-05, "epoch": 0.5684013711436584, "percentage": 56.84, "elapsed_time": "1 day, 17:32:27", "remaining_time": "1 day, 7:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5473, "total_steps": 9627, "loss": 1.6319, "learning_rate": 3.9322098174943226e-05, "epoch": 0.5685052456632388, "percentage": 56.85, "elapsed_time": "1 day, 17:32:56", "remaining_time": "1 day, 7:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5474, "total_steps": 9627, "loss": 1.4707, "learning_rate": 3.930615858952316e-05, "epoch": 0.5686091201828192, "percentage": 56.86, "elapsed_time": "1 day, 17:33:23", "remaining_time": "1 day, 7:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5475, "total_steps": 9627, "loss": 1.7746, "learning_rate": 3.929022014291379e-05, "epoch": 0.5687129947023996, "percentage": 56.87, "elapsed_time": "1 day, 17:33:52", "remaining_time": "1 day, 7:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5476, "total_steps": 9627, "loss": 1.7012, "learning_rate": 3.927428283681245e-05, "epoch": 0.5688168692219798, "percentage": 56.88, "elapsed_time": "1 day, 17:34:21", "remaining_time": "1 day, 7:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5477, "total_steps": 9627, "loss": 1.623, "learning_rate": 3.925834667291631e-05, "epoch": 0.5689207437415602, "percentage": 56.89, "elapsed_time": "1 day, 17:34:48", "remaining_time": "1 day, 7:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5478, "total_steps": 9627, "loss": 1.6304, "learning_rate": 3.924241165292245e-05, "epoch": 0.5690246182611406, "percentage": 56.9, "elapsed_time": "1 day, 17:35:18", "remaining_time": "1 day, 7:29:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5479, "total_steps": 9627, "loss": 1.7869, "learning_rate": 3.922647777852786e-05, "epoch": 0.5691284927807209, "percentage": 56.91, "elapsed_time": "1 day, 17:35:45", "remaining_time": "1 day, 7:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5480, "total_steps": 9627, "loss": 1.7863, "learning_rate": 3.9210545051429337e-05, "epoch": 0.5692323673003012, "percentage": 56.92, "elapsed_time": "1 day, 17:36:15", "remaining_time": "1 day, 7:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5481, "total_steps": 9627, "loss": 1.7295, "learning_rate": 3.919461347332361e-05, "epoch": 0.5693362418198816, "percentage": 56.93, "elapsed_time": "1 day, 17:36:42", "remaining_time": "1 day, 7:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5482, "total_steps": 9627, "loss": 1.5988, "learning_rate": 3.917868304590726e-05, "epoch": 0.5694401163394619, "percentage": 56.94, "elapsed_time": "1 day, 17:37:11", "remaining_time": "1 day, 7:28:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5483, "total_steps": 9627, "loss": 1.6312, "learning_rate": 3.916275377087676e-05, "epoch": 0.5695439908590423, "percentage": 56.95, "elapsed_time": "1 day, 17:37:40", "remaining_time": "1 day, 7:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5484, "total_steps": 9627, "loss": 1.7144, "learning_rate": 3.9146825649928446e-05, "epoch": 0.5696478653786227, "percentage": 56.96, "elapsed_time": "1 day, 17:38:08", "remaining_time": "1 day, 7:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5485, "total_steps": 9627, "loss": 1.8591, "learning_rate": 3.913089868475855e-05, "epoch": 0.5697517398982029, "percentage": 56.98, "elapsed_time": "1 day, 17:38:36", "remaining_time": "1 day, 7:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5486, "total_steps": 9627, "loss": 1.7331, "learning_rate": 3.911497287706315e-05, "epoch": 0.5698556144177833, "percentage": 56.99, "elapsed_time": "1 day, 17:39:04", "remaining_time": "1 day, 7:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5487, "total_steps": 9627, "loss": 1.867, "learning_rate": 3.909904822853823e-05, "epoch": 0.5699594889373637, "percentage": 57.0, "elapsed_time": "1 day, 17:39:35", "remaining_time": "1 day, 7:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5488, "total_steps": 9627, "loss": 1.7591, "learning_rate": 3.908312474087966e-05, "epoch": 0.570063363456944, "percentage": 57.01, "elapsed_time": "1 day, 17:40:02", "remaining_time": "1 day, 7:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5489, "total_steps": 9627, "loss": 1.7974, "learning_rate": 3.906720241578314e-05, "epoch": 0.5701672379765244, "percentage": 57.02, "elapsed_time": "1 day, 17:40:31", "remaining_time": "1 day, 7:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5490, "total_steps": 9627, "loss": 1.7685, "learning_rate": 3.905128125494427e-05, "epoch": 0.5702711124961047, "percentage": 57.03, "elapsed_time": "1 day, 17:40:59", "remaining_time": "1 day, 7:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5491, "total_steps": 9627, "loss": 1.7431, "learning_rate": 3.903536126005858e-05, "epoch": 0.570374987015685, "percentage": 57.04, "elapsed_time": "1 day, 17:41:28", "remaining_time": "1 day, 7:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5492, "total_steps": 9627, "loss": 1.8147, "learning_rate": 3.901944243282135e-05, "epoch": 0.5704788615352654, "percentage": 57.05, "elapsed_time": "1 day, 17:41:56", "remaining_time": "1 day, 7:23:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5493, "total_steps": 9627, "loss": 1.7233, "learning_rate": 3.900352477492786e-05, "epoch": 0.5705827360548458, "percentage": 57.06, "elapsed_time": "1 day, 17:42:25", "remaining_time": "1 day, 7:23:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5494, "total_steps": 9627, "loss": 1.5517, "learning_rate": 3.8987608288073216e-05, "epoch": 0.570686610574426, "percentage": 57.07, "elapsed_time": "1 day, 17:42:53", "remaining_time": "1 day, 7:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5495, "total_steps": 9627, "loss": 1.6967, "learning_rate": 3.897169297395238e-05, "epoch": 0.5707904850940064, "percentage": 57.08, "elapsed_time": "1 day, 17:43:20", "remaining_time": "1 day, 7:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5496, "total_steps": 9627, "loss": 1.4462, "learning_rate": 3.895577883426022e-05, "epoch": 0.5708943596135868, "percentage": 57.09, "elapsed_time": "1 day, 17:43:50", "remaining_time": "1 day, 7:21:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5497, "total_steps": 9627, "loss": 1.8624, "learning_rate": 3.893986587069147e-05, "epoch": 0.5709982341331671, "percentage": 57.1, "elapsed_time": "1 day, 17:44:18", "remaining_time": "1 day, 7:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5498, "total_steps": 9627, "loss": 1.6179, "learning_rate": 3.892395408494073e-05, "epoch": 0.5711021086527475, "percentage": 57.11, "elapsed_time": "1 day, 17:44:45", "remaining_time": "1 day, 7:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5499, "total_steps": 9627, "loss": 1.7387, "learning_rate": 3.890804347870248e-05, "epoch": 0.5712059831723278, "percentage": 57.12, "elapsed_time": "1 day, 17:45:14", "remaining_time": "1 day, 7:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5500, "total_steps": 9627, "loss": 1.4776, "learning_rate": 3.889213405367107e-05, "epoch": 0.5713098576919082, "percentage": 57.13, "elapsed_time": "1 day, 17:45:42", "remaining_time": "1 day, 7:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5501, "total_steps": 9627, "loss": 1.6338, "learning_rate": 3.887622581154077e-05, "epoch": 0.5714137322114885, "percentage": 57.14, "elapsed_time": "1 day, 17:46:11", "remaining_time": "1 day, 7:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5502, "total_steps": 9627, "loss": 1.9512, "learning_rate": 3.886031875400562e-05, "epoch": 0.5715176067310689, "percentage": 57.15, "elapsed_time": "1 day, 17:46:38", "remaining_time": "1 day, 7:19:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5503, "total_steps": 9627, "loss": 1.7856, "learning_rate": 3.884441288275965e-05, "epoch": 0.5716214812506493, "percentage": 57.16, "elapsed_time": "1 day, 17:47:08", "remaining_time": "1 day, 7:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5504, "total_steps": 9627, "loss": 1.6817, "learning_rate": 3.8828508199496694e-05, "epoch": 0.5717253557702295, "percentage": 57.17, "elapsed_time": "1 day, 17:47:35", "remaining_time": "1 day, 7:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5505, "total_steps": 9627, "loss": 1.803, "learning_rate": 3.8812604705910454e-05, "epoch": 0.5718292302898099, "percentage": 57.18, "elapsed_time": "1 day, 17:48:05", "remaining_time": "1 day, 7:17:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5506, "total_steps": 9627, "loss": 1.5654, "learning_rate": 3.8796702403694554e-05, "epoch": 0.5719331048093903, "percentage": 57.19, "elapsed_time": "1 day, 17:48:33", "remaining_time": "1 day, 7:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5507, "total_steps": 9627, "loss": 1.6287, "learning_rate": 3.8780801294542476e-05, "epoch": 0.5720369793289706, "percentage": 57.2, "elapsed_time": "1 day, 17:49:01", "remaining_time": "1 day, 7:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5508, "total_steps": 9627, "loss": 1.5963, "learning_rate": 3.876490138014752e-05, "epoch": 0.572140853848551, "percentage": 57.21, "elapsed_time": "1 day, 17:49:29", "remaining_time": "1 day, 7:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5509, "total_steps": 9627, "loss": 1.6819, "learning_rate": 3.874900266220295e-05, "epoch": 0.5722447283681313, "percentage": 57.22, "elapsed_time": "1 day, 17:49:58", "remaining_time": "1 day, 7:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5510, "total_steps": 9627, "loss": 1.5166, "learning_rate": 3.873310514240183e-05, "epoch": 0.5723486028877116, "percentage": 57.23, "elapsed_time": "1 day, 17:50:26", "remaining_time": "1 day, 7:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5511, "total_steps": 9627, "loss": 1.505, "learning_rate": 3.871720882243712e-05, "epoch": 0.572452477407292, "percentage": 57.25, "elapsed_time": "1 day, 17:50:55", "remaining_time": "1 day, 7:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5512, "total_steps": 9627, "loss": 1.6057, "learning_rate": 3.870131370400166e-05, "epoch": 0.5725563519268724, "percentage": 57.26, "elapsed_time": "1 day, 17:51:23", "remaining_time": "1 day, 7:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5513, "total_steps": 9627, "loss": 1.6186, "learning_rate": 3.868541978878818e-05, "epoch": 0.5726602264464526, "percentage": 57.27, "elapsed_time": "1 day, 17:51:51", "remaining_time": "1 day, 7:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5514, "total_steps": 9627, "loss": 1.5518, "learning_rate": 3.866952707848922e-05, "epoch": 0.572764100966033, "percentage": 57.28, "elapsed_time": "1 day, 17:52:20", "remaining_time": "1 day, 7:14:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5515, "total_steps": 9627, "loss": 1.7631, "learning_rate": 3.865363557479723e-05, "epoch": 0.5728679754856134, "percentage": 57.29, "elapsed_time": "1 day, 17:52:47", "remaining_time": "1 day, 7:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5516, "total_steps": 9627, "loss": 1.7801, "learning_rate": 3.863774527940457e-05, "epoch": 0.5729718500051937, "percentage": 57.3, "elapsed_time": "1 day, 17:53:16", "remaining_time": "1 day, 7:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5517, "total_steps": 9627, "loss": 1.4836, "learning_rate": 3.86218561940034e-05, "epoch": 0.5730757245247741, "percentage": 57.31, "elapsed_time": "1 day, 17:53:44", "remaining_time": "1 day, 7:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5518, "total_steps": 9627, "loss": 1.5733, "learning_rate": 3.860596832028579e-05, "epoch": 0.5731795990443544, "percentage": 57.32, "elapsed_time": "1 day, 17:54:13", "remaining_time": "1 day, 7:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5519, "total_steps": 9627, "loss": 1.7095, "learning_rate": 3.8590081659943694e-05, "epoch": 0.5732834735639347, "percentage": 57.33, "elapsed_time": "1 day, 17:54:41", "remaining_time": "1 day, 7:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5520, "total_steps": 9627, "loss": 1.7818, "learning_rate": 3.8574196214668876e-05, "epoch": 0.5733873480835151, "percentage": 57.34, "elapsed_time": "1 day, 17:55:10", "remaining_time": "1 day, 7:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5521, "total_steps": 9627, "loss": 1.5572, "learning_rate": 3.855831198615304e-05, "epoch": 0.5734912226030955, "percentage": 57.35, "elapsed_time": "1 day, 17:55:38", "remaining_time": "1 day, 7:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5522, "total_steps": 9627, "loss": 1.4641, "learning_rate": 3.854242897608775e-05, "epoch": 0.5735950971226758, "percentage": 57.36, "elapsed_time": "1 day, 17:56:06", "remaining_time": "1 day, 7:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5523, "total_steps": 9627, "loss": 1.3964, "learning_rate": 3.852654718616438e-05, "epoch": 0.5736989716422561, "percentage": 57.37, "elapsed_time": "1 day, 17:56:34", "remaining_time": "1 day, 7:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5524, "total_steps": 9627, "loss": 1.66, "learning_rate": 3.851066661807424e-05, "epoch": 0.5738028461618365, "percentage": 57.38, "elapsed_time": "1 day, 17:57:04", "remaining_time": "1 day, 7:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5525, "total_steps": 9627, "loss": 1.7209, "learning_rate": 3.849478727350849e-05, "epoch": 0.5739067206814168, "percentage": 57.39, "elapsed_time": "1 day, 17:57:31", "remaining_time": "1 day, 7:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5526, "total_steps": 9627, "loss": 1.6168, "learning_rate": 3.847890915415815e-05, "epoch": 0.5740105952009972, "percentage": 57.4, "elapsed_time": "1 day, 17:58:00", "remaining_time": "1 day, 7:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5527, "total_steps": 9627, "loss": 1.7073, "learning_rate": 3.8463032261714114e-05, "epoch": 0.5741144697205776, "percentage": 57.41, "elapsed_time": "1 day, 17:58:28", "remaining_time": "1 day, 7:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5528, "total_steps": 9627, "loss": 1.7536, "learning_rate": 3.8447156597867153e-05, "epoch": 0.5742183442401579, "percentage": 57.42, "elapsed_time": "1 day, 17:58:57", "remaining_time": "1 day, 7:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5529, "total_steps": 9627, "loss": 1.6032, "learning_rate": 3.843128216430791e-05, "epoch": 0.5743222187597382, "percentage": 57.43, "elapsed_time": "1 day, 17:59:25", "remaining_time": "1 day, 7:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5530, "total_steps": 9627, "loss": 1.6722, "learning_rate": 3.841540896272685e-05, "epoch": 0.5744260932793186, "percentage": 57.44, "elapsed_time": "1 day, 17:59:54", "remaining_time": "1 day, 7:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5531, "total_steps": 9627, "loss": 1.7742, "learning_rate": 3.83995369948144e-05, "epoch": 0.574529967798899, "percentage": 57.45, "elapsed_time": "1 day, 18:00:22", "remaining_time": "1 day, 7:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5532, "total_steps": 9627, "loss": 1.5992, "learning_rate": 3.838366626226078e-05, "epoch": 0.5746338423184792, "percentage": 57.46, "elapsed_time": "1 day, 18:00:49", "remaining_time": "1 day, 7:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5533, "total_steps": 9627, "loss": 1.7132, "learning_rate": 3.836779676675606e-05, "epoch": 0.5747377168380596, "percentage": 57.47, "elapsed_time": "1 day, 18:01:17", "remaining_time": "1 day, 7:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5534, "total_steps": 9627, "loss": 1.8061, "learning_rate": 3.8351928509990255e-05, "epoch": 0.57484159135764, "percentage": 57.48, "elapsed_time": "1 day, 18:01:46", "remaining_time": "1 day, 7:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5535, "total_steps": 9627, "loss": 1.7402, "learning_rate": 3.833606149365323e-05, "epoch": 0.5749454658772203, "percentage": 57.49, "elapsed_time": "1 day, 18:02:15", "remaining_time": "1 day, 7:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5536, "total_steps": 9627, "loss": 1.6522, "learning_rate": 3.832019571943465e-05, "epoch": 0.5750493403968007, "percentage": 57.5, "elapsed_time": "1 day, 18:02:44", "remaining_time": "1 day, 7:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5537, "total_steps": 9627, "loss": 1.8343, "learning_rate": 3.8304331189024127e-05, "epoch": 0.575153214916381, "percentage": 57.52, "elapsed_time": "1 day, 18:03:12", "remaining_time": "1 day, 7:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5538, "total_steps": 9627, "loss": 1.6463, "learning_rate": 3.828846790411111e-05, "epoch": 0.5752570894359613, "percentage": 57.53, "elapsed_time": "1 day, 18:03:40", "remaining_time": "1 day, 7:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5539, "total_steps": 9627, "loss": 1.672, "learning_rate": 3.82726058663849e-05, "epoch": 0.5753609639555417, "percentage": 57.54, "elapsed_time": "1 day, 18:04:09", "remaining_time": "1 day, 7:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5540, "total_steps": 9627, "loss": 1.8548, "learning_rate": 3.8256745077534684e-05, "epoch": 0.5754648384751221, "percentage": 57.55, "elapsed_time": "1 day, 18:04:37", "remaining_time": "1 day, 7:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5541, "total_steps": 9627, "loss": 1.8835, "learning_rate": 3.824088553924954e-05, "epoch": 0.5755687129947024, "percentage": 57.56, "elapsed_time": "1 day, 18:05:04", "remaining_time": "1 day, 7:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5542, "total_steps": 9627, "loss": 1.831, "learning_rate": 3.822502725321833e-05, "epoch": 0.5756725875142827, "percentage": 57.57, "elapsed_time": "1 day, 18:05:34", "remaining_time": "1 day, 7:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5543, "total_steps": 9627, "loss": 1.7199, "learning_rate": 3.8209170221129875e-05, "epoch": 0.5757764620338631, "percentage": 57.58, "elapsed_time": "1 day, 18:06:02", "remaining_time": "1 day, 7:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5544, "total_steps": 9627, "loss": 1.8026, "learning_rate": 3.819331444467284e-05, "epoch": 0.5758803365534434, "percentage": 57.59, "elapsed_time": "1 day, 18:06:31", "remaining_time": "1 day, 7:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5545, "total_steps": 9627, "loss": 1.6854, "learning_rate": 3.817745992553571e-05, "epoch": 0.5759842110730238, "percentage": 57.6, "elapsed_time": "1 day, 18:06:59", "remaining_time": "1 day, 7:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5546, "total_steps": 9627, "loss": 1.6003, "learning_rate": 3.816160666540687e-05, "epoch": 0.5760880855926042, "percentage": 57.61, "elapsed_time": "1 day, 18:07:27", "remaining_time": "1 day, 6:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5547, "total_steps": 9627, "loss": 1.8288, "learning_rate": 3.814575466597459e-05, "epoch": 0.5761919601121844, "percentage": 57.62, "elapsed_time": "1 day, 18:07:57", "remaining_time": "1 day, 6:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5548, "total_steps": 9627, "loss": 1.8433, "learning_rate": 3.8129903928926956e-05, "epoch": 0.5762958346317648, "percentage": 57.63, "elapsed_time": "1 day, 18:08:24", "remaining_time": "1 day, 6:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5549, "total_steps": 9627, "loss": 1.6735, "learning_rate": 3.811405445595197e-05, "epoch": 0.5763997091513452, "percentage": 57.64, "elapsed_time": "1 day, 18:08:52", "remaining_time": "1 day, 6:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5550, "total_steps": 9627, "loss": 1.5637, "learning_rate": 3.809820624873748e-05, "epoch": 0.5765035836709255, "percentage": 57.65, "elapsed_time": "1 day, 18:09:21", "remaining_time": "1 day, 6:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5551, "total_steps": 9627, "loss": 1.6252, "learning_rate": 3.808235930897118e-05, "epoch": 0.5766074581905059, "percentage": 57.66, "elapsed_time": "1 day, 18:09:49", "remaining_time": "1 day, 6:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5552, "total_steps": 9627, "loss": 1.7843, "learning_rate": 3.806651363834065e-05, "epoch": 0.5767113327100862, "percentage": 57.67, "elapsed_time": "1 day, 18:10:19", "remaining_time": "1 day, 6:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5553, "total_steps": 9627, "loss": 1.547, "learning_rate": 3.805066923853333e-05, "epoch": 0.5768152072296666, "percentage": 57.68, "elapsed_time": "1 day, 18:10:46", "remaining_time": "1 day, 6:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5554, "total_steps": 9627, "loss": 1.5512, "learning_rate": 3.803482611123654e-05, "epoch": 0.5769190817492469, "percentage": 57.69, "elapsed_time": "1 day, 18:11:14", "remaining_time": "1 day, 6:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5555, "total_steps": 9627, "loss": 1.5616, "learning_rate": 3.8018984258137423e-05, "epoch": 0.5770229562688273, "percentage": 57.7, "elapsed_time": "1 day, 18:11:43", "remaining_time": "1 day, 6:55:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5556, "total_steps": 9627, "loss": 1.8645, "learning_rate": 3.800314368092302e-05, "epoch": 0.5771268307884077, "percentage": 57.71, "elapsed_time": "1 day, 18:12:12", "remaining_time": "1 day, 6:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5557, "total_steps": 9627, "loss": 1.7879, "learning_rate": 3.798730438128027e-05, "epoch": 0.5772307053079879, "percentage": 57.72, "elapsed_time": "1 day, 18:12:39", "remaining_time": "1 day, 6:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5558, "total_steps": 9627, "loss": 1.8618, "learning_rate": 3.797146636089587e-05, "epoch": 0.5773345798275683, "percentage": 57.73, "elapsed_time": "1 day, 18:13:07", "remaining_time": "1 day, 6:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5559, "total_steps": 9627, "loss": 1.5837, "learning_rate": 3.795562962145649e-05, "epoch": 0.5774384543471487, "percentage": 57.74, "elapsed_time": "1 day, 18:13:35", "remaining_time": "1 day, 6:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5560, "total_steps": 9627, "loss": 1.6511, "learning_rate": 3.793979416464862e-05, "epoch": 0.577542328866729, "percentage": 57.75, "elapsed_time": "1 day, 18:14:05", "remaining_time": "1 day, 6:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5561, "total_steps": 9627, "loss": 1.5685, "learning_rate": 3.792395999215857e-05, "epoch": 0.5776462033863093, "percentage": 57.76, "elapsed_time": "1 day, 18:14:32", "remaining_time": "1 day, 6:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5562, "total_steps": 9627, "loss": 1.6031, "learning_rate": 3.790812710567259e-05, "epoch": 0.5777500779058897, "percentage": 57.78, "elapsed_time": "1 day, 18:15:01", "remaining_time": "1 day, 6:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5563, "total_steps": 9627, "loss": 1.6291, "learning_rate": 3.789229550687676e-05, "epoch": 0.57785395242547, "percentage": 57.79, "elapsed_time": "1 day, 18:15:29", "remaining_time": "1 day, 6:52:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5564, "total_steps": 9627, "loss": 1.7213, "learning_rate": 3.7876465197457014e-05, "epoch": 0.5779578269450504, "percentage": 57.8, "elapsed_time": "1 day, 18:15:58", "remaining_time": "1 day, 6:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5565, "total_steps": 9627, "loss": 1.7851, "learning_rate": 3.7860636179099153e-05, "epoch": 0.5780617014646308, "percentage": 57.81, "elapsed_time": "1 day, 18:16:25", "remaining_time": "1 day, 6:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5566, "total_steps": 9627, "loss": 1.7522, "learning_rate": 3.784480845348886e-05, "epoch": 0.578165575984211, "percentage": 57.82, "elapsed_time": "1 day, 18:16:54", "remaining_time": "1 day, 6:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5567, "total_steps": 9627, "loss": 1.6278, "learning_rate": 3.7828982022311645e-05, "epoch": 0.5782694505037914, "percentage": 57.83, "elapsed_time": "1 day, 18:17:22", "remaining_time": "1 day, 6:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5568, "total_steps": 9627, "loss": 1.566, "learning_rate": 3.7813156887252896e-05, "epoch": 0.5783733250233718, "percentage": 57.84, "elapsed_time": "1 day, 18:17:50", "remaining_time": "1 day, 6:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5569, "total_steps": 9627, "loss": 1.6743, "learning_rate": 3.77973330499979e-05, "epoch": 0.5784771995429521, "percentage": 57.85, "elapsed_time": "1 day, 18:18:19", "remaining_time": "1 day, 6:49:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5570, "total_steps": 9627, "loss": 1.6308, "learning_rate": 3.778151051223173e-05, "epoch": 0.5785810740625325, "percentage": 57.86, "elapsed_time": "1 day, 18:18:47", "remaining_time": "1 day, 6:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5571, "total_steps": 9627, "loss": 1.6298, "learning_rate": 3.7765689275639374e-05, "epoch": 0.5786849485821128, "percentage": 57.87, "elapsed_time": "1 day, 18:19:15", "remaining_time": "1 day, 6:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5572, "total_steps": 9627, "loss": 1.7289, "learning_rate": 3.774986934190571e-05, "epoch": 0.5787888231016931, "percentage": 57.88, "elapsed_time": "1 day, 18:19:43", "remaining_time": "1 day, 6:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5573, "total_steps": 9627, "loss": 1.7287, "learning_rate": 3.7734050712715394e-05, "epoch": 0.5788926976212735, "percentage": 57.89, "elapsed_time": "1 day, 18:20:11", "remaining_time": "1 day, 6:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5574, "total_steps": 9627, "loss": 1.4959, "learning_rate": 3.7718233389752986e-05, "epoch": 0.5789965721408539, "percentage": 57.9, "elapsed_time": "1 day, 18:20:40", "remaining_time": "1 day, 6:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5575, "total_steps": 9627, "loss": 1.669, "learning_rate": 3.770241737470295e-05, "epoch": 0.5791004466604341, "percentage": 57.91, "elapsed_time": "1 day, 18:21:08", "remaining_time": "1 day, 6:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5576, "total_steps": 9627, "loss": 1.8687, "learning_rate": 3.7686602669249505e-05, "epoch": 0.5792043211800145, "percentage": 57.92, "elapsed_time": "1 day, 18:21:36", "remaining_time": "1 day, 6:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5577, "total_steps": 9627, "loss": 1.6422, "learning_rate": 3.767078927507683e-05, "epoch": 0.5793081956995949, "percentage": 57.93, "elapsed_time": "1 day, 18:22:04", "remaining_time": "1 day, 6:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5578, "total_steps": 9627, "loss": 1.7986, "learning_rate": 3.765497719386894e-05, "epoch": 0.5794120702191753, "percentage": 57.94, "elapsed_time": "1 day, 18:22:33", "remaining_time": "1 day, 6:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5579, "total_steps": 9627, "loss": 1.52, "learning_rate": 3.763916642730969e-05, "epoch": 0.5795159447387556, "percentage": 57.95, "elapsed_time": "1 day, 18:23:00", "remaining_time": "1 day, 6:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5580, "total_steps": 9627, "loss": 1.8281, "learning_rate": 3.762335697708279e-05, "epoch": 0.5796198192583359, "percentage": 57.96, "elapsed_time": "1 day, 18:23:29", "remaining_time": "1 day, 6:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5581, "total_steps": 9627, "loss": 1.7839, "learning_rate": 3.760754884487182e-05, "epoch": 0.5797236937779163, "percentage": 57.97, "elapsed_time": "1 day, 18:23:57", "remaining_time": "1 day, 6:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5582, "total_steps": 9627, "loss": 1.643, "learning_rate": 3.759174203236025e-05, "epoch": 0.5798275682974966, "percentage": 57.98, "elapsed_time": "1 day, 18:24:26", "remaining_time": "1 day, 6:43:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5583, "total_steps": 9627, "loss": 1.8582, "learning_rate": 3.757593654123135e-05, "epoch": 0.579931442817077, "percentage": 57.99, "elapsed_time": "1 day, 18:24:54", "remaining_time": "1 day, 6:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5584, "total_steps": 9627, "loss": 1.7523, "learning_rate": 3.75601323731683e-05, "epoch": 0.5800353173366574, "percentage": 58.0, "elapsed_time": "1 day, 18:25:22", "remaining_time": "1 day, 6:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5585, "total_steps": 9627, "loss": 1.6175, "learning_rate": 3.754432952985413e-05, "epoch": 0.5801391918562376, "percentage": 58.01, "elapsed_time": "1 day, 18:25:51", "remaining_time": "1 day, 6:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5586, "total_steps": 9627, "loss": 1.7074, "learning_rate": 3.7528528012971694e-05, "epoch": 0.580243066375818, "percentage": 58.02, "elapsed_time": "1 day, 18:26:19", "remaining_time": "1 day, 6:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5587, "total_steps": 9627, "loss": 1.6747, "learning_rate": 3.7512727824203754e-05, "epoch": 0.5803469408953984, "percentage": 58.03, "elapsed_time": "1 day, 18:26:47", "remaining_time": "1 day, 6:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5588, "total_steps": 9627, "loss": 1.6918, "learning_rate": 3.7496928965232905e-05, "epoch": 0.5804508154149787, "percentage": 58.05, "elapsed_time": "1 day, 18:27:16", "remaining_time": "1 day, 6:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5589, "total_steps": 9627, "loss": 1.5046, "learning_rate": 3.7481131437741566e-05, "epoch": 0.580554689934559, "percentage": 58.06, "elapsed_time": "1 day, 18:27:43", "remaining_time": "1 day, 6:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5590, "total_steps": 9627, "loss": 1.4811, "learning_rate": 3.746533524341208e-05, "epoch": 0.5806585644541394, "percentage": 58.07, "elapsed_time": "1 day, 18:28:12", "remaining_time": "1 day, 6:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5591, "total_steps": 9627, "loss": 1.6301, "learning_rate": 3.7449540383926646e-05, "epoch": 0.5807624389737197, "percentage": 58.08, "elapsed_time": "1 day, 18:28:39", "remaining_time": "1 day, 6:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5592, "total_steps": 9627, "loss": 1.6732, "learning_rate": 3.7433746860967235e-05, "epoch": 0.5808663134933001, "percentage": 58.09, "elapsed_time": "1 day, 18:29:09", "remaining_time": "1 day, 6:39:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5593, "total_steps": 9627, "loss": 1.4708, "learning_rate": 3.741795467621578e-05, "epoch": 0.5809701880128805, "percentage": 58.1, "elapsed_time": "1 day, 18:29:36", "remaining_time": "1 day, 6:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5594, "total_steps": 9627, "loss": 1.647, "learning_rate": 3.7402163831354e-05, "epoch": 0.5810740625324607, "percentage": 58.11, "elapsed_time": "1 day, 18:30:05", "remaining_time": "1 day, 6:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5595, "total_steps": 9627, "loss": 1.5459, "learning_rate": 3.738637432806351e-05, "epoch": 0.5811779370520411, "percentage": 58.12, "elapsed_time": "1 day, 18:30:33", "remaining_time": "1 day, 6:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5596, "total_steps": 9627, "loss": 1.6415, "learning_rate": 3.737058616802575e-05, "epoch": 0.5812818115716215, "percentage": 58.13, "elapsed_time": "1 day, 18:31:02", "remaining_time": "1 day, 6:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5597, "total_steps": 9627, "loss": 1.4745, "learning_rate": 3.735479935292208e-05, "epoch": 0.5813856860912018, "percentage": 58.14, "elapsed_time": "1 day, 18:31:29", "remaining_time": "1 day, 6:37:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5598, "total_steps": 9627, "loss": 1.6336, "learning_rate": 3.733901388443361e-05, "epoch": 0.5814895606107822, "percentage": 58.15, "elapsed_time": "1 day, 18:31:57", "remaining_time": "1 day, 6:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5599, "total_steps": 9627, "loss": 1.4979, "learning_rate": 3.732322976424141e-05, "epoch": 0.5815934351303625, "percentage": 58.16, "elapsed_time": "1 day, 18:32:25", "remaining_time": "1 day, 6:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5600, "total_steps": 9627, "loss": 1.826, "learning_rate": 3.7307446994026375e-05, "epoch": 0.5816973096499428, "percentage": 58.17, "elapsed_time": "1 day, 18:32:54", "remaining_time": "1 day, 6:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5601, "total_steps": 9627, "loss": 2.0605, "learning_rate": 3.7291665575469216e-05, "epoch": 0.5818011841695232, "percentage": 58.18, "elapsed_time": "1 day, 18:33:21", "remaining_time": "1 day, 6:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5602, "total_steps": 9627, "loss": 1.6777, "learning_rate": 3.727588551025053e-05, "epoch": 0.5819050586891036, "percentage": 58.19, "elapsed_time": "1 day, 18:33:50", "remaining_time": "1 day, 6:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5603, "total_steps": 9627, "loss": 1.6875, "learning_rate": 3.72601068000508e-05, "epoch": 0.582008933208684, "percentage": 58.2, "elapsed_time": "1 day, 18:34:19", "remaining_time": "1 day, 6:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5604, "total_steps": 9627, "loss": 1.7246, "learning_rate": 3.724432944655033e-05, "epoch": 0.5821128077282642, "percentage": 58.21, "elapsed_time": "1 day, 18:34:47", "remaining_time": "1 day, 6:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5605, "total_steps": 9627, "loss": 1.7337, "learning_rate": 3.722855345142926e-05, "epoch": 0.5822166822478446, "percentage": 58.22, "elapsed_time": "1 day, 18:35:15", "remaining_time": "1 day, 6:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5606, "total_steps": 9627, "loss": 1.8097, "learning_rate": 3.721277881636764e-05, "epoch": 0.582320556767425, "percentage": 58.23, "elapsed_time": "1 day, 18:35:43", "remaining_time": "1 day, 6:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5607, "total_steps": 9627, "loss": 1.5108, "learning_rate": 3.719700554304533e-05, "epoch": 0.5824244312870053, "percentage": 58.24, "elapsed_time": "1 day, 18:36:12", "remaining_time": "1 day, 6:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5608, "total_steps": 9627, "loss": 1.541, "learning_rate": 3.718123363314206e-05, "epoch": 0.5825283058065857, "percentage": 58.25, "elapsed_time": "1 day, 18:36:40", "remaining_time": "1 day, 6:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5609, "total_steps": 9627, "loss": 1.7062, "learning_rate": 3.7165463088337406e-05, "epoch": 0.582632180326166, "percentage": 58.26, "elapsed_time": "1 day, 18:37:08", "remaining_time": "1 day, 6:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5610, "total_steps": 9627, "loss": 1.6754, "learning_rate": 3.714969391031084e-05, "epoch": 0.5827360548457463, "percentage": 58.27, "elapsed_time": "1 day, 18:37:37", "remaining_time": "1 day, 6:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5611, "total_steps": 9627, "loss": 1.6984, "learning_rate": 3.713392610074162e-05, "epoch": 0.5828399293653267, "percentage": 58.28, "elapsed_time": "1 day, 18:38:05", "remaining_time": "1 day, 6:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5612, "total_steps": 9627, "loss": 1.4976, "learning_rate": 3.7118159661308906e-05, "epoch": 0.5829438038849071, "percentage": 58.29, "elapsed_time": "1 day, 18:38:32", "remaining_time": "1 day, 6:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5613, "total_steps": 9627, "loss": 1.5536, "learning_rate": 3.7102394593691724e-05, "epoch": 0.5830476784044873, "percentage": 58.3, "elapsed_time": "1 day, 18:39:01", "remaining_time": "1 day, 6:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5614, "total_steps": 9627, "loss": 1.8147, "learning_rate": 3.7086630899568906e-05, "epoch": 0.5831515529240677, "percentage": 58.32, "elapsed_time": "1 day, 18:39:30", "remaining_time": "1 day, 6:29:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5615, "total_steps": 9627, "loss": 1.934, "learning_rate": 3.707086858061917e-05, "epoch": 0.5832554274436481, "percentage": 58.33, "elapsed_time": "1 day, 18:39:58", "remaining_time": "1 day, 6:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5616, "total_steps": 9627, "loss": 1.6462, "learning_rate": 3.7055107638521086e-05, "epoch": 0.5833593019632284, "percentage": 58.34, "elapsed_time": "1 day, 18:40:26", "remaining_time": "1 day, 6:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5617, "total_steps": 9627, "loss": 1.6508, "learning_rate": 3.703934807495305e-05, "epoch": 0.5834631764828088, "percentage": 58.35, "elapsed_time": "1 day, 18:40:54", "remaining_time": "1 day, 6:28:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5618, "total_steps": 9627, "loss": 1.9211, "learning_rate": 3.7023589891593344e-05, "epoch": 0.5835670510023891, "percentage": 58.36, "elapsed_time": "1 day, 18:41:23", "remaining_time": "1 day, 6:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5619, "total_steps": 9627, "loss": 1.7667, "learning_rate": 3.7007833090120116e-05, "epoch": 0.5836709255219694, "percentage": 58.37, "elapsed_time": "1 day, 18:41:51", "remaining_time": "1 day, 6:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5620, "total_steps": 9627, "loss": 1.4863, "learning_rate": 3.69920776722113e-05, "epoch": 0.5837748000415498, "percentage": 58.38, "elapsed_time": "1 day, 18:42:20", "remaining_time": "1 day, 6:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5621, "total_steps": 9627, "loss": 1.7431, "learning_rate": 3.697632363954475e-05, "epoch": 0.5838786745611302, "percentage": 58.39, "elapsed_time": "1 day, 18:42:48", "remaining_time": "1 day, 6:26:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5622, "total_steps": 9627, "loss": 1.6647, "learning_rate": 3.696057099379816e-05, "epoch": 0.5839825490807105, "percentage": 58.4, "elapsed_time": "1 day, 18:43:17", "remaining_time": "1 day, 6:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5623, "total_steps": 9627, "loss": 1.4736, "learning_rate": 3.694481973664904e-05, "epoch": 0.5840864236002908, "percentage": 58.41, "elapsed_time": "1 day, 18:43:45", "remaining_time": "1 day, 6:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5624, "total_steps": 9627, "loss": 1.6726, "learning_rate": 3.6929069869774766e-05, "epoch": 0.5841902981198712, "percentage": 58.42, "elapsed_time": "1 day, 18:44:12", "remaining_time": "1 day, 6:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5625, "total_steps": 9627, "loss": 1.7569, "learning_rate": 3.6913321394852616e-05, "epoch": 0.5842941726394515, "percentage": 58.43, "elapsed_time": "1 day, 18:44:41", "remaining_time": "1 day, 6:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5626, "total_steps": 9627, "loss": 1.7056, "learning_rate": 3.689757431355964e-05, "epoch": 0.5843980471590319, "percentage": 58.44, "elapsed_time": "1 day, 18:45:10", "remaining_time": "1 day, 6:24:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5627, "total_steps": 9627, "loss": 1.7895, "learning_rate": 3.68818286275728e-05, "epoch": 0.5845019216786123, "percentage": 58.45, "elapsed_time": "1 day, 18:45:38", "remaining_time": "1 day, 6:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5628, "total_steps": 9627, "loss": 1.7048, "learning_rate": 3.686608433856891e-05, "epoch": 0.5846057961981925, "percentage": 58.46, "elapsed_time": "1 day, 18:46:05", "remaining_time": "1 day, 6:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5629, "total_steps": 9627, "loss": 1.6414, "learning_rate": 3.6850341448224574e-05, "epoch": 0.5847096707177729, "percentage": 58.47, "elapsed_time": "1 day, 18:46:35", "remaining_time": "1 day, 6:22:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5630, "total_steps": 9627, "loss": 1.7855, "learning_rate": 3.6834599958216286e-05, "epoch": 0.5848135452373533, "percentage": 58.48, "elapsed_time": "1 day, 18:47:02", "remaining_time": "1 day, 6:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5631, "total_steps": 9627, "loss": 1.8118, "learning_rate": 3.6818859870220415e-05, "epoch": 0.5849174197569337, "percentage": 58.49, "elapsed_time": "1 day, 18:47:31", "remaining_time": "1 day, 6:22:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5632, "total_steps": 9627, "loss": 1.6769, "learning_rate": 3.680312118591317e-05, "epoch": 0.585021294276514, "percentage": 58.5, "elapsed_time": "1 day, 18:47:58", "remaining_time": "1 day, 6:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5633, "total_steps": 9627, "loss": 1.6765, "learning_rate": 3.6787383906970564e-05, "epoch": 0.5851251687960943, "percentage": 58.51, "elapsed_time": "1 day, 18:48:28", "remaining_time": "1 day, 6:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5634, "total_steps": 9627, "loss": 1.6958, "learning_rate": 3.677164803506851e-05, "epoch": 0.5852290433156747, "percentage": 58.52, "elapsed_time": "1 day, 18:48:56", "remaining_time": "1 day, 6:20:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5635, "total_steps": 9627, "loss": 1.6542, "learning_rate": 3.675591357188276e-05, "epoch": 0.585332917835255, "percentage": 58.53, "elapsed_time": "1 day, 18:49:24", "remaining_time": "1 day, 6:20:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5636, "total_steps": 9627, "loss": 1.802, "learning_rate": 3.6740180519088905e-05, "epoch": 0.5854367923548354, "percentage": 58.54, "elapsed_time": "1 day, 18:49:52", "remaining_time": "1 day, 6:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5637, "total_steps": 9627, "loss": 1.4738, "learning_rate": 3.672444887836239e-05, "epoch": 0.5855406668744157, "percentage": 58.55, "elapsed_time": "1 day, 18:50:20", "remaining_time": "1 day, 6:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5638, "total_steps": 9627, "loss": 1.522, "learning_rate": 3.6708718651378534e-05, "epoch": 0.585644541393996, "percentage": 58.56, "elapsed_time": "1 day, 18:50:48", "remaining_time": "1 day, 6:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5639, "total_steps": 9627, "loss": 1.6182, "learning_rate": 3.6692989839812444e-05, "epoch": 0.5857484159135764, "percentage": 58.57, "elapsed_time": "1 day, 18:51:16", "remaining_time": "1 day, 6:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5640, "total_steps": 9627, "loss": 1.6908, "learning_rate": 3.667726244533913e-05, "epoch": 0.5858522904331568, "percentage": 58.59, "elapsed_time": "1 day, 18:51:45", "remaining_time": "1 day, 6:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5641, "total_steps": 9627, "loss": 1.5382, "learning_rate": 3.6661536469633474e-05, "epoch": 0.5859561649527371, "percentage": 58.6, "elapsed_time": "1 day, 18:52:13", "remaining_time": "1 day, 6:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5642, "total_steps": 9627, "loss": 1.683, "learning_rate": 3.6645811914370126e-05, "epoch": 0.5860600394723174, "percentage": 58.61, "elapsed_time": "1 day, 18:52:41", "remaining_time": "1 day, 6:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5643, "total_steps": 9627, "loss": 1.6154, "learning_rate": 3.663008878122364e-05, "epoch": 0.5861639139918978, "percentage": 58.62, "elapsed_time": "1 day, 18:53:09", "remaining_time": "1 day, 6:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5644, "total_steps": 9627, "loss": 1.8497, "learning_rate": 3.661436707186842e-05, "epoch": 0.5862677885114781, "percentage": 58.63, "elapsed_time": "1 day, 18:53:38", "remaining_time": "1 day, 6:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5645, "total_steps": 9627, "loss": 1.6919, "learning_rate": 3.6598646787978676e-05, "epoch": 0.5863716630310585, "percentage": 58.64, "elapsed_time": "1 day, 18:54:05", "remaining_time": "1 day, 6:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5646, "total_steps": 9627, "loss": 1.6516, "learning_rate": 3.6582927931228516e-05, "epoch": 0.5864755375506389, "percentage": 58.65, "elapsed_time": "1 day, 18:54:34", "remaining_time": "1 day, 6:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5647, "total_steps": 9627, "loss": 1.7285, "learning_rate": 3.656721050329189e-05, "epoch": 0.5865794120702191, "percentage": 58.66, "elapsed_time": "1 day, 18:55:02", "remaining_time": "1 day, 6:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5648, "total_steps": 9627, "loss": 1.6571, "learning_rate": 3.6551494505842554e-05, "epoch": 0.5866832865897995, "percentage": 58.67, "elapsed_time": "1 day, 18:55:31", "remaining_time": "1 day, 6:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5649, "total_steps": 9627, "loss": 1.6641, "learning_rate": 3.653577994055416e-05, "epoch": 0.5867871611093799, "percentage": 58.68, "elapsed_time": "1 day, 18:55:58", "remaining_time": "1 day, 6:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5650, "total_steps": 9627, "loss": 1.5068, "learning_rate": 3.652006680910017e-05, "epoch": 0.5868910356289602, "percentage": 58.69, "elapsed_time": "1 day, 18:56:27", "remaining_time": "1 day, 6:13:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5651, "total_steps": 9627, "loss": 1.7859, "learning_rate": 3.650435511315392e-05, "epoch": 0.5869949101485405, "percentage": 58.7, "elapsed_time": "1 day, 18:56:54", "remaining_time": "1 day, 6:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5652, "total_steps": 9627, "loss": 1.5551, "learning_rate": 3.6488644854388577e-05, "epoch": 0.5870987846681209, "percentage": 58.71, "elapsed_time": "1 day, 18:57:22", "remaining_time": "1 day, 6:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5653, "total_steps": 9627, "loss": 1.8654, "learning_rate": 3.647293603447718e-05, "epoch": 0.5872026591877012, "percentage": 58.72, "elapsed_time": "1 day, 18:57:51", "remaining_time": "1 day, 6:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5654, "total_steps": 9627, "loss": 1.6824, "learning_rate": 3.6457228655092554e-05, "epoch": 0.5873065337072816, "percentage": 58.73, "elapsed_time": "1 day, 18:58:19", "remaining_time": "1 day, 6:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5655, "total_steps": 9627, "loss": 1.7669, "learning_rate": 3.6441522717907443e-05, "epoch": 0.587410408226862, "percentage": 58.74, "elapsed_time": "1 day, 18:58:47", "remaining_time": "1 day, 6:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5656, "total_steps": 9627, "loss": 1.7688, "learning_rate": 3.642581822459441e-05, "epoch": 0.5875142827464424, "percentage": 58.75, "elapsed_time": "1 day, 18:59:14", "remaining_time": "1 day, 6:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5657, "total_steps": 9627, "loss": 1.6345, "learning_rate": 3.641011517682588e-05, "epoch": 0.5876181572660226, "percentage": 58.76, "elapsed_time": "1 day, 18:59:43", "remaining_time": "1 day, 6:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5658, "total_steps": 9627, "loss": 1.6559, "learning_rate": 3.639441357627404e-05, "epoch": 0.587722031785603, "percentage": 58.77, "elapsed_time": "1 day, 19:00:11", "remaining_time": "1 day, 6:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5659, "total_steps": 9627, "loss": 1.6813, "learning_rate": 3.637871342461103e-05, "epoch": 0.5878259063051834, "percentage": 58.78, "elapsed_time": "1 day, 19:00:40", "remaining_time": "1 day, 6:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5660, "total_steps": 9627, "loss": 1.7832, "learning_rate": 3.6363014723508813e-05, "epoch": 0.5879297808247637, "percentage": 58.79, "elapsed_time": "1 day, 19:01:08", "remaining_time": "1 day, 6:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5661, "total_steps": 9627, "loss": 1.6288, "learning_rate": 3.634731747463913e-05, "epoch": 0.588033655344344, "percentage": 58.8, "elapsed_time": "1 day, 19:01:36", "remaining_time": "1 day, 6:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5662, "total_steps": 9627, "loss": 1.6388, "learning_rate": 3.633162167967366e-05, "epoch": 0.5881375298639244, "percentage": 58.81, "elapsed_time": "1 day, 19:02:04", "remaining_time": "1 day, 6:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5663, "total_steps": 9627, "loss": 1.6475, "learning_rate": 3.6315927340283855e-05, "epoch": 0.5882414043835047, "percentage": 58.82, "elapsed_time": "1 day, 19:02:33", "remaining_time": "1 day, 6:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5664, "total_steps": 9627, "loss": 1.7276, "learning_rate": 3.630023445814106e-05, "epoch": 0.5883452789030851, "percentage": 58.83, "elapsed_time": "1 day, 19:03:01", "remaining_time": "1 day, 6:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5665, "total_steps": 9627, "loss": 1.449, "learning_rate": 3.6284543034916405e-05, "epoch": 0.5884491534226655, "percentage": 58.84, "elapsed_time": "1 day, 19:03:30", "remaining_time": "1 day, 6:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5666, "total_steps": 9627, "loss": 1.692, "learning_rate": 3.6268853072280966e-05, "epoch": 0.5885530279422457, "percentage": 58.86, "elapsed_time": "1 day, 19:03:57", "remaining_time": "1 day, 6:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5667, "total_steps": 9627, "loss": 1.7896, "learning_rate": 3.625316457190555e-05, "epoch": 0.5886569024618261, "percentage": 58.87, "elapsed_time": "1 day, 19:04:26", "remaining_time": "1 day, 6:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5668, "total_steps": 9627, "loss": 1.8176, "learning_rate": 3.623747753546086e-05, "epoch": 0.5887607769814065, "percentage": 58.88, "elapsed_time": "1 day, 19:04:53", "remaining_time": "1 day, 6:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5669, "total_steps": 9627, "loss": 1.7778, "learning_rate": 3.62217919646175e-05, "epoch": 0.5888646515009868, "percentage": 58.89, "elapsed_time": "1 day, 19:05:22", "remaining_time": "1 day, 6:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5670, "total_steps": 9627, "loss": 1.8, "learning_rate": 3.6206107861045804e-05, "epoch": 0.5889685260205672, "percentage": 58.9, "elapsed_time": "1 day, 19:05:49", "remaining_time": "1 day, 6:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5671, "total_steps": 9627, "loss": 1.4904, "learning_rate": 3.619042522641601e-05, "epoch": 0.5890724005401475, "percentage": 58.91, "elapsed_time": "1 day, 19:06:19", "remaining_time": "1 day, 6:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5672, "total_steps": 9627, "loss": 1.6863, "learning_rate": 3.617474406239824e-05, "epoch": 0.5891762750597278, "percentage": 58.92, "elapsed_time": "1 day, 19:06:46", "remaining_time": "1 day, 6:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5673, "total_steps": 9627, "loss": 1.5951, "learning_rate": 3.615906437066236e-05, "epoch": 0.5892801495793082, "percentage": 58.93, "elapsed_time": "1 day, 19:07:15", "remaining_time": "1 day, 6:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5674, "total_steps": 9627, "loss": 1.5416, "learning_rate": 3.614338615287816e-05, "epoch": 0.5893840240988886, "percentage": 58.94, "elapsed_time": "1 day, 19:07:43", "remaining_time": "1 day, 6:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5675, "total_steps": 9627, "loss": 1.6345, "learning_rate": 3.612770941071527e-05, "epoch": 0.5894878986184688, "percentage": 58.95, "elapsed_time": "1 day, 19:08:11", "remaining_time": "1 day, 6:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5676, "total_steps": 9627, "loss": 1.7968, "learning_rate": 3.61120341458431e-05, "epoch": 0.5895917731380492, "percentage": 58.96, "elapsed_time": "1 day, 19:08:39", "remaining_time": "1 day, 6:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5677, "total_steps": 9627, "loss": 1.458, "learning_rate": 3.6096360359930984e-05, "epoch": 0.5896956476576296, "percentage": 58.97, "elapsed_time": "1 day, 19:09:08", "remaining_time": "1 day, 6:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5678, "total_steps": 9627, "loss": 1.8428, "learning_rate": 3.608068805464802e-05, "epoch": 0.5897995221772099, "percentage": 58.98, "elapsed_time": "1 day, 19:09:35", "remaining_time": "1 day, 6:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5679, "total_steps": 9627, "loss": 1.4289, "learning_rate": 3.6065017231663214e-05, "epoch": 0.5899033966967903, "percentage": 58.99, "elapsed_time": "1 day, 19:10:04", "remaining_time": "1 day, 6:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5680, "total_steps": 9627, "loss": 1.7567, "learning_rate": 3.6049347892645356e-05, "epoch": 0.5900072712163706, "percentage": 59.0, "elapsed_time": "1 day, 19:10:33", "remaining_time": "1 day, 6:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5681, "total_steps": 9627, "loss": 1.6062, "learning_rate": 3.603368003926314e-05, "epoch": 0.590111145735951, "percentage": 59.01, "elapsed_time": "1 day, 19:11:00", "remaining_time": "1 day, 5:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5682, "total_steps": 9627, "loss": 1.6996, "learning_rate": 3.601801367318507e-05, "epoch": 0.5902150202555313, "percentage": 59.02, "elapsed_time": "1 day, 19:11:29", "remaining_time": "1 day, 5:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5683, "total_steps": 9627, "loss": 1.6467, "learning_rate": 3.600234879607947e-05, "epoch": 0.5903188947751117, "percentage": 59.03, "elapsed_time": "1 day, 19:11:56", "remaining_time": "1 day, 5:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5684, "total_steps": 9627, "loss": 1.8217, "learning_rate": 3.5986685409614526e-05, "epoch": 0.5904227692946921, "percentage": 59.04, "elapsed_time": "1 day, 19:12:26", "remaining_time": "1 day, 5:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5685, "total_steps": 9627, "loss": 1.7504, "learning_rate": 3.597102351545831e-05, "epoch": 0.5905266438142723, "percentage": 59.05, "elapsed_time": "1 day, 19:12:54", "remaining_time": "1 day, 5:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5686, "total_steps": 9627, "loss": 1.6519, "learning_rate": 3.5955363115278626e-05, "epoch": 0.5906305183338527, "percentage": 59.06, "elapsed_time": "1 day, 19:13:21", "remaining_time": "1 day, 5:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5687, "total_steps": 9627, "loss": 1.6564, "learning_rate": 3.593970421074323e-05, "epoch": 0.5907343928534331, "percentage": 59.07, "elapsed_time": "1 day, 19:13:50", "remaining_time": "1 day, 5:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5688, "total_steps": 9627, "loss": 1.5858, "learning_rate": 3.5924046803519675e-05, "epoch": 0.5908382673730134, "percentage": 59.08, "elapsed_time": "1 day, 19:14:18", "remaining_time": "1 day, 5:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5689, "total_steps": 9627, "loss": 1.6495, "learning_rate": 3.590839089527531e-05, "epoch": 0.5909421418925938, "percentage": 59.09, "elapsed_time": "1 day, 19:14:46", "remaining_time": "1 day, 5:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5690, "total_steps": 9627, "loss": 1.6129, "learning_rate": 3.589273648767742e-05, "epoch": 0.5910460164121741, "percentage": 59.1, "elapsed_time": "1 day, 19:15:15", "remaining_time": "1 day, 5:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5691, "total_steps": 9627, "loss": 1.7354, "learning_rate": 3.5877083582393044e-05, "epoch": 0.5911498909317544, "percentage": 59.11, "elapsed_time": "1 day, 19:15:42", "remaining_time": "1 day, 5:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5692, "total_steps": 9627, "loss": 1.891, "learning_rate": 3.586143218108911e-05, "epoch": 0.5912537654513348, "percentage": 59.13, "elapsed_time": "1 day, 19:16:10", "remaining_time": "1 day, 5:54:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5693, "total_steps": 9627, "loss": 1.6225, "learning_rate": 3.584578228543235e-05, "epoch": 0.5913576399709152, "percentage": 59.14, "elapsed_time": "1 day, 19:16:39", "remaining_time": "1 day, 5:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5694, "total_steps": 9627, "loss": 1.671, "learning_rate": 3.5830133897089394e-05, "epoch": 0.5914615144904954, "percentage": 59.15, "elapsed_time": "1 day, 19:17:06", "remaining_time": "1 day, 5:53:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5695, "total_steps": 9627, "loss": 1.648, "learning_rate": 3.5814487017726616e-05, "epoch": 0.5915653890100758, "percentage": 59.16, "elapsed_time": "1 day, 19:17:35", "remaining_time": "1 day, 5:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5696, "total_steps": 9627, "loss": 1.8003, "learning_rate": 3.579884164901033e-05, "epoch": 0.5916692635296562, "percentage": 59.17, "elapsed_time": "1 day, 19:18:04", "remaining_time": "1 day, 5:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5697, "total_steps": 9627, "loss": 1.7439, "learning_rate": 3.5783197792606654e-05, "epoch": 0.5917731380492365, "percentage": 59.18, "elapsed_time": "1 day, 19:18:31", "remaining_time": "1 day, 5:52:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5698, "total_steps": 9627, "loss": 1.6194, "learning_rate": 3.576755545018151e-05, "epoch": 0.5918770125688169, "percentage": 59.19, "elapsed_time": "1 day, 19:19:00", "remaining_time": "1 day, 5:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5699, "total_steps": 9627, "loss": 1.599, "learning_rate": 3.5751914623400675e-05, "epoch": 0.5919808870883972, "percentage": 59.2, "elapsed_time": "1 day, 19:19:28", "remaining_time": "1 day, 5:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5700, "total_steps": 9627, "loss": 1.8195, "learning_rate": 3.573627531392982e-05, "epoch": 0.5920847616079775, "percentage": 59.21, "elapsed_time": "1 day, 19:19:57", "remaining_time": "1 day, 5:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5701, "total_steps": 9627, "loss": 1.6844, "learning_rate": 3.572063752343436e-05, "epoch": 0.5921886361275579, "percentage": 59.22, "elapsed_time": "1 day, 19:20:24", "remaining_time": "1 day, 5:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5702, "total_steps": 9627, "loss": 1.652, "learning_rate": 3.5705001253579615e-05, "epoch": 0.5922925106471383, "percentage": 59.23, "elapsed_time": "1 day, 19:20:53", "remaining_time": "1 day, 5:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5703, "total_steps": 9627, "loss": 1.6053, "learning_rate": 3.568936650603076e-05, "epoch": 0.5923963851667186, "percentage": 59.24, "elapsed_time": "1 day, 19:21:20", "remaining_time": "1 day, 5:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5704, "total_steps": 9627, "loss": 1.3555, "learning_rate": 3.5673733282452725e-05, "epoch": 0.5925002596862989, "percentage": 59.25, "elapsed_time": "1 day, 19:21:49", "remaining_time": "1 day, 5:49:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5705, "total_steps": 9627, "loss": 1.7809, "learning_rate": 3.565810158451036e-05, "epoch": 0.5926041342058793, "percentage": 59.26, "elapsed_time": "1 day, 19:22:18", "remaining_time": "1 day, 5:49:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5706, "total_steps": 9627, "loss": 1.903, "learning_rate": 3.5642471413868305e-05, "epoch": 0.5927080087254596, "percentage": 59.27, "elapsed_time": "1 day, 19:22:46", "remaining_time": "1 day, 5:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5707, "total_steps": 9627, "loss": 1.5994, "learning_rate": 3.562684277219104e-05, "epoch": 0.59281188324504, "percentage": 59.28, "elapsed_time": "1 day, 19:23:13", "remaining_time": "1 day, 5:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5708, "total_steps": 9627, "loss": 1.8916, "learning_rate": 3.5611215661142897e-05, "epoch": 0.5929157577646204, "percentage": 59.29, "elapsed_time": "1 day, 19:23:43", "remaining_time": "1 day, 5:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5709, "total_steps": 9627, "loss": 1.4593, "learning_rate": 3.559559008238805e-05, "epoch": 0.5930196322842007, "percentage": 59.3, "elapsed_time": "1 day, 19:24:09", "remaining_time": "1 day, 5:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5710, "total_steps": 9627, "loss": 1.7235, "learning_rate": 3.5579966037590524e-05, "epoch": 0.593123506803781, "percentage": 59.31, "elapsed_time": "1 day, 19:24:38", "remaining_time": "1 day, 5:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5711, "total_steps": 9627, "loss": 1.631, "learning_rate": 3.556434352841411e-05, "epoch": 0.5932273813233614, "percentage": 59.32, "elapsed_time": "1 day, 19:25:07", "remaining_time": "1 day, 5:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5712, "total_steps": 9627, "loss": 1.8386, "learning_rate": 3.554872255652252e-05, "epoch": 0.5933312558429418, "percentage": 59.33, "elapsed_time": "1 day, 19:25:35", "remaining_time": "1 day, 5:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5713, "total_steps": 9627, "loss": 1.838, "learning_rate": 3.553310312357927e-05, "epoch": 0.593435130362522, "percentage": 59.34, "elapsed_time": "1 day, 19:26:02", "remaining_time": "1 day, 5:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5714, "total_steps": 9627, "loss": 1.7349, "learning_rate": 3.551748523124766e-05, "epoch": 0.5935390048821024, "percentage": 59.35, "elapsed_time": "1 day, 19:26:32", "remaining_time": "1 day, 5:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5715, "total_steps": 9627, "loss": 1.6032, "learning_rate": 3.550186888119091e-05, "epoch": 0.5936428794016828, "percentage": 59.36, "elapsed_time": "1 day, 19:26:59", "remaining_time": "1 day, 5:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5716, "total_steps": 9627, "loss": 1.8558, "learning_rate": 3.5486254075072056e-05, "epoch": 0.5937467539212631, "percentage": 59.37, "elapsed_time": "1 day, 19:27:27", "remaining_time": "1 day, 5:44:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5717, "total_steps": 9627, "loss": 1.7783, "learning_rate": 3.547064081455391e-05, "epoch": 0.5938506284408435, "percentage": 59.39, "elapsed_time": "1 day, 19:27:55", "remaining_time": "1 day, 5:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5718, "total_steps": 9627, "loss": 1.4527, "learning_rate": 3.5455029101299196e-05, "epoch": 0.5939545029604238, "percentage": 59.4, "elapsed_time": "1 day, 19:28:23", "remaining_time": "1 day, 5:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5719, "total_steps": 9627, "loss": 1.8712, "learning_rate": 3.5439418936970425e-05, "epoch": 0.5940583774800041, "percentage": 59.41, "elapsed_time": "1 day, 19:28:52", "remaining_time": "1 day, 5:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5720, "total_steps": 9627, "loss": 1.548, "learning_rate": 3.542381032322997e-05, "epoch": 0.5941622519995845, "percentage": 59.42, "elapsed_time": "1 day, 19:29:20", "remaining_time": "1 day, 5:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5721, "total_steps": 9627, "loss": 1.5979, "learning_rate": 3.540820326173999e-05, "epoch": 0.5942661265191649, "percentage": 59.43, "elapsed_time": "1 day, 19:29:49", "remaining_time": "1 day, 5:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5722, "total_steps": 9627, "loss": 1.7001, "learning_rate": 3.539259775416257e-05, "epoch": 0.5943700010387452, "percentage": 59.44, "elapsed_time": "1 day, 19:30:17", "remaining_time": "1 day, 5:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5723, "total_steps": 9627, "loss": 1.7146, "learning_rate": 3.537699380215953e-05, "epoch": 0.5944738755583255, "percentage": 59.45, "elapsed_time": "1 day, 19:30:44", "remaining_time": "1 day, 5:40:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5724, "total_steps": 9627, "loss": 1.711, "learning_rate": 3.5361391407392583e-05, "epoch": 0.5945777500779059, "percentage": 59.46, "elapsed_time": "1 day, 19:31:12", "remaining_time": "1 day, 5:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5725, "total_steps": 9627, "loss": 1.9054, "learning_rate": 3.5345790571523286e-05, "epoch": 0.5946816245974862, "percentage": 59.47, "elapsed_time": "1 day, 19:31:41", "remaining_time": "1 day, 5:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5726, "total_steps": 9627, "loss": 1.7314, "learning_rate": 3.5330191296212976e-05, "epoch": 0.5947854991170666, "percentage": 59.48, "elapsed_time": "1 day, 19:32:09", "remaining_time": "1 day, 5:39:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5727, "total_steps": 9627, "loss": 1.8133, "learning_rate": 3.5314593583122854e-05, "epoch": 0.594889373636647, "percentage": 59.49, "elapsed_time": "1 day, 19:32:36", "remaining_time": "1 day, 5:39:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5728, "total_steps": 9627, "loss": 1.7283, "learning_rate": 3.529899743391398e-05, "epoch": 0.5949932481562272, "percentage": 59.5, "elapsed_time": "1 day, 19:33:04", "remaining_time": "1 day, 5:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5729, "total_steps": 9627, "loss": 1.3802, "learning_rate": 3.5283402850247194e-05, "epoch": 0.5950971226758076, "percentage": 59.51, "elapsed_time": "1 day, 19:33:32", "remaining_time": "1 day, 5:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5730, "total_steps": 9627, "loss": 1.6485, "learning_rate": 3.526780983378321e-05, "epoch": 0.595200997195388, "percentage": 59.52, "elapsed_time": "1 day, 19:34:01", "remaining_time": "1 day, 5:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5731, "total_steps": 9627, "loss": 1.793, "learning_rate": 3.5252218386182585e-05, "epoch": 0.5953048717149683, "percentage": 59.53, "elapsed_time": "1 day, 19:34:28", "remaining_time": "1 day, 5:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5732, "total_steps": 9627, "loss": 1.7508, "learning_rate": 3.523662850910564e-05, "epoch": 0.5954087462345486, "percentage": 59.54, "elapsed_time": "1 day, 19:34:57", "remaining_time": "1 day, 5:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5733, "total_steps": 9627, "loss": 1.6849, "learning_rate": 3.5221040204212606e-05, "epoch": 0.595512620754129, "percentage": 59.55, "elapsed_time": "1 day, 19:35:24", "remaining_time": "1 day, 5:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5734, "total_steps": 9627, "loss": 1.6842, "learning_rate": 3.5205453473163506e-05, "epoch": 0.5956164952737094, "percentage": 59.56, "elapsed_time": "1 day, 19:35:53", "remaining_time": "1 day, 5:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5735, "total_steps": 9627, "loss": 1.6491, "learning_rate": 3.518986831761824e-05, "epoch": 0.5957203697932897, "percentage": 59.57, "elapsed_time": "1 day, 19:36:21", "remaining_time": "1 day, 5:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5736, "total_steps": 9627, "loss": 1.8276, "learning_rate": 3.517428473923644e-05, "epoch": 0.5958242443128701, "percentage": 59.58, "elapsed_time": "1 day, 19:36:50", "remaining_time": "1 day, 5:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5737, "total_steps": 9627, "loss": 1.6447, "learning_rate": 3.515870273967767e-05, "epoch": 0.5959281188324504, "percentage": 59.59, "elapsed_time": "1 day, 19:37:18", "remaining_time": "1 day, 5:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5738, "total_steps": 9627, "loss": 1.6278, "learning_rate": 3.514312232060132e-05, "epoch": 0.5960319933520307, "percentage": 59.6, "elapsed_time": "1 day, 19:37:45", "remaining_time": "1 day, 5:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5739, "total_steps": 9627, "loss": 1.7605, "learning_rate": 3.512754348366652e-05, "epoch": 0.5961358678716111, "percentage": 59.61, "elapsed_time": "1 day, 19:38:14", "remaining_time": "1 day, 5:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5740, "total_steps": 9627, "loss": 2.0161, "learning_rate": 3.5111966230532355e-05, "epoch": 0.5962397423911915, "percentage": 59.62, "elapsed_time": "1 day, 19:38:42", "remaining_time": "1 day, 5:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5741, "total_steps": 9627, "loss": 1.6192, "learning_rate": 3.509639056285766e-05, "epoch": 0.5963436169107718, "percentage": 59.63, "elapsed_time": "1 day, 19:39:09", "remaining_time": "1 day, 5:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5742, "total_steps": 9627, "loss": 1.6114, "learning_rate": 3.50808164823011e-05, "epoch": 0.5964474914303521, "percentage": 59.64, "elapsed_time": "1 day, 19:39:38", "remaining_time": "1 day, 5:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5743, "total_steps": 9627, "loss": 1.7771, "learning_rate": 3.5065243990521205e-05, "epoch": 0.5965513659499325, "percentage": 59.66, "elapsed_time": "1 day, 19:40:07", "remaining_time": "1 day, 5:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5744, "total_steps": 9627, "loss": 1.6355, "learning_rate": 3.504967308917635e-05, "epoch": 0.5966552404695128, "percentage": 59.67, "elapsed_time": "1 day, 19:40:35", "remaining_time": "1 day, 5:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5745, "total_steps": 9627, "loss": 1.5866, "learning_rate": 3.5034103779924674e-05, "epoch": 0.5967591149890932, "percentage": 59.68, "elapsed_time": "1 day, 19:41:03", "remaining_time": "1 day, 5:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5746, "total_steps": 9627, "loss": 1.663, "learning_rate": 3.5018536064424224e-05, "epoch": 0.5968629895086736, "percentage": 59.69, "elapsed_time": "1 day, 19:41:30", "remaining_time": "1 day, 5:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5747, "total_steps": 9627, "loss": 1.7701, "learning_rate": 3.500296994433282e-05, "epoch": 0.5969668640282538, "percentage": 59.7, "elapsed_time": "1 day, 19:41:59", "remaining_time": "1 day, 5:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5748, "total_steps": 9627, "loss": 1.5167, "learning_rate": 3.498740542130813e-05, "epoch": 0.5970707385478342, "percentage": 59.71, "elapsed_time": "1 day, 19:42:27", "remaining_time": "1 day, 5:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5749, "total_steps": 9627, "loss": 1.6903, "learning_rate": 3.497184249700766e-05, "epoch": 0.5971746130674146, "percentage": 59.72, "elapsed_time": "1 day, 19:42:55", "remaining_time": "1 day, 5:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5750, "total_steps": 9627, "loss": 1.3562, "learning_rate": 3.495628117308875e-05, "epoch": 0.5972784875869949, "percentage": 59.73, "elapsed_time": "1 day, 19:43:23", "remaining_time": "1 day, 5:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5751, "total_steps": 9627, "loss": 1.6846, "learning_rate": 3.4940721451208535e-05, "epoch": 0.5973823621065752, "percentage": 59.74, "elapsed_time": "1 day, 19:43:51", "remaining_time": "1 day, 5:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5752, "total_steps": 9627, "loss": 1.6667, "learning_rate": 3.4925163333024015e-05, "epoch": 0.5974862366261556, "percentage": 59.75, "elapsed_time": "1 day, 19:44:20", "remaining_time": "1 day, 5:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5753, "total_steps": 9627, "loss": 1.594, "learning_rate": 3.490960682019203e-05, "epoch": 0.5975901111457359, "percentage": 59.76, "elapsed_time": "1 day, 19:44:47", "remaining_time": "1 day, 5:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5754, "total_steps": 9627, "loss": 1.8576, "learning_rate": 3.489405191436921e-05, "epoch": 0.5976939856653163, "percentage": 59.77, "elapsed_time": "1 day, 19:45:16", "remaining_time": "1 day, 5:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5755, "total_steps": 9627, "loss": 1.7881, "learning_rate": 3.487849861721201e-05, "epoch": 0.5977978601848967, "percentage": 59.78, "elapsed_time": "1 day, 19:45:43", "remaining_time": "1 day, 5:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5756, "total_steps": 9627, "loss": 1.5814, "learning_rate": 3.4862946930376775e-05, "epoch": 0.5979017347044769, "percentage": 59.79, "elapsed_time": "1 day, 19:46:12", "remaining_time": "1 day, 5:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5757, "total_steps": 9627, "loss": 1.688, "learning_rate": 3.4847396855519604e-05, "epoch": 0.5980056092240573, "percentage": 59.8, "elapsed_time": "1 day, 19:46:39", "remaining_time": "1 day, 5:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5758, "total_steps": 9627, "loss": 1.7056, "learning_rate": 3.483184839429647e-05, "epoch": 0.5981094837436377, "percentage": 59.81, "elapsed_time": "1 day, 19:47:08", "remaining_time": "1 day, 5:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5759, "total_steps": 9627, "loss": 1.6278, "learning_rate": 3.481630154836317e-05, "epoch": 0.5982133582632181, "percentage": 59.82, "elapsed_time": "1 day, 19:47:36", "remaining_time": "1 day, 5:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5760, "total_steps": 9627, "loss": 1.5913, "learning_rate": 3.4800756319375325e-05, "epoch": 0.5983172327827984, "percentage": 59.83, "elapsed_time": "1 day, 19:48:04", "remaining_time": "1 day, 5:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5761, "total_steps": 9627, "loss": 1.7894, "learning_rate": 3.478521270898838e-05, "epoch": 0.5984211073023787, "percentage": 59.84, "elapsed_time": "1 day, 19:48:32", "remaining_time": "1 day, 5:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5762, "total_steps": 9627, "loss": 1.6332, "learning_rate": 3.476967071885758e-05, "epoch": 0.5985249818219591, "percentage": 59.85, "elapsed_time": "1 day, 19:49:00", "remaining_time": "1 day, 5:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5763, "total_steps": 9627, "loss": 1.6174, "learning_rate": 3.475413035063807e-05, "epoch": 0.5986288563415394, "percentage": 59.86, "elapsed_time": "1 day, 19:49:29", "remaining_time": "1 day, 5:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5764, "total_steps": 9627, "loss": 1.7204, "learning_rate": 3.473859160598474e-05, "epoch": 0.5987327308611198, "percentage": 59.87, "elapsed_time": "1 day, 19:49:57", "remaining_time": "1 day, 5:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5765, "total_steps": 9627, "loss": 1.7932, "learning_rate": 3.4723054486552354e-05, "epoch": 0.5988366053807002, "percentage": 59.88, "elapsed_time": "1 day, 19:50:24", "remaining_time": "1 day, 5:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5766, "total_steps": 9627, "loss": 1.7966, "learning_rate": 3.4707518993995524e-05, "epoch": 0.5989404799002804, "percentage": 59.89, "elapsed_time": "1 day, 19:50:51", "remaining_time": "1 day, 5:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5767, "total_steps": 9627, "loss": 1.6783, "learning_rate": 3.469198512996863e-05, "epoch": 0.5990443544198608, "percentage": 59.9, "elapsed_time": "1 day, 19:51:21", "remaining_time": "1 day, 5:21:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5768, "total_steps": 9627, "loss": 1.5305, "learning_rate": 3.467645289612589e-05, "epoch": 0.5991482289394412, "percentage": 59.91, "elapsed_time": "1 day, 19:51:48", "remaining_time": "1 day, 5:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5769, "total_steps": 9627, "loss": 1.4935, "learning_rate": 3.4660922294121416e-05, "epoch": 0.5992521034590215, "percentage": 59.93, "elapsed_time": "1 day, 19:52:17", "remaining_time": "1 day, 5:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5770, "total_steps": 9627, "loss": 1.5182, "learning_rate": 3.4645393325609046e-05, "epoch": 0.5993559779786019, "percentage": 59.94, "elapsed_time": "1 day, 19:52:44", "remaining_time": "1 day, 5:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5771, "total_steps": 9627, "loss": 1.7623, "learning_rate": 3.462986599224252e-05, "epoch": 0.5994598524981822, "percentage": 59.95, "elapsed_time": "1 day, 19:53:13", "remaining_time": "1 day, 5:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5772, "total_steps": 9627, "loss": 1.5783, "learning_rate": 3.46143402956754e-05, "epoch": 0.5995637270177625, "percentage": 59.96, "elapsed_time": "1 day, 19:53:41", "remaining_time": "1 day, 5:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5773, "total_steps": 9627, "loss": 1.7221, "learning_rate": 3.4598816237561e-05, "epoch": 0.5996676015373429, "percentage": 59.97, "elapsed_time": "1 day, 19:54:09", "remaining_time": "1 day, 5:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5774, "total_steps": 9627, "loss": 1.5198, "learning_rate": 3.4583293819552534e-05, "epoch": 0.5997714760569233, "percentage": 59.98, "elapsed_time": "1 day, 19:54:37", "remaining_time": "1 day, 5:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5775, "total_steps": 9627, "loss": 1.6871, "learning_rate": 3.456777304330303e-05, "epoch": 0.5998753505765035, "percentage": 59.99, "elapsed_time": "1 day, 19:55:04", "remaining_time": "1 day, 5:17:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5776, "total_steps": 9627, "loss": 1.6126, "learning_rate": 3.455225391046533e-05, "epoch": 0.5999792250960839, "percentage": 60.0, "elapsed_time": "1 day, 19:55:32", "remaining_time": "1 day, 5:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5777, "total_steps": 9627, "loss": 1.4743, "learning_rate": 3.4536736422692076e-05, "epoch": 0.6000830996156643, "percentage": 60.01, "elapsed_time": "1 day, 19:56:00", "remaining_time": "1 day, 5:16:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5778, "total_steps": 9627, "loss": 1.4636, "learning_rate": 3.4521220581635785e-05, "epoch": 0.6001869741352446, "percentage": 60.02, "elapsed_time": "1 day, 19:56:28", "remaining_time": "1 day, 5:16:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5779, "total_steps": 9627, "loss": 1.7064, "learning_rate": 3.4505706388948755e-05, "epoch": 0.600290848654825, "percentage": 60.03, "elapsed_time": "1 day, 19:56:56", "remaining_time": "1 day, 5:15:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5780, "total_steps": 9627, "loss": 1.7697, "learning_rate": 3.4490193846283125e-05, "epoch": 0.6003947231744053, "percentage": 60.04, "elapsed_time": "1 day, 19:57:25", "remaining_time": "1 day, 5:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5781, "total_steps": 9627, "loss": 1.7538, "learning_rate": 3.44746829552909e-05, "epoch": 0.6004985976939856, "percentage": 60.05, "elapsed_time": "1 day, 19:57:52", "remaining_time": "1 day, 5:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5782, "total_steps": 9627, "loss": 1.8034, "learning_rate": 3.445917371762382e-05, "epoch": 0.600602472213566, "percentage": 60.06, "elapsed_time": "1 day, 19:58:21", "remaining_time": "1 day, 5:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5783, "total_steps": 9627, "loss": 1.6961, "learning_rate": 3.444366613493351e-05, "epoch": 0.6007063467331464, "percentage": 60.07, "elapsed_time": "1 day, 19:58:49", "remaining_time": "1 day, 5:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5784, "total_steps": 9627, "loss": 1.6964, "learning_rate": 3.4428160208871414e-05, "epoch": 0.6008102212527268, "percentage": 60.08, "elapsed_time": "1 day, 19:59:17", "remaining_time": "1 day, 5:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5785, "total_steps": 9627, "loss": 1.5853, "learning_rate": 3.441265594108881e-05, "epoch": 0.600914095772307, "percentage": 60.09, "elapsed_time": "1 day, 19:59:45", "remaining_time": "1 day, 5:13:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5786, "total_steps": 9627, "loss": 1.5617, "learning_rate": 3.4397153333236735e-05, "epoch": 0.6010179702918874, "percentage": 60.1, "elapsed_time": "1 day, 20:00:13", "remaining_time": "1 day, 5:12:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5787, "total_steps": 9627, "loss": 1.642, "learning_rate": 3.438165238696614e-05, "epoch": 0.6011218448114678, "percentage": 60.11, "elapsed_time": "1 day, 20:00:42", "remaining_time": "1 day, 5:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5788, "total_steps": 9627, "loss": 1.5589, "learning_rate": 3.436615310392773e-05, "epoch": 0.6012257193310481, "percentage": 60.12, "elapsed_time": "1 day, 20:01:09", "remaining_time": "1 day, 5:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5789, "total_steps": 9627, "loss": 1.8877, "learning_rate": 3.4350655485772074e-05, "epoch": 0.6013295938506285, "percentage": 60.13, "elapsed_time": "1 day, 20:01:37", "remaining_time": "1 day, 5:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5790, "total_steps": 9627, "loss": 1.5837, "learning_rate": 3.433515953414953e-05, "epoch": 0.6014334683702088, "percentage": 60.14, "elapsed_time": "1 day, 20:02:06", "remaining_time": "1 day, 5:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5791, "total_steps": 9627, "loss": 1.7953, "learning_rate": 3.431966525071033e-05, "epoch": 0.6015373428897891, "percentage": 60.15, "elapsed_time": "1 day, 20:02:33", "remaining_time": "1 day, 5:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5792, "total_steps": 9627, "loss": 1.6294, "learning_rate": 3.4304172637104436e-05, "epoch": 0.6016412174093695, "percentage": 60.16, "elapsed_time": "1 day, 20:03:02", "remaining_time": "1 day, 5:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5793, "total_steps": 9627, "loss": 1.686, "learning_rate": 3.4288681694981735e-05, "epoch": 0.6017450919289499, "percentage": 60.17, "elapsed_time": "1 day, 20:03:30", "remaining_time": "1 day, 5:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5794, "total_steps": 9627, "loss": 1.6336, "learning_rate": 3.42731924259919e-05, "epoch": 0.6018489664485301, "percentage": 60.18, "elapsed_time": "1 day, 20:03:58", "remaining_time": "1 day, 5:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5795, "total_steps": 9627, "loss": 1.6593, "learning_rate": 3.4257704831784375e-05, "epoch": 0.6019528409681105, "percentage": 60.2, "elapsed_time": "1 day, 20:04:26", "remaining_time": "1 day, 5:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5796, "total_steps": 9627, "loss": 1.8737, "learning_rate": 3.42422189140085e-05, "epoch": 0.6020567154876909, "percentage": 60.21, "elapsed_time": "1 day, 20:04:55", "remaining_time": "1 day, 5:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5797, "total_steps": 9627, "loss": 1.7137, "learning_rate": 3.42267346743134e-05, "epoch": 0.6021605900072712, "percentage": 60.22, "elapsed_time": "1 day, 20:05:22", "remaining_time": "1 day, 5:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5798, "total_steps": 9627, "loss": 1.7122, "learning_rate": 3.4211252114348e-05, "epoch": 0.6022644645268516, "percentage": 60.23, "elapsed_time": "1 day, 20:05:50", "remaining_time": "1 day, 5:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5799, "total_steps": 9627, "loss": 1.6723, "learning_rate": 3.41957712357611e-05, "epoch": 0.6023683390464319, "percentage": 60.24, "elapsed_time": "1 day, 20:06:18", "remaining_time": "1 day, 5:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5800, "total_steps": 9627, "loss": 1.6197, "learning_rate": 3.41802920402013e-05, "epoch": 0.6024722135660122, "percentage": 60.25, "elapsed_time": "1 day, 20:06:46", "remaining_time": "1 day, 5:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5801, "total_steps": 9627, "loss": 1.5572, "learning_rate": 3.416481452931699e-05, "epoch": 0.6025760880855926, "percentage": 60.26, "elapsed_time": "1 day, 20:07:15", "remaining_time": "1 day, 5:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5802, "total_steps": 9627, "loss": 1.6363, "learning_rate": 3.4149338704756416e-05, "epoch": 0.602679962605173, "percentage": 60.27, "elapsed_time": "1 day, 20:07:43", "remaining_time": "1 day, 5:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5803, "total_steps": 9627, "loss": 1.8986, "learning_rate": 3.413386456816763e-05, "epoch": 0.6027838371247533, "percentage": 60.28, "elapsed_time": "1 day, 20:08:11", "remaining_time": "1 day, 5:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5804, "total_steps": 9627, "loss": 1.64, "learning_rate": 3.411839212119851e-05, "epoch": 0.6028877116443336, "percentage": 60.29, "elapsed_time": "1 day, 20:08:38", "remaining_time": "1 day, 5:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5805, "total_steps": 9627, "loss": 1.577, "learning_rate": 3.410292136549673e-05, "epoch": 0.602991586163914, "percentage": 60.3, "elapsed_time": "1 day, 20:09:07", "remaining_time": "1 day, 5:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5806, "total_steps": 9627, "loss": 1.6308, "learning_rate": 3.408745230270985e-05, "epoch": 0.6030954606834943, "percentage": 60.31, "elapsed_time": "1 day, 20:09:35", "remaining_time": "1 day, 5:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5807, "total_steps": 9627, "loss": 1.6313, "learning_rate": 3.407198493448516e-05, "epoch": 0.6031993352030747, "percentage": 60.32, "elapsed_time": "1 day, 20:10:03", "remaining_time": "1 day, 5:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5808, "total_steps": 9627, "loss": 1.7215, "learning_rate": 3.405651926246982e-05, "epoch": 0.603303209722655, "percentage": 60.33, "elapsed_time": "1 day, 20:10:30", "remaining_time": "1 day, 5:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5809, "total_steps": 9627, "loss": 1.665, "learning_rate": 3.4041055288310844e-05, "epoch": 0.6034070842422353, "percentage": 60.34, "elapsed_time": "1 day, 20:11:00", "remaining_time": "1 day, 5:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5810, "total_steps": 9627, "loss": 1.6458, "learning_rate": 3.402559301365498e-05, "epoch": 0.6035109587618157, "percentage": 60.35, "elapsed_time": "1 day, 20:11:27", "remaining_time": "1 day, 5:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5811, "total_steps": 9627, "loss": 1.6737, "learning_rate": 3.401013244014884e-05, "epoch": 0.6036148332813961, "percentage": 60.36, "elapsed_time": "1 day, 20:11:56", "remaining_time": "1 day, 5:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5812, "total_steps": 9627, "loss": 1.702, "learning_rate": 3.3994673569438886e-05, "epoch": 0.6037187078009765, "percentage": 60.37, "elapsed_time": "1 day, 20:12:24", "remaining_time": "1 day, 5:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5813, "total_steps": 9627, "loss": 1.6435, "learning_rate": 3.397921640317136e-05, "epoch": 0.6038225823205567, "percentage": 60.38, "elapsed_time": "1 day, 20:12:51", "remaining_time": "1 day, 5:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5814, "total_steps": 9627, "loss": 1.7202, "learning_rate": 3.39637609429923e-05, "epoch": 0.6039264568401371, "percentage": 60.39, "elapsed_time": "1 day, 20:13:20", "remaining_time": "1 day, 5:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5815, "total_steps": 9627, "loss": 1.664, "learning_rate": 3.3948307190547624e-05, "epoch": 0.6040303313597175, "percentage": 60.4, "elapsed_time": "1 day, 20:13:49", "remaining_time": "1 day, 4:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5816, "total_steps": 9627, "loss": 1.6268, "learning_rate": 3.3932855147483024e-05, "epoch": 0.6041342058792978, "percentage": 60.41, "elapsed_time": "1 day, 20:14:16", "remaining_time": "1 day, 4:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5817, "total_steps": 9627, "loss": 1.7967, "learning_rate": 3.391740481544402e-05, "epoch": 0.6042380803988782, "percentage": 60.42, "elapsed_time": "1 day, 20:14:45", "remaining_time": "1 day, 4:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5818, "total_steps": 9627, "loss": 1.5787, "learning_rate": 3.3901956196075945e-05, "epoch": 0.6043419549184585, "percentage": 60.43, "elapsed_time": "1 day, 20:15:13", "remaining_time": "1 day, 4:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5819, "total_steps": 9627, "loss": 1.6593, "learning_rate": 3.3886509291023986e-05, "epoch": 0.6044458294380388, "percentage": 60.44, "elapsed_time": "1 day, 20:15:42", "remaining_time": "1 day, 4:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5820, "total_steps": 9627, "loss": 1.6942, "learning_rate": 3.387106410193308e-05, "epoch": 0.6045497039576192, "percentage": 60.45, "elapsed_time": "1 day, 20:16:09", "remaining_time": "1 day, 4:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5821, "total_steps": 9627, "loss": 1.5867, "learning_rate": 3.385562063044803e-05, "epoch": 0.6046535784771996, "percentage": 60.47, "elapsed_time": "1 day, 20:16:38", "remaining_time": "1 day, 4:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5822, "total_steps": 9627, "loss": 1.8252, "learning_rate": 3.384017887821348e-05, "epoch": 0.6047574529967799, "percentage": 60.48, "elapsed_time": "1 day, 20:17:05", "remaining_time": "1 day, 4:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5823, "total_steps": 9627, "loss": 1.8101, "learning_rate": 3.382473884687382e-05, "epoch": 0.6048613275163602, "percentage": 60.49, "elapsed_time": "1 day, 20:17:34", "remaining_time": "1 day, 4:56:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5824, "total_steps": 9627, "loss": 1.6124, "learning_rate": 3.380930053807328e-05, "epoch": 0.6049652020359406, "percentage": 60.5, "elapsed_time": "1 day, 20:18:02", "remaining_time": "1 day, 4:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5825, "total_steps": 9627, "loss": 1.575, "learning_rate": 3.379386395345596e-05, "epoch": 0.6050690765555209, "percentage": 60.51, "elapsed_time": "1 day, 20:18:30", "remaining_time": "1 day, 4:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5826, "total_steps": 9627, "loss": 1.6505, "learning_rate": 3.377842909466571e-05, "epoch": 0.6051729510751013, "percentage": 60.52, "elapsed_time": "1 day, 20:18:57", "remaining_time": "1 day, 4:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5827, "total_steps": 9627, "loss": 1.7677, "learning_rate": 3.376299596334622e-05, "epoch": 0.6052768255946817, "percentage": 60.53, "elapsed_time": "1 day, 20:19:26", "remaining_time": "1 day, 4:54:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5828, "total_steps": 9627, "loss": 1.5649, "learning_rate": 3.374756456114102e-05, "epoch": 0.6053807001142619, "percentage": 60.54, "elapsed_time": "1 day, 20:19:55", "remaining_time": "1 day, 4:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5829, "total_steps": 9627, "loss": 1.8967, "learning_rate": 3.373213488969341e-05, "epoch": 0.6054845746338423, "percentage": 60.55, "elapsed_time": "1 day, 20:20:23", "remaining_time": "1 day, 4:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5830, "total_steps": 9627, "loss": 1.6626, "learning_rate": 3.371670695064655e-05, "epoch": 0.6055884491534227, "percentage": 60.56, "elapsed_time": "1 day, 20:20:51", "remaining_time": "1 day, 4:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5831, "total_steps": 9627, "loss": 1.9178, "learning_rate": 3.370128074564338e-05, "epoch": 0.605692323673003, "percentage": 60.57, "elapsed_time": "1 day, 20:21:19", "remaining_time": "1 day, 4:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5832, "total_steps": 9627, "loss": 1.7219, "learning_rate": 3.368585627632668e-05, "epoch": 0.6057961981925833, "percentage": 60.58, "elapsed_time": "1 day, 20:21:47", "remaining_time": "1 day, 4:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5833, "total_steps": 9627, "loss": 1.6541, "learning_rate": 3.3670433544339014e-05, "epoch": 0.6059000727121637, "percentage": 60.59, "elapsed_time": "1 day, 20:22:15", "remaining_time": "1 day, 4:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5834, "total_steps": 9627, "loss": 1.5446, "learning_rate": 3.365501255132283e-05, "epoch": 0.606003947231744, "percentage": 60.6, "elapsed_time": "1 day, 20:22:42", "remaining_time": "1 day, 4:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5835, "total_steps": 9627, "loss": 1.5639, "learning_rate": 3.363959329892029e-05, "epoch": 0.6061078217513244, "percentage": 60.61, "elapsed_time": "1 day, 20:23:10", "remaining_time": "1 day, 4:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5836, "total_steps": 9627, "loss": 1.5162, "learning_rate": 3.362417578877344e-05, "epoch": 0.6062116962709048, "percentage": 60.62, "elapsed_time": "1 day, 20:23:39", "remaining_time": "1 day, 4:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5837, "total_steps": 9627, "loss": 1.6176, "learning_rate": 3.360876002252415e-05, "epoch": 0.6063155707904851, "percentage": 60.63, "elapsed_time": "1 day, 20:24:06", "remaining_time": "1 day, 4:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5838, "total_steps": 9627, "loss": 1.7371, "learning_rate": 3.359334600181407e-05, "epoch": 0.6064194453100654, "percentage": 60.64, "elapsed_time": "1 day, 20:24:36", "remaining_time": "1 day, 4:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5839, "total_steps": 9627, "loss": 1.4975, "learning_rate": 3.357793372828464e-05, "epoch": 0.6065233198296458, "percentage": 60.65, "elapsed_time": "1 day, 20:25:03", "remaining_time": "1 day, 4:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5840, "total_steps": 9627, "loss": 1.623, "learning_rate": 3.356252320357718e-05, "epoch": 0.6066271943492262, "percentage": 60.66, "elapsed_time": "1 day, 20:25:31", "remaining_time": "1 day, 4:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5841, "total_steps": 9627, "loss": 1.5882, "learning_rate": 3.354711442933279e-05, "epoch": 0.6067310688688065, "percentage": 60.67, "elapsed_time": "1 day, 20:25:59", "remaining_time": "1 day, 4:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5842, "total_steps": 9627, "loss": 1.814, "learning_rate": 3.353170740719236e-05, "epoch": 0.6068349433883868, "percentage": 60.68, "elapsed_time": "1 day, 20:26:27", "remaining_time": "1 day, 4:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5843, "total_steps": 9627, "loss": 1.5899, "learning_rate": 3.351630213879665e-05, "epoch": 0.6069388179079672, "percentage": 60.69, "elapsed_time": "1 day, 20:26:55", "remaining_time": "1 day, 4:47:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5844, "total_steps": 9627, "loss": 1.6746, "learning_rate": 3.3500898625786184e-05, "epoch": 0.6070426924275475, "percentage": 60.7, "elapsed_time": "1 day, 20:27:23", "remaining_time": "1 day, 4:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5845, "total_steps": 9627, "loss": 1.5783, "learning_rate": 3.34854968698013e-05, "epoch": 0.6071465669471279, "percentage": 60.71, "elapsed_time": "1 day, 20:27:52", "remaining_time": "1 day, 4:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5846, "total_steps": 9627, "loss": 1.7318, "learning_rate": 3.347009687248219e-05, "epoch": 0.6072504414667083, "percentage": 60.73, "elapsed_time": "1 day, 20:28:20", "remaining_time": "1 day, 4:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5847, "total_steps": 9627, "loss": 1.5555, "learning_rate": 3.345469863546884e-05, "epoch": 0.6073543159862885, "percentage": 60.74, "elapsed_time": "1 day, 20:28:48", "remaining_time": "1 day, 4:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5848, "total_steps": 9627, "loss": 1.5914, "learning_rate": 3.3439302160401e-05, "epoch": 0.6074581905058689, "percentage": 60.75, "elapsed_time": "1 day, 20:29:16", "remaining_time": "1 day, 4:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5849, "total_steps": 9627, "loss": 1.7131, "learning_rate": 3.342390744891831e-05, "epoch": 0.6075620650254493, "percentage": 60.76, "elapsed_time": "1 day, 20:29:44", "remaining_time": "1 day, 4:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5850, "total_steps": 9627, "loss": 1.7986, "learning_rate": 3.340851450266019e-05, "epoch": 0.6076659395450296, "percentage": 60.77, "elapsed_time": "1 day, 20:30:12", "remaining_time": "1 day, 4:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5851, "total_steps": 9627, "loss": 1.7041, "learning_rate": 3.3393123323265855e-05, "epoch": 0.60776981406461, "percentage": 60.78, "elapsed_time": "1 day, 20:30:40", "remaining_time": "1 day, 4:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5852, "total_steps": 9627, "loss": 1.5044, "learning_rate": 3.337773391237433e-05, "epoch": 0.6078736885841903, "percentage": 60.79, "elapsed_time": "1 day, 20:31:08", "remaining_time": "1 day, 4:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5853, "total_steps": 9627, "loss": 1.6597, "learning_rate": 3.336234627162451e-05, "epoch": 0.6079775631037706, "percentage": 60.8, "elapsed_time": "1 day, 20:31:36", "remaining_time": "1 day, 4:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5854, "total_steps": 9627, "loss": 1.6794, "learning_rate": 3.3346960402655016e-05, "epoch": 0.608081437623351, "percentage": 60.81, "elapsed_time": "1 day, 20:32:04", "remaining_time": "1 day, 4:42:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5855, "total_steps": 9627, "loss": 1.8548, "learning_rate": 3.333157630710434e-05, "epoch": 0.6081853121429314, "percentage": 60.82, "elapsed_time": "1 day, 20:32:33", "remaining_time": "1 day, 4:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5856, "total_steps": 9627, "loss": 1.597, "learning_rate": 3.331619398661078e-05, "epoch": 0.6082891866625116, "percentage": 60.83, "elapsed_time": "1 day, 20:33:00", "remaining_time": "1 day, 4:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5857, "total_steps": 9627, "loss": 1.5453, "learning_rate": 3.3300813442812406e-05, "epoch": 0.608393061182092, "percentage": 60.84, "elapsed_time": "1 day, 20:33:29", "remaining_time": "1 day, 4:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5858, "total_steps": 9627, "loss": 1.6159, "learning_rate": 3.328543467734715e-05, "epoch": 0.6084969357016724, "percentage": 60.85, "elapsed_time": "1 day, 20:33:58", "remaining_time": "1 day, 4:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5859, "total_steps": 9627, "loss": 1.9154, "learning_rate": 3.327005769185273e-05, "epoch": 0.6086008102212527, "percentage": 60.86, "elapsed_time": "1 day, 20:34:26", "remaining_time": "1 day, 4:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5860, "total_steps": 9627, "loss": 1.6842, "learning_rate": 3.325468248796666e-05, "epoch": 0.6087046847408331, "percentage": 60.87, "elapsed_time": "1 day, 20:34:54", "remaining_time": "1 day, 4:39:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5861, "total_steps": 9627, "loss": 1.5068, "learning_rate": 3.323930906732628e-05, "epoch": 0.6088085592604134, "percentage": 60.88, "elapsed_time": "1 day, 20:35:21", "remaining_time": "1 day, 4:39:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5862, "total_steps": 9627, "loss": 1.8432, "learning_rate": 3.322393743156874e-05, "epoch": 0.6089124337799938, "percentage": 60.89, "elapsed_time": "1 day, 20:35:51", "remaining_time": "1 day, 4:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5863, "total_steps": 9627, "loss": 1.7516, "learning_rate": 3.3208567582331034e-05, "epoch": 0.6090163082995741, "percentage": 60.9, "elapsed_time": "1 day, 20:36:18", "remaining_time": "1 day, 4:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5864, "total_steps": 9627, "loss": 1.7277, "learning_rate": 3.3193199521249876e-05, "epoch": 0.6091201828191545, "percentage": 60.91, "elapsed_time": "1 day, 20:36:47", "remaining_time": "1 day, 4:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5865, "total_steps": 9627, "loss": 1.5975, "learning_rate": 3.3177833249961886e-05, "epoch": 0.6092240573387349, "percentage": 60.92, "elapsed_time": "1 day, 20:37:15", "remaining_time": "1 day, 4:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5866, "total_steps": 9627, "loss": 1.6415, "learning_rate": 3.316246877010344e-05, "epoch": 0.6093279318583151, "percentage": 60.93, "elapsed_time": "1 day, 20:37:43", "remaining_time": "1 day, 4:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5867, "total_steps": 9627, "loss": 1.7596, "learning_rate": 3.314710608331072e-05, "epoch": 0.6094318063778955, "percentage": 60.94, "elapsed_time": "1 day, 20:38:12", "remaining_time": "1 day, 4:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5868, "total_steps": 9627, "loss": 1.7909, "learning_rate": 3.3131745191219744e-05, "epoch": 0.6095356808974759, "percentage": 60.95, "elapsed_time": "1 day, 20:38:39", "remaining_time": "1 day, 4:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5869, "total_steps": 9627, "loss": 1.6518, "learning_rate": 3.311638609546635e-05, "epoch": 0.6096395554170562, "percentage": 60.96, "elapsed_time": "1 day, 20:39:08", "remaining_time": "1 day, 4:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5870, "total_steps": 9627, "loss": 1.6841, "learning_rate": 3.3101028797686106e-05, "epoch": 0.6097434299366365, "percentage": 60.97, "elapsed_time": "1 day, 20:39:35", "remaining_time": "1 day, 4:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5871, "total_steps": 9627, "loss": 1.7182, "learning_rate": 3.3085673299514496e-05, "epoch": 0.6098473044562169, "percentage": 60.98, "elapsed_time": "1 day, 20:40:04", "remaining_time": "1 day, 4:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5872, "total_steps": 9627, "loss": 1.5292, "learning_rate": 3.307031960258674e-05, "epoch": 0.6099511789757972, "percentage": 61.0, "elapsed_time": "1 day, 20:40:32", "remaining_time": "1 day, 4:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5873, "total_steps": 9627, "loss": 1.6406, "learning_rate": 3.30549677085379e-05, "epoch": 0.6100550534953776, "percentage": 61.01, "elapsed_time": "1 day, 20:41:01", "remaining_time": "1 day, 4:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5874, "total_steps": 9627, "loss": 1.5848, "learning_rate": 3.30396176190028e-05, "epoch": 0.610158928014958, "percentage": 61.02, "elapsed_time": "1 day, 20:41:28", "remaining_time": "1 day, 4:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5875, "total_steps": 9627, "loss": 1.6565, "learning_rate": 3.3024269335616155e-05, "epoch": 0.6102628025345382, "percentage": 61.03, "elapsed_time": "1 day, 20:41:57", "remaining_time": "1 day, 4:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5876, "total_steps": 9627, "loss": 1.72, "learning_rate": 3.300892286001238e-05, "epoch": 0.6103666770541186, "percentage": 61.04, "elapsed_time": "1 day, 20:42:24", "remaining_time": "1 day, 4:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5877, "total_steps": 9627, "loss": 1.5959, "learning_rate": 3.29935781938258e-05, "epoch": 0.610470551573699, "percentage": 61.05, "elapsed_time": "1 day, 20:42:54", "remaining_time": "1 day, 4:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5878, "total_steps": 9627, "loss": 1.7009, "learning_rate": 3.29782353386905e-05, "epoch": 0.6105744260932793, "percentage": 61.06, "elapsed_time": "1 day, 20:43:22", "remaining_time": "1 day, 4:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5879, "total_steps": 9627, "loss": 1.5514, "learning_rate": 3.296289429624035e-05, "epoch": 0.6106783006128597, "percentage": 61.07, "elapsed_time": "1 day, 20:43:49", "remaining_time": "1 day, 4:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5880, "total_steps": 9627, "loss": 1.6511, "learning_rate": 3.294755506810905e-05, "epoch": 0.61078217513244, "percentage": 61.08, "elapsed_time": "1 day, 20:44:18", "remaining_time": "1 day, 4:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5881, "total_steps": 9627, "loss": 1.4797, "learning_rate": 3.293221765593015e-05, "epoch": 0.6108860496520203, "percentage": 61.09, "elapsed_time": "1 day, 20:44:45", "remaining_time": "1 day, 4:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5882, "total_steps": 9627, "loss": 1.77, "learning_rate": 3.291688206133691e-05, "epoch": 0.6109899241716007, "percentage": 61.1, "elapsed_time": "1 day, 20:45:15", "remaining_time": "1 day, 4:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5883, "total_steps": 9627, "loss": 1.6022, "learning_rate": 3.290154828596248e-05, "epoch": 0.6110937986911811, "percentage": 61.11, "elapsed_time": "1 day, 20:45:43", "remaining_time": "1 day, 4:29:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5884, "total_steps": 9627, "loss": 1.5761, "learning_rate": 3.28862163314398e-05, "epoch": 0.6111976732107613, "percentage": 61.12, "elapsed_time": "1 day, 20:46:10", "remaining_time": "1 day, 4:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5885, "total_steps": 9627, "loss": 1.7047, "learning_rate": 3.287088619940158e-05, "epoch": 0.6113015477303417, "percentage": 61.13, "elapsed_time": "1 day, 20:46:39", "remaining_time": "1 day, 4:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5886, "total_steps": 9627, "loss": 1.5804, "learning_rate": 3.285555789148036e-05, "epoch": 0.6114054222499221, "percentage": 61.14, "elapsed_time": "1 day, 20:47:06", "remaining_time": "1 day, 4:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5887, "total_steps": 9627, "loss": 1.7646, "learning_rate": 3.284023140930851e-05, "epoch": 0.6115092967695024, "percentage": 61.15, "elapsed_time": "1 day, 20:47:35", "remaining_time": "1 day, 4:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5888, "total_steps": 9627, "loss": 1.6731, "learning_rate": 3.2824906754518146e-05, "epoch": 0.6116131712890828, "percentage": 61.16, "elapsed_time": "1 day, 20:48:03", "remaining_time": "1 day, 4:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5889, "total_steps": 9627, "loss": 1.7342, "learning_rate": 3.280958392874124e-05, "epoch": 0.6117170458086632, "percentage": 61.17, "elapsed_time": "1 day, 20:48:31", "remaining_time": "1 day, 4:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5890, "total_steps": 9627, "loss": 1.6333, "learning_rate": 3.2794262933609555e-05, "epoch": 0.6118209203282435, "percentage": 61.18, "elapsed_time": "1 day, 20:49:00", "remaining_time": "1 day, 4:26:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5891, "total_steps": 9627, "loss": 1.8507, "learning_rate": 3.277894377075468e-05, "epoch": 0.6119247948478238, "percentage": 61.19, "elapsed_time": "1 day, 20:49:28", "remaining_time": "1 day, 4:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5892, "total_steps": 9627, "loss": 1.712, "learning_rate": 3.276362644180794e-05, "epoch": 0.6120286693674042, "percentage": 61.2, "elapsed_time": "1 day, 20:49:56", "remaining_time": "1 day, 4:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5893, "total_steps": 9627, "loss": 1.6575, "learning_rate": 3.2748310948400545e-05, "epoch": 0.6121325438869846, "percentage": 61.21, "elapsed_time": "1 day, 20:50:25", "remaining_time": "1 day, 4:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5894, "total_steps": 9627, "loss": 1.9697, "learning_rate": 3.273299729216348e-05, "epoch": 0.6122364184065648, "percentage": 61.22, "elapsed_time": "1 day, 20:50:52", "remaining_time": "1 day, 4:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5895, "total_steps": 9627, "loss": 1.7102, "learning_rate": 3.2717685474727495e-05, "epoch": 0.6123402929261452, "percentage": 61.23, "elapsed_time": "1 day, 20:51:21", "remaining_time": "1 day, 4:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5896, "total_steps": 9627, "loss": 1.6602, "learning_rate": 3.270237549772319e-05, "epoch": 0.6124441674457256, "percentage": 61.24, "elapsed_time": "1 day, 20:51:49", "remaining_time": "1 day, 4:23:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5897, "total_steps": 9627, "loss": 1.6355, "learning_rate": 3.2687067362780997e-05, "epoch": 0.6125480419653059, "percentage": 61.25, "elapsed_time": "1 day, 20:52:17", "remaining_time": "1 day, 4:22:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5898, "total_steps": 9627, "loss": 1.5367, "learning_rate": 3.267176107153107e-05, "epoch": 0.6126519164848863, "percentage": 61.27, "elapsed_time": "1 day, 20:52:45", "remaining_time": "1 day, 4:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5899, "total_steps": 9627, "loss": 1.7275, "learning_rate": 3.2656456625603425e-05, "epoch": 0.6127557910044666, "percentage": 61.28, "elapsed_time": "1 day, 20:53:14", "remaining_time": "1 day, 4:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5900, "total_steps": 9627, "loss": 1.7106, "learning_rate": 3.2641154026627866e-05, "epoch": 0.6128596655240469, "percentage": 61.29, "elapsed_time": "1 day, 20:53:41", "remaining_time": "1 day, 4:21:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5901, "total_steps": 9627, "loss": 1.6203, "learning_rate": 3.2625853276234e-05, "epoch": 0.6129635400436273, "percentage": 61.3, "elapsed_time": "1 day, 20:54:10", "remaining_time": "1 day, 4:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5902, "total_steps": 9627, "loss": 1.6936, "learning_rate": 3.2610554376051224e-05, "epoch": 0.6130674145632077, "percentage": 61.31, "elapsed_time": "1 day, 20:54:38", "remaining_time": "1 day, 4:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5903, "total_steps": 9627, "loss": 1.9501, "learning_rate": 3.2595257327708785e-05, "epoch": 0.613171289082788, "percentage": 61.32, "elapsed_time": "1 day, 20:55:06", "remaining_time": "1 day, 4:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5904, "total_steps": 9627, "loss": 1.5555, "learning_rate": 3.257996213283566e-05, "epoch": 0.6132751636023683, "percentage": 61.33, "elapsed_time": "1 day, 20:55:34", "remaining_time": "1 day, 4:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5905, "total_steps": 9627, "loss": 1.5927, "learning_rate": 3.256466879306068e-05, "epoch": 0.6133790381219487, "percentage": 61.34, "elapsed_time": "1 day, 20:56:03", "remaining_time": "1 day, 4:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5906, "total_steps": 9627, "loss": 1.6676, "learning_rate": 3.25493773100125e-05, "epoch": 0.613482912641529, "percentage": 61.35, "elapsed_time": "1 day, 20:56:30", "remaining_time": "1 day, 4:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5907, "total_steps": 9627, "loss": 1.5935, "learning_rate": 3.2534087685319506e-05, "epoch": 0.6135867871611094, "percentage": 61.36, "elapsed_time": "1 day, 20:57:00", "remaining_time": "1 day, 4:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5908, "total_steps": 9627, "loss": 1.7057, "learning_rate": 3.2518799920609924e-05, "epoch": 0.6136906616806898, "percentage": 61.37, "elapsed_time": "1 day, 20:57:27", "remaining_time": "1 day, 4:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5909, "total_steps": 9627, "loss": 1.6022, "learning_rate": 3.2503514017511806e-05, "epoch": 0.61379453620027, "percentage": 61.38, "elapsed_time": "1 day, 20:57:56", "remaining_time": "1 day, 4:17:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5910, "total_steps": 9627, "loss": 1.7709, "learning_rate": 3.2488229977652954e-05, "epoch": 0.6138984107198504, "percentage": 61.39, "elapsed_time": "1 day, 20:58:23", "remaining_time": "1 day, 4:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5911, "total_steps": 9627, "loss": 1.702, "learning_rate": 3.2472947802661005e-05, "epoch": 0.6140022852394308, "percentage": 61.4, "elapsed_time": "1 day, 20:58:52", "remaining_time": "1 day, 4:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5912, "total_steps": 9627, "loss": 1.6426, "learning_rate": 3.245766749416342e-05, "epoch": 0.6141061597590111, "percentage": 61.41, "elapsed_time": "1 day, 20:59:20", "remaining_time": "1 day, 4:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5913, "total_steps": 9627, "loss": 1.6559, "learning_rate": 3.24423890537874e-05, "epoch": 0.6142100342785914, "percentage": 61.42, "elapsed_time": "1 day, 20:59:48", "remaining_time": "1 day, 4:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5914, "total_steps": 9627, "loss": 1.7074, "learning_rate": 3.242711248316e-05, "epoch": 0.6143139087981718, "percentage": 61.43, "elapsed_time": "1 day, 21:00:17", "remaining_time": "1 day, 4:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5915, "total_steps": 9627, "loss": 1.8111, "learning_rate": 3.241183778390803e-05, "epoch": 0.6144177833177522, "percentage": 61.44, "elapsed_time": "1 day, 21:00:44", "remaining_time": "1 day, 4:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5916, "total_steps": 9627, "loss": 1.5673, "learning_rate": 3.239656495765817e-05, "epoch": 0.6145216578373325, "percentage": 61.45, "elapsed_time": "1 day, 21:01:13", "remaining_time": "1 day, 4:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5917, "total_steps": 9627, "loss": 1.6545, "learning_rate": 3.23812940060368e-05, "epoch": 0.6146255323569129, "percentage": 61.46, "elapsed_time": "1 day, 21:01:40", "remaining_time": "1 day, 4:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5918, "total_steps": 9627, "loss": 1.6233, "learning_rate": 3.2366024930670194e-05, "epoch": 0.6147294068764932, "percentage": 61.47, "elapsed_time": "1 day, 21:02:10", "remaining_time": "1 day, 4:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5919, "total_steps": 9627, "loss": 1.7184, "learning_rate": 3.23507577331844e-05, "epoch": 0.6148332813960735, "percentage": 61.48, "elapsed_time": "1 day, 21:02:37", "remaining_time": "1 day, 4:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5920, "total_steps": 9627, "loss": 1.6877, "learning_rate": 3.2335492415205224e-05, "epoch": 0.6149371559156539, "percentage": 61.49, "elapsed_time": "1 day, 21:03:06", "remaining_time": "1 day, 4:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5921, "total_steps": 9627, "loss": 1.6024, "learning_rate": 3.2320228978358324e-05, "epoch": 0.6150410304352343, "percentage": 61.5, "elapsed_time": "1 day, 21:03:34", "remaining_time": "1 day, 4:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5922, "total_steps": 9627, "loss": 1.5523, "learning_rate": 3.230496742426914e-05, "epoch": 0.6151449049548146, "percentage": 61.51, "elapsed_time": "1 day, 21:04:02", "remaining_time": "1 day, 4:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5923, "total_steps": 9627, "loss": 1.6793, "learning_rate": 3.228970775456288e-05, "epoch": 0.6152487794743949, "percentage": 61.52, "elapsed_time": "1 day, 21:04:30", "remaining_time": "1 day, 4:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5924, "total_steps": 9627, "loss": 1.6962, "learning_rate": 3.2274449970864595e-05, "epoch": 0.6153526539939753, "percentage": 61.54, "elapsed_time": "1 day, 21:04:59", "remaining_time": "1 day, 4:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5925, "total_steps": 9627, "loss": 1.7432, "learning_rate": 3.225919407479914e-05, "epoch": 0.6154565285135556, "percentage": 61.55, "elapsed_time": "1 day, 21:05:26", "remaining_time": "1 day, 4:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5926, "total_steps": 9627, "loss": 1.6198, "learning_rate": 3.224394006799112e-05, "epoch": 0.615560403033136, "percentage": 61.56, "elapsed_time": "1 day, 21:05:54", "remaining_time": "1 day, 4:09:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5927, "total_steps": 9627, "loss": 1.5267, "learning_rate": 3.222868795206498e-05, "epoch": 0.6156642775527164, "percentage": 61.57, "elapsed_time": "1 day, 21:06:22", "remaining_time": "1 day, 4:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5928, "total_steps": 9627, "loss": 1.8421, "learning_rate": 3.221343772864497e-05, "epoch": 0.6157681520722966, "percentage": 61.58, "elapsed_time": "1 day, 21:06:50", "remaining_time": "1 day, 4:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5929, "total_steps": 9627, "loss": 1.701, "learning_rate": 3.2198189399355085e-05, "epoch": 0.615872026591877, "percentage": 61.59, "elapsed_time": "1 day, 21:07:20", "remaining_time": "1 day, 4:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5930, "total_steps": 9627, "loss": 1.5238, "learning_rate": 3.218294296581916e-05, "epoch": 0.6159759011114574, "percentage": 61.6, "elapsed_time": "1 day, 21:07:47", "remaining_time": "1 day, 4:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5931, "total_steps": 9627, "loss": 1.7779, "learning_rate": 3.2167698429660866e-05, "epoch": 0.6160797756310377, "percentage": 61.61, "elapsed_time": "1 day, 21:08:16", "remaining_time": "1 day, 4:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5932, "total_steps": 9627, "loss": 1.6755, "learning_rate": 3.215245579250355e-05, "epoch": 0.616183650150618, "percentage": 61.62, "elapsed_time": "1 day, 21:08:44", "remaining_time": "1 day, 4:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5933, "total_steps": 9627, "loss": 1.8098, "learning_rate": 3.2137215055970496e-05, "epoch": 0.6162875246701984, "percentage": 61.63, "elapsed_time": "1 day, 21:09:11", "remaining_time": "1 day, 4:06:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5934, "total_steps": 9627, "loss": 1.5704, "learning_rate": 3.2121976221684714e-05, "epoch": 0.6163913991897787, "percentage": 61.64, "elapsed_time": "1 day, 21:09:40", "remaining_time": "1 day, 4:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5935, "total_steps": 9627, "loss": 1.7943, "learning_rate": 3.2106739291269005e-05, "epoch": 0.6164952737093591, "percentage": 61.65, "elapsed_time": "1 day, 21:10:09", "remaining_time": "1 day, 4:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5936, "total_steps": 9627, "loss": 1.7347, "learning_rate": 3.209150426634597e-05, "epoch": 0.6165991482289395, "percentage": 61.66, "elapsed_time": "1 day, 21:10:36", "remaining_time": "1 day, 4:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5937, "total_steps": 9627, "loss": 1.6469, "learning_rate": 3.2076271148538066e-05, "epoch": 0.6167030227485197, "percentage": 61.67, "elapsed_time": "1 day, 21:11:04", "remaining_time": "1 day, 4:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5938, "total_steps": 9627, "loss": 1.7029, "learning_rate": 3.2061039939467454e-05, "epoch": 0.6168068972681001, "percentage": 61.68, "elapsed_time": "1 day, 21:11:33", "remaining_time": "1 day, 4:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5939, "total_steps": 9627, "loss": 2.0553, "learning_rate": 3.204581064075616e-05, "epoch": 0.6169107717876805, "percentage": 61.69, "elapsed_time": "1 day, 21:12:00", "remaining_time": "1 day, 4:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5940, "total_steps": 9627, "loss": 1.7076, "learning_rate": 3.203058325402599e-05, "epoch": 0.6170146463072609, "percentage": 61.7, "elapsed_time": "1 day, 21:12:30", "remaining_time": "1 day, 4:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5941, "total_steps": 9627, "loss": 1.5993, "learning_rate": 3.201535778089853e-05, "epoch": 0.6171185208268412, "percentage": 61.71, "elapsed_time": "1 day, 21:12:58", "remaining_time": "1 day, 4:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5942, "total_steps": 9627, "loss": 1.3709, "learning_rate": 3.20001342229952e-05, "epoch": 0.6172223953464215, "percentage": 61.72, "elapsed_time": "1 day, 21:13:25", "remaining_time": "1 day, 4:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5943, "total_steps": 9627, "loss": 1.6183, "learning_rate": 3.1984912581937146e-05, "epoch": 0.6173262698660019, "percentage": 61.73, "elapsed_time": "1 day, 21:13:54", "remaining_time": "1 day, 4:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5944, "total_steps": 9627, "loss": 1.5723, "learning_rate": 3.196969285934541e-05, "epoch": 0.6174301443855822, "percentage": 61.74, "elapsed_time": "1 day, 21:14:22", "remaining_time": "1 day, 4:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5945, "total_steps": 9627, "loss": 1.593, "learning_rate": 3.1954475056840714e-05, "epoch": 0.6175340189051626, "percentage": 61.75, "elapsed_time": "1 day, 21:14:50", "remaining_time": "1 day, 4:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5946, "total_steps": 9627, "loss": 1.7796, "learning_rate": 3.193925917604367e-05, "epoch": 0.617637893424743, "percentage": 61.76, "elapsed_time": "1 day, 21:15:19", "remaining_time": "1 day, 4:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5947, "total_steps": 9627, "loss": 1.8134, "learning_rate": 3.1924045218574654e-05, "epoch": 0.6177417679443232, "percentage": 61.77, "elapsed_time": "1 day, 21:15:47", "remaining_time": "1 day, 4:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5948, "total_steps": 9627, "loss": 1.5344, "learning_rate": 3.190883318605382e-05, "epoch": 0.6178456424639036, "percentage": 61.78, "elapsed_time": "1 day, 21:16:16", "remaining_time": "1 day, 4:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5949, "total_steps": 9627, "loss": 1.6706, "learning_rate": 3.189362308010113e-05, "epoch": 0.617949516983484, "percentage": 61.79, "elapsed_time": "1 day, 21:16:44", "remaining_time": "1 day, 3:59:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5950, "total_steps": 9627, "loss": 1.5388, "learning_rate": 3.187841490233636e-05, "epoch": 0.6180533915030643, "percentage": 61.81, "elapsed_time": "1 day, 21:17:12", "remaining_time": "1 day, 3:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5951, "total_steps": 9627, "loss": 1.7468, "learning_rate": 3.1863208654379036e-05, "epoch": 0.6181572660226446, "percentage": 61.82, "elapsed_time": "1 day, 21:17:41", "remaining_time": "1 day, 3:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5952, "total_steps": 9627, "loss": 1.5909, "learning_rate": 3.184800433784851e-05, "epoch": 0.618261140542225, "percentage": 61.83, "elapsed_time": "1 day, 21:18:09", "remaining_time": "1 day, 3:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5953, "total_steps": 9627, "loss": 1.8014, "learning_rate": 3.1832801954363955e-05, "epoch": 0.6183650150618053, "percentage": 61.84, "elapsed_time": "1 day, 21:18:38", "remaining_time": "1 day, 3:57:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5954, "total_steps": 9627, "loss": 1.6452, "learning_rate": 3.1817601505544264e-05, "epoch": 0.6184688895813857, "percentage": 61.85, "elapsed_time": "1 day, 21:19:07", "remaining_time": "1 day, 3:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5955, "total_steps": 9627, "loss": 1.6638, "learning_rate": 3.18024029930082e-05, "epoch": 0.6185727641009661, "percentage": 61.86, "elapsed_time": "1 day, 21:19:35", "remaining_time": "1 day, 3:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5956, "total_steps": 9627, "loss": 1.6237, "learning_rate": 3.178720641837426e-05, "epoch": 0.6186766386205463, "percentage": 61.87, "elapsed_time": "1 day, 21:20:04", "remaining_time": "1 day, 3:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5957, "total_steps": 9627, "loss": 1.6954, "learning_rate": 3.177201178326077e-05, "epoch": 0.6187805131401267, "percentage": 61.88, "elapsed_time": "1 day, 21:20:32", "remaining_time": "1 day, 3:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5958, "total_steps": 9627, "loss": 1.7631, "learning_rate": 3.175681908928584e-05, "epoch": 0.6188843876597071, "percentage": 61.89, "elapsed_time": "1 day, 21:21:01", "remaining_time": "1 day, 3:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5959, "total_steps": 9627, "loss": 1.6, "learning_rate": 3.174162833806739e-05, "epoch": 0.6189882621792874, "percentage": 61.9, "elapsed_time": "1 day, 21:21:30", "remaining_time": "1 day, 3:55:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5960, "total_steps": 9627, "loss": 1.7953, "learning_rate": 3.172643953122308e-05, "epoch": 0.6190921366988678, "percentage": 61.91, "elapsed_time": "1 day, 21:21:57", "remaining_time": "1 day, 3:54:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5961, "total_steps": 9627, "loss": 1.779, "learning_rate": 3.171125267037042e-05, "epoch": 0.6191960112184481, "percentage": 61.92, "elapsed_time": "1 day, 21:22:25", "remaining_time": "1 day, 3:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5962, "total_steps": 9627, "loss": 1.7738, "learning_rate": 3.169606775712672e-05, "epoch": 0.6192998857380284, "percentage": 61.93, "elapsed_time": "1 day, 21:22:55", "remaining_time": "1 day, 3:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5963, "total_steps": 9627, "loss": 1.488, "learning_rate": 3.1680884793109014e-05, "epoch": 0.6194037602576088, "percentage": 61.94, "elapsed_time": "1 day, 21:23:23", "remaining_time": "1 day, 3:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5964, "total_steps": 9627, "loss": 1.6613, "learning_rate": 3.166570377993417e-05, "epoch": 0.6195076347771892, "percentage": 61.95, "elapsed_time": "1 day, 21:23:52", "remaining_time": "1 day, 3:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5965, "total_steps": 9627, "loss": 1.6224, "learning_rate": 3.165052471921888e-05, "epoch": 0.6196115092967694, "percentage": 61.96, "elapsed_time": "1 day, 21:24:20", "remaining_time": "1 day, 3:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5966, "total_steps": 9627, "loss": 1.6947, "learning_rate": 3.163534761257956e-05, "epoch": 0.6197153838163498, "percentage": 61.97, "elapsed_time": "1 day, 21:24:50", "remaining_time": "1 day, 3:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5967, "total_steps": 9627, "loss": 1.7144, "learning_rate": 3.162017246163247e-05, "epoch": 0.6198192583359302, "percentage": 61.98, "elapsed_time": "1 day, 21:25:18", "remaining_time": "1 day, 3:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5968, "total_steps": 9627, "loss": 1.6563, "learning_rate": 3.160499926799365e-05, "epoch": 0.6199231328555106, "percentage": 61.99, "elapsed_time": "1 day, 21:25:46", "remaining_time": "1 day, 3:51:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5969, "total_steps": 9627, "loss": 1.7237, "learning_rate": 3.1589828033278925e-05, "epoch": 0.6200270073750909, "percentage": 62.0, "elapsed_time": "1 day, 21:26:14", "remaining_time": "1 day, 3:50:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5970, "total_steps": 9627, "loss": 1.6751, "learning_rate": 3.157465875910391e-05, "epoch": 0.6201308818946712, "percentage": 62.01, "elapsed_time": "1 day, 21:26:43", "remaining_time": "1 day, 3:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5971, "total_steps": 9627, "loss": 1.547, "learning_rate": 3.1559491447084e-05, "epoch": 0.6202347564142516, "percentage": 62.02, "elapsed_time": "1 day, 21:27:13", "remaining_time": "1 day, 3:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5972, "total_steps": 9627, "loss": 1.6595, "learning_rate": 3.1544326098834433e-05, "epoch": 0.6203386309338319, "percentage": 62.03, "elapsed_time": "1 day, 21:27:41", "remaining_time": "1 day, 3:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5973, "total_steps": 9627, "loss": 1.755, "learning_rate": 3.152916271597015e-05, "epoch": 0.6204425054534123, "percentage": 62.04, "elapsed_time": "1 day, 21:28:09", "remaining_time": "1 day, 3:48:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5974, "total_steps": 9627, "loss": 1.6521, "learning_rate": 3.151400130010597e-05, "epoch": 0.6205463799729927, "percentage": 62.05, "elapsed_time": "1 day, 21:28:38", "remaining_time": "1 day, 3:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5975, "total_steps": 9627, "loss": 1.6084, "learning_rate": 3.149884185285647e-05, "epoch": 0.6206502544925729, "percentage": 62.07, "elapsed_time": "1 day, 21:29:06", "remaining_time": "1 day, 3:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5976, "total_steps": 9627, "loss": 1.5866, "learning_rate": 3.148368437583599e-05, "epoch": 0.6207541290121533, "percentage": 62.08, "elapsed_time": "1 day, 21:29:36", "remaining_time": "1 day, 3:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5977, "total_steps": 9627, "loss": 1.8135, "learning_rate": 3.146852887065868e-05, "epoch": 0.6208580035317337, "percentage": 62.09, "elapsed_time": "1 day, 21:30:03", "remaining_time": "1 day, 3:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5978, "total_steps": 9627, "loss": 1.6958, "learning_rate": 3.145337533893851e-05, "epoch": 0.620961878051314, "percentage": 62.1, "elapsed_time": "1 day, 21:30:33", "remaining_time": "1 day, 3:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5979, "total_steps": 9627, "loss": 1.5397, "learning_rate": 3.143822378228918e-05, "epoch": 0.6210657525708944, "percentage": 62.11, "elapsed_time": "1 day, 21:31:01", "remaining_time": "1 day, 3:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5980, "total_steps": 9627, "loss": 1.7797, "learning_rate": 3.142307420232423e-05, "epoch": 0.6211696270904747, "percentage": 62.12, "elapsed_time": "1 day, 21:31:29", "remaining_time": "1 day, 3:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5981, "total_steps": 9627, "loss": 1.8221, "learning_rate": 3.1407926600657e-05, "epoch": 0.621273501610055, "percentage": 62.13, "elapsed_time": "1 day, 21:31:59", "remaining_time": "1 day, 3:45:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5982, "total_steps": 9627, "loss": 1.6687, "learning_rate": 3.1392780978900535e-05, "epoch": 0.6213773761296354, "percentage": 62.14, "elapsed_time": "1 day, 21:32:27", "remaining_time": "1 day, 3:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5983, "total_steps": 9627, "loss": 1.719, "learning_rate": 3.1377637338667764e-05, "epoch": 0.6214812506492158, "percentage": 62.15, "elapsed_time": "1 day, 21:32:55", "remaining_time": "1 day, 3:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5984, "total_steps": 9627, "loss": 1.6722, "learning_rate": 3.136249568157136e-05, "epoch": 0.621585125168796, "percentage": 62.16, "elapsed_time": "1 day, 21:33:25", "remaining_time": "1 day, 3:44:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5985, "total_steps": 9627, "loss": 1.6432, "learning_rate": 3.1347356009223786e-05, "epoch": 0.6216889996883764, "percentage": 62.17, "elapsed_time": "1 day, 21:33:53", "remaining_time": "1 day, 3:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5986, "total_steps": 9627, "loss": 1.747, "learning_rate": 3.133221832323728e-05, "epoch": 0.6217928742079568, "percentage": 62.18, "elapsed_time": "1 day, 21:34:22", "remaining_time": "1 day, 3:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5987, "total_steps": 9627, "loss": 1.6543, "learning_rate": 3.131708262522395e-05, "epoch": 0.6218967487275371, "percentage": 62.19, "elapsed_time": "1 day, 21:34:51", "remaining_time": "1 day, 3:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5988, "total_steps": 9627, "loss": 1.5967, "learning_rate": 3.1301948916795554e-05, "epoch": 0.6220006232471175, "percentage": 62.2, "elapsed_time": "1 day, 21:35:20", "remaining_time": "1 day, 3:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5989, "total_steps": 9627, "loss": 1.647, "learning_rate": 3.128681719956375e-05, "epoch": 0.6221044977666979, "percentage": 62.21, "elapsed_time": "1 day, 21:35:49", "remaining_time": "1 day, 3:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5990, "total_steps": 9627, "loss": 1.7831, "learning_rate": 3.1271687475139966e-05, "epoch": 0.6222083722862781, "percentage": 62.22, "elapsed_time": "1 day, 21:36:17", "remaining_time": "1 day, 3:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5991, "total_steps": 9627, "loss": 1.6214, "learning_rate": 3.125655974513537e-05, "epoch": 0.6223122468058585, "percentage": 62.23, "elapsed_time": "1 day, 21:36:47", "remaining_time": "1 day, 3:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5992, "total_steps": 9627, "loss": 1.7274, "learning_rate": 3.124143401116094e-05, "epoch": 0.6224161213254389, "percentage": 62.24, "elapsed_time": "1 day, 21:37:15", "remaining_time": "1 day, 3:40:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5993, "total_steps": 9627, "loss": 1.7371, "learning_rate": 3.1226310274827473e-05, "epoch": 0.6225199958450193, "percentage": 62.25, "elapsed_time": "1 day, 21:37:45", "remaining_time": "1 day, 3:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5994, "total_steps": 9627, "loss": 1.5706, "learning_rate": 3.121118853774554e-05, "epoch": 0.6226238703645995, "percentage": 62.26, "elapsed_time": "1 day, 21:38:12", "remaining_time": "1 day, 3:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5995, "total_steps": 9627, "loss": 1.7618, "learning_rate": 3.119606880152545e-05, "epoch": 0.6227277448841799, "percentage": 62.27, "elapsed_time": "1 day, 21:38:42", "remaining_time": "1 day, 3:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5996, "total_steps": 9627, "loss": 1.6264, "learning_rate": 3.1180951067777365e-05, "epoch": 0.6228316194037603, "percentage": 62.28, "elapsed_time": "1 day, 21:39:10", "remaining_time": "1 day, 3:38:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5997, "total_steps": 9627, "loss": 1.7759, "learning_rate": 3.11658353381112e-05, "epoch": 0.6229354939233406, "percentage": 62.29, "elapsed_time": "1 day, 21:39:39", "remaining_time": "1 day, 3:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5998, "total_steps": 9627, "loss": 1.7063, "learning_rate": 3.1150721614136655e-05, "epoch": 0.623039368442921, "percentage": 62.3, "elapsed_time": "1 day, 21:40:08", "remaining_time": "1 day, 3:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5999, "total_steps": 9627, "loss": 1.4695, "learning_rate": 3.113560989746322e-05, "epoch": 0.6231432429625013, "percentage": 62.31, "elapsed_time": "1 day, 21:40:38", "remaining_time": "1 day, 3:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6000, "total_steps": 9627, "loss": 1.7207, "learning_rate": 3.11205001897002e-05, "epoch": 0.6232471174820816, "percentage": 62.32, "elapsed_time": "1 day, 21:41:07", "remaining_time": "1 day, 3:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6001, "total_steps": 9627, "loss": 1.4959, "learning_rate": 3.110539249245663e-05, "epoch": 0.623350992001662, "percentage": 62.34, "elapsed_time": "1 day, 21:41:36", "remaining_time": "1 day, 3:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6002, "total_steps": 9627, "loss": 1.7322, "learning_rate": 3.1090286807341374e-05, "epoch": 0.6234548665212424, "percentage": 62.35, "elapsed_time": "1 day, 21:42:06", "remaining_time": "1 day, 3:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6003, "total_steps": 9627, "loss": 1.8031, "learning_rate": 3.107518313596309e-05, "epoch": 0.6235587410408227, "percentage": 62.36, "elapsed_time": "1 day, 21:42:34", "remaining_time": "1 day, 3:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6004, "total_steps": 9627, "loss": 1.5662, "learning_rate": 3.106008147993017e-05, "epoch": 0.623662615560403, "percentage": 62.37, "elapsed_time": "1 day, 21:43:04", "remaining_time": "1 day, 3:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6005, "total_steps": 9627, "loss": 1.7387, "learning_rate": 3.1044981840850826e-05, "epoch": 0.6237664900799834, "percentage": 62.38, "elapsed_time": "1 day, 21:43:32", "remaining_time": "1 day, 3:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6006, "total_steps": 9627, "loss": 1.6261, "learning_rate": 3.102988422033309e-05, "epoch": 0.6238703645995637, "percentage": 62.39, "elapsed_time": "1 day, 21:44:01", "remaining_time": "1 day, 3:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6007, "total_steps": 9627, "loss": 1.8022, "learning_rate": 3.101478861998469e-05, "epoch": 0.6239742391191441, "percentage": 62.4, "elapsed_time": "1 day, 21:44:29", "remaining_time": "1 day, 3:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6008, "total_steps": 9627, "loss": 1.7152, "learning_rate": 3.09996950414132e-05, "epoch": 0.6240781136387245, "percentage": 62.41, "elapsed_time": "1 day, 21:44:58", "remaining_time": "1 day, 3:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6009, "total_steps": 9627, "loss": 1.7273, "learning_rate": 3.098460348622601e-05, "epoch": 0.6241819881583047, "percentage": 62.42, "elapsed_time": "1 day, 21:45:27", "remaining_time": "1 day, 3:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6010, "total_steps": 9627, "loss": 1.525, "learning_rate": 3.09695139560302e-05, "epoch": 0.6242858626778851, "percentage": 62.43, "elapsed_time": "1 day, 21:45:56", "remaining_time": "1 day, 3:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6011, "total_steps": 9627, "loss": 1.8, "learning_rate": 3.095442645243272e-05, "epoch": 0.6243897371974655, "percentage": 62.44, "elapsed_time": "1 day, 21:46:25", "remaining_time": "1 day, 3:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6012, "total_steps": 9627, "loss": 1.7008, "learning_rate": 3.0939340977040267e-05, "epoch": 0.6244936117170458, "percentage": 62.45, "elapsed_time": "1 day, 21:46:54", "remaining_time": "1 day, 3:31:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6013, "total_steps": 9627, "loss": 1.5997, "learning_rate": 3.092425753145931e-05, "epoch": 0.6245974862366261, "percentage": 62.46, "elapsed_time": "1 day, 21:47:22", "remaining_time": "1 day, 3:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6014, "total_steps": 9627, "loss": 1.6308, "learning_rate": 3.0909176117296126e-05, "epoch": 0.6247013607562065, "percentage": 62.47, "elapsed_time": "1 day, 21:47:51", "remaining_time": "1 day, 3:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6015, "total_steps": 9627, "loss": 1.6706, "learning_rate": 3.08940967361568e-05, "epoch": 0.6248052352757868, "percentage": 62.48, "elapsed_time": "1 day, 21:48:19", "remaining_time": "1 day, 3:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6016, "total_steps": 9627, "loss": 1.6422, "learning_rate": 3.08790193896471e-05, "epoch": 0.6249091097953672, "percentage": 62.49, "elapsed_time": "1 day, 21:48:49", "remaining_time": "1 day, 3:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6017, "total_steps": 9627, "loss": 1.6133, "learning_rate": 3.0863944079372694e-05, "epoch": 0.6250129843149476, "percentage": 62.5, "elapsed_time": "1 day, 21:49:17", "remaining_time": "1 day, 3:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6018, "total_steps": 9627, "loss": 1.741, "learning_rate": 3.0848870806938995e-05, "epoch": 0.6251168588345279, "percentage": 62.51, "elapsed_time": "1 day, 21:49:45", "remaining_time": "1 day, 3:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6019, "total_steps": 9627, "loss": 1.618, "learning_rate": 3.083379957395117e-05, "epoch": 0.6252207333541082, "percentage": 62.52, "elapsed_time": "1 day, 21:50:15", "remaining_time": "1 day, 3:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6020, "total_steps": 9627, "loss": 1.7609, "learning_rate": 3.081873038201418e-05, "epoch": 0.6253246078736886, "percentage": 62.53, "elapsed_time": "1 day, 21:50:44", "remaining_time": "1 day, 3:28:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6021, "total_steps": 9627, "loss": 1.7222, "learning_rate": 3.0803663232732775e-05, "epoch": 0.625428482393269, "percentage": 62.54, "elapsed_time": "1 day, 21:51:13", "remaining_time": "1 day, 3:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6022, "total_steps": 9627, "loss": 1.5955, "learning_rate": 3.078859812771152e-05, "epoch": 0.6255323569128493, "percentage": 62.55, "elapsed_time": "1 day, 21:51:41", "remaining_time": "1 day, 3:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6023, "total_steps": 9627, "loss": 1.6507, "learning_rate": 3.0773535068554695e-05, "epoch": 0.6256362314324296, "percentage": 62.56, "elapsed_time": "1 day, 21:52:11", "remaining_time": "1 day, 3:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6024, "total_steps": 9627, "loss": 1.6731, "learning_rate": 3.075847405686641e-05, "epoch": 0.62574010595201, "percentage": 62.57, "elapsed_time": "1 day, 21:52:38", "remaining_time": "1 day, 3:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6025, "total_steps": 9627, "loss": 1.5718, "learning_rate": 3.074341509425056e-05, "epoch": 0.6258439804715903, "percentage": 62.58, "elapsed_time": "1 day, 21:53:06", "remaining_time": "1 day, 3:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6026, "total_steps": 9627, "loss": 1.6525, "learning_rate": 3.07283581823108e-05, "epoch": 0.6259478549911707, "percentage": 62.59, "elapsed_time": "1 day, 21:53:36", "remaining_time": "1 day, 3:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6027, "total_steps": 9627, "loss": 1.6681, "learning_rate": 3.071330332265054e-05, "epoch": 0.626051729510751, "percentage": 62.61, "elapsed_time": "1 day, 21:54:04", "remaining_time": "1 day, 3:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6028, "total_steps": 9627, "loss": 1.68, "learning_rate": 3.069825051687307e-05, "epoch": 0.6261556040303313, "percentage": 62.62, "elapsed_time": "1 day, 21:54:33", "remaining_time": "1 day, 3:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6029, "total_steps": 9627, "loss": 1.7587, "learning_rate": 3.068319976658134e-05, "epoch": 0.6262594785499117, "percentage": 62.63, "elapsed_time": "1 day, 21:55:01", "remaining_time": "1 day, 3:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6030, "total_steps": 9627, "loss": 1.6564, "learning_rate": 3.066815107337815e-05, "epoch": 0.6263633530694921, "percentage": 62.64, "elapsed_time": "1 day, 21:55:31", "remaining_time": "1 day, 3:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6031, "total_steps": 9627, "loss": 1.7046, "learning_rate": 3.0653104438866104e-05, "epoch": 0.6264672275890724, "percentage": 62.65, "elapsed_time": "1 day, 21:55:59", "remaining_time": "1 day, 3:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6032, "total_steps": 9627, "loss": 1.7082, "learning_rate": 3.063805986464751e-05, "epoch": 0.6265711021086527, "percentage": 62.66, "elapsed_time": "1 day, 21:56:29", "remaining_time": "1 day, 3:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6033, "total_steps": 9627, "loss": 1.7456, "learning_rate": 3.06230173523245e-05, "epoch": 0.6266749766282331, "percentage": 62.67, "elapsed_time": "1 day, 21:56:57", "remaining_time": "1 day, 3:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6034, "total_steps": 9627, "loss": 1.5457, "learning_rate": 3.060797690349902e-05, "epoch": 0.6267788511478134, "percentage": 62.68, "elapsed_time": "1 day, 21:57:26", "remaining_time": "1 day, 3:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6035, "total_steps": 9627, "loss": 1.3377, "learning_rate": 3.0592938519772715e-05, "epoch": 0.6268827256673938, "percentage": 62.69, "elapsed_time": "1 day, 21:57:54", "remaining_time": "1 day, 3:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6036, "total_steps": 9627, "loss": 1.5863, "learning_rate": 3.057790220274707e-05, "epoch": 0.6269866001869742, "percentage": 62.7, "elapsed_time": "1 day, 21:58:24", "remaining_time": "1 day, 3:21:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6037, "total_steps": 9627, "loss": 1.6182, "learning_rate": 3.056286795402337e-05, "epoch": 0.6270904747065544, "percentage": 62.71, "elapsed_time": "1 day, 21:58:52", "remaining_time": "1 day, 3:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6038, "total_steps": 9627, "loss": 1.6674, "learning_rate": 3.0547835775202597e-05, "epoch": 0.6271943492261348, "percentage": 62.72, "elapsed_time": "1 day, 21:59:21", "remaining_time": "1 day, 3:20:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6039, "total_steps": 9627, "loss": 1.5321, "learning_rate": 3.053280566788559e-05, "epoch": 0.6272982237457152, "percentage": 62.73, "elapsed_time": "1 day, 21:59:50", "remaining_time": "1 day, 3:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6040, "total_steps": 9627, "loss": 1.5838, "learning_rate": 3.051777763367293e-05, "epoch": 0.6274020982652955, "percentage": 62.74, "elapsed_time": "1 day, 22:00:19", "remaining_time": "1 day, 3:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6041, "total_steps": 9627, "loss": 1.6502, "learning_rate": 3.0502751674164976e-05, "epoch": 0.6275059727848759, "percentage": 62.75, "elapsed_time": "1 day, 22:00:47", "remaining_time": "1 day, 3:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6042, "total_steps": 9627, "loss": 1.6534, "learning_rate": 3.0487727790961884e-05, "epoch": 0.6276098473044562, "percentage": 62.76, "elapsed_time": "1 day, 22:01:17", "remaining_time": "1 day, 3:18:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6043, "total_steps": 9627, "loss": 1.6755, "learning_rate": 3.0472705985663575e-05, "epoch": 0.6277137218240366, "percentage": 62.77, "elapsed_time": "1 day, 22:01:44", "remaining_time": "1 day, 3:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6044, "total_steps": 9627, "loss": 1.8234, "learning_rate": 3.045768625986979e-05, "epoch": 0.6278175963436169, "percentage": 62.78, "elapsed_time": "1 day, 22:02:14", "remaining_time": "1 day, 3:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6045, "total_steps": 9627, "loss": 1.794, "learning_rate": 3.0442668615179953e-05, "epoch": 0.6279214708631973, "percentage": 62.79, "elapsed_time": "1 day, 22:02:43", "remaining_time": "1 day, 3:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6046, "total_steps": 9627, "loss": 1.6738, "learning_rate": 3.0427653053193366e-05, "epoch": 0.6280253453827777, "percentage": 62.8, "elapsed_time": "1 day, 22:03:12", "remaining_time": "1 day, 3:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6047, "total_steps": 9627, "loss": 1.6268, "learning_rate": 3.0412639575509073e-05, "epoch": 0.6281292199023579, "percentage": 62.81, "elapsed_time": "1 day, 22:03:40", "remaining_time": "1 day, 3:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6048, "total_steps": 9627, "loss": 1.4388, "learning_rate": 3.0397628183725856e-05, "epoch": 0.6282330944219383, "percentage": 62.82, "elapsed_time": "1 day, 22:04:10", "remaining_time": "1 day, 3:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6049, "total_steps": 9627, "loss": 1.613, "learning_rate": 3.038261887944233e-05, "epoch": 0.6283369689415187, "percentage": 62.83, "elapsed_time": "1 day, 22:04:38", "remaining_time": "1 day, 3:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6050, "total_steps": 9627, "loss": 1.8034, "learning_rate": 3.0367611664256895e-05, "epoch": 0.628440843461099, "percentage": 62.84, "elapsed_time": "1 day, 22:05:07", "remaining_time": "1 day, 3:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6051, "total_steps": 9627, "loss": 1.669, "learning_rate": 3.0352606539767657e-05, "epoch": 0.6285447179806793, "percentage": 62.85, "elapsed_time": "1 day, 22:05:36", "remaining_time": "1 day, 3:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6052, "total_steps": 9627, "loss": 1.5992, "learning_rate": 3.033760350757258e-05, "epoch": 0.6286485925002597, "percentage": 62.86, "elapsed_time": "1 day, 22:06:05", "remaining_time": "1 day, 3:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6053, "total_steps": 9627, "loss": 1.5102, "learning_rate": 3.0322602569269355e-05, "epoch": 0.62875246701984, "percentage": 62.88, "elapsed_time": "1 day, 22:06:33", "remaining_time": "1 day, 3:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6054, "total_steps": 9627, "loss": 1.5752, "learning_rate": 3.030760372645547e-05, "epoch": 0.6288563415394204, "percentage": 62.89, "elapsed_time": "1 day, 22:07:02", "remaining_time": "1 day, 3:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6055, "total_steps": 9627, "loss": 1.715, "learning_rate": 3.0292606980728165e-05, "epoch": 0.6289602160590008, "percentage": 62.9, "elapsed_time": "1 day, 22:07:32", "remaining_time": "1 day, 3:12:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6056, "total_steps": 9627, "loss": 1.6543, "learning_rate": 3.0277612333684526e-05, "epoch": 0.629064090578581, "percentage": 62.91, "elapsed_time": "1 day, 22:08:00", "remaining_time": "1 day, 3:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6057, "total_steps": 9627, "loss": 1.7277, "learning_rate": 3.02626197869213e-05, "epoch": 0.6291679650981614, "percentage": 62.92, "elapsed_time": "1 day, 22:08:28", "remaining_time": "1 day, 3:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6058, "total_steps": 9627, "loss": 1.8181, "learning_rate": 3.024762934203511e-05, "epoch": 0.6292718396177418, "percentage": 62.93, "elapsed_time": "1 day, 22:08:57", "remaining_time": "1 day, 3:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6059, "total_steps": 9627, "loss": 1.5467, "learning_rate": 3.023264100062234e-05, "epoch": 0.6293757141373221, "percentage": 62.94, "elapsed_time": "1 day, 22:09:26", "remaining_time": "1 day, 3:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6060, "total_steps": 9627, "loss": 1.9913, "learning_rate": 3.0217654764279114e-05, "epoch": 0.6294795886569025, "percentage": 62.95, "elapsed_time": "1 day, 22:09:55", "remaining_time": "1 day, 3:10:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6061, "total_steps": 9627, "loss": 1.6593, "learning_rate": 3.0202670634601325e-05, "epoch": 0.6295834631764828, "percentage": 62.96, "elapsed_time": "1 day, 22:10:24", "remaining_time": "1 day, 3:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6062, "total_steps": 9627, "loss": 1.4867, "learning_rate": 3.0187688613184717e-05, "epoch": 0.6296873376960631, "percentage": 62.97, "elapsed_time": "1 day, 22:10:53", "remaining_time": "1 day, 3:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6063, "total_steps": 9627, "loss": 1.6254, "learning_rate": 3.0172708701624704e-05, "epoch": 0.6297912122156435, "percentage": 62.98, "elapsed_time": "1 day, 22:11:21", "remaining_time": "1 day, 3:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6064, "total_steps": 9627, "loss": 1.7055, "learning_rate": 3.0157730901516556e-05, "epoch": 0.6298950867352239, "percentage": 62.99, "elapsed_time": "1 day, 22:11:49", "remaining_time": "1 day, 3:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6065, "total_steps": 9627, "loss": 1.4714, "learning_rate": 3.014275521445531e-05, "epoch": 0.6299989612548041, "percentage": 63.0, "elapsed_time": "1 day, 22:12:19", "remaining_time": "1 day, 3:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6066, "total_steps": 9627, "loss": 1.5278, "learning_rate": 3.0127781642035725e-05, "epoch": 0.6301028357743845, "percentage": 63.01, "elapsed_time": "1 day, 22:12:47", "remaining_time": "1 day, 3:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6067, "total_steps": 9627, "loss": 1.4645, "learning_rate": 3.0112810185852393e-05, "epoch": 0.6302067102939649, "percentage": 63.02, "elapsed_time": "1 day, 22:13:17", "remaining_time": "1 day, 3:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6068, "total_steps": 9627, "loss": 1.6989, "learning_rate": 3.009784084749966e-05, "epoch": 0.6303105848135452, "percentage": 63.03, "elapsed_time": "1 day, 22:13:45", "remaining_time": "1 day, 3:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6069, "total_steps": 9627, "loss": 1.7468, "learning_rate": 3.0082873628571616e-05, "epoch": 0.6304144593331256, "percentage": 63.04, "elapsed_time": "1 day, 22:14:15", "remaining_time": "1 day, 3:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6070, "total_steps": 9627, "loss": 1.7116, "learning_rate": 3.006790853066217e-05, "epoch": 0.630518333852706, "percentage": 63.05, "elapsed_time": "1 day, 22:14:44", "remaining_time": "1 day, 3:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6071, "total_steps": 9627, "loss": 1.8164, "learning_rate": 3.0052945555364987e-05, "epoch": 0.6306222083722863, "percentage": 63.06, "elapsed_time": "1 day, 22:15:12", "remaining_time": "1 day, 3:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6072, "total_steps": 9627, "loss": 1.7011, "learning_rate": 3.0037984704273536e-05, "epoch": 0.6307260828918666, "percentage": 63.07, "elapsed_time": "1 day, 22:15:41", "remaining_time": "1 day, 3:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6073, "total_steps": 9627, "loss": 1.8097, "learning_rate": 3.0023025978980977e-05, "epoch": 0.630829957411447, "percentage": 63.08, "elapsed_time": "1 day, 22:16:09", "remaining_time": "1 day, 3:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6074, "total_steps": 9627, "loss": 1.7535, "learning_rate": 3.000806938108034e-05, "epoch": 0.6309338319310274, "percentage": 63.09, "elapsed_time": "1 day, 22:16:39", "remaining_time": "1 day, 3:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6075, "total_steps": 9627, "loss": 1.6294, "learning_rate": 2.9993114912164378e-05, "epoch": 0.6310377064506076, "percentage": 63.1, "elapsed_time": "1 day, 22:17:07", "remaining_time": "1 day, 3:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6076, "total_steps": 9627, "loss": 1.7187, "learning_rate": 2.9978162573825597e-05, "epoch": 0.631141580970188, "percentage": 63.11, "elapsed_time": "1 day, 22:17:36", "remaining_time": "1 day, 3:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6077, "total_steps": 9627, "loss": 1.7397, "learning_rate": 2.996321236765633e-05, "epoch": 0.6312454554897684, "percentage": 63.12, "elapsed_time": "1 day, 22:18:04", "remaining_time": "1 day, 3:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6078, "total_steps": 9627, "loss": 1.5252, "learning_rate": 2.994826429524867e-05, "epoch": 0.6313493300093487, "percentage": 63.13, "elapsed_time": "1 day, 22:18:34", "remaining_time": "1 day, 3:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6079, "total_steps": 9627, "loss": 1.4488, "learning_rate": 2.9933318358194427e-05, "epoch": 0.6314532045289291, "percentage": 63.15, "elapsed_time": "1 day, 22:19:02", "remaining_time": "1 day, 3:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6080, "total_steps": 9627, "loss": 1.705, "learning_rate": 2.9918374558085272e-05, "epoch": 0.6315570790485094, "percentage": 63.16, "elapsed_time": "1 day, 22:19:31", "remaining_time": "1 day, 3:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6081, "total_steps": 9627, "loss": 1.5949, "learning_rate": 2.9903432896512583e-05, "epoch": 0.6316609535680897, "percentage": 63.17, "elapsed_time": "1 day, 22:20:01", "remaining_time": "1 day, 3:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6082, "total_steps": 9627, "loss": 1.5759, "learning_rate": 2.988849337506753e-05, "epoch": 0.6317648280876701, "percentage": 63.18, "elapsed_time": "1 day, 22:20:29", "remaining_time": "1 day, 3:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6083, "total_steps": 9627, "loss": 1.6129, "learning_rate": 2.9873555995341045e-05, "epoch": 0.6318687026072505, "percentage": 63.19, "elapsed_time": "1 day, 22:20:59", "remaining_time": "1 day, 3:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6084, "total_steps": 9627, "loss": 1.6637, "learning_rate": 2.9858620758923872e-05, "epoch": 0.6319725771268307, "percentage": 63.2, "elapsed_time": "1 day, 22:21:27", "remaining_time": "1 day, 2:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6085, "total_steps": 9627, "loss": 1.7608, "learning_rate": 2.9843687667406466e-05, "epoch": 0.6320764516464111, "percentage": 63.21, "elapsed_time": "1 day, 22:21:56", "remaining_time": "1 day, 2:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6086, "total_steps": 9627, "loss": 1.5836, "learning_rate": 2.982875672237909e-05, "epoch": 0.6321803261659915, "percentage": 63.22, "elapsed_time": "1 day, 22:22:23", "remaining_time": "1 day, 2:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6087, "total_steps": 9627, "loss": 1.6473, "learning_rate": 2.9813827925431813e-05, "epoch": 0.6322842006855718, "percentage": 63.23, "elapsed_time": "1 day, 22:22:53", "remaining_time": "1 day, 2:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6088, "total_steps": 9627, "loss": 1.6633, "learning_rate": 2.9798901278154384e-05, "epoch": 0.6323880752051522, "percentage": 63.24, "elapsed_time": "1 day, 22:23:22", "remaining_time": "1 day, 2:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6089, "total_steps": 9627, "loss": 1.6624, "learning_rate": 2.9783976782136385e-05, "epoch": 0.6324919497247325, "percentage": 63.25, "elapsed_time": "1 day, 22:23:51", "remaining_time": "1 day, 2:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6090, "total_steps": 9627, "loss": 1.516, "learning_rate": 2.976905443896719e-05, "epoch": 0.6325958242443128, "percentage": 63.26, "elapsed_time": "1 day, 22:24:19", "remaining_time": "1 day, 2:57:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6091, "total_steps": 9627, "loss": 1.8359, "learning_rate": 2.975413425023587e-05, "epoch": 0.6326996987638932, "percentage": 63.27, "elapsed_time": "1 day, 22:24:49", "remaining_time": "1 day, 2:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6092, "total_steps": 9627, "loss": 1.5251, "learning_rate": 2.973921621753133e-05, "epoch": 0.6328035732834736, "percentage": 63.28, "elapsed_time": "1 day, 22:25:17", "remaining_time": "1 day, 2:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6093, "total_steps": 9627, "loss": 1.7986, "learning_rate": 2.972430034244224e-05, "epoch": 0.6329074478030539, "percentage": 63.29, "elapsed_time": "1 day, 22:25:46", "remaining_time": "1 day, 2:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6094, "total_steps": 9627, "loss": 1.6558, "learning_rate": 2.970938662655699e-05, "epoch": 0.6330113223226342, "percentage": 63.3, "elapsed_time": "1 day, 22:26:14", "remaining_time": "1 day, 2:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6095, "total_steps": 9627, "loss": 1.6296, "learning_rate": 2.9694475071463797e-05, "epoch": 0.6331151968422146, "percentage": 63.31, "elapsed_time": "1 day, 22:26:43", "remaining_time": "1 day, 2:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6096, "total_steps": 9627, "loss": 1.6559, "learning_rate": 2.9679565678750608e-05, "epoch": 0.633219071361795, "percentage": 63.32, "elapsed_time": "1 day, 22:27:12", "remaining_time": "1 day, 2:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6097, "total_steps": 9627, "loss": 1.6724, "learning_rate": 2.9664658450005195e-05, "epoch": 0.6333229458813753, "percentage": 63.33, "elapsed_time": "1 day, 22:27:40", "remaining_time": "1 day, 2:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6098, "total_steps": 9627, "loss": 1.7473, "learning_rate": 2.9649753386815017e-05, "epoch": 0.6334268204009557, "percentage": 63.34, "elapsed_time": "1 day, 22:28:10", "remaining_time": "1 day, 2:53:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6099, "total_steps": 9627, "loss": 1.7247, "learning_rate": 2.963485049076736e-05, "epoch": 0.633530694920536, "percentage": 63.35, "elapsed_time": "1 day, 22:28:38", "remaining_time": "1 day, 2:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6100, "total_steps": 9627, "loss": 1.7161, "learning_rate": 2.961994976344929e-05, "epoch": 0.6336345694401163, "percentage": 63.36, "elapsed_time": "1 day, 22:29:07", "remaining_time": "1 day, 2:52:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6101, "total_steps": 9627, "loss": 1.6737, "learning_rate": 2.9605051206447582e-05, "epoch": 0.6337384439596967, "percentage": 63.37, "elapsed_time": "1 day, 22:29:36", "remaining_time": "1 day, 2:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6102, "total_steps": 9627, "loss": 1.8074, "learning_rate": 2.959015482134885e-05, "epoch": 0.6338423184792771, "percentage": 63.38, "elapsed_time": "1 day, 22:30:05", "remaining_time": "1 day, 2:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6103, "total_steps": 9627, "loss": 1.7882, "learning_rate": 2.9575260609739423e-05, "epoch": 0.6339461929988573, "percentage": 63.39, "elapsed_time": "1 day, 22:30:34", "remaining_time": "1 day, 2:51:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6104, "total_steps": 9627, "loss": 1.6736, "learning_rate": 2.956036857320541e-05, "epoch": 0.6340500675184377, "percentage": 63.41, "elapsed_time": "1 day, 22:31:02", "remaining_time": "1 day, 2:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6105, "total_steps": 9627, "loss": 1.7257, "learning_rate": 2.9545478713332707e-05, "epoch": 0.6341539420380181, "percentage": 63.42, "elapsed_time": "1 day, 22:31:31", "remaining_time": "1 day, 2:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6106, "total_steps": 9627, "loss": 1.6384, "learning_rate": 2.9530591031706988e-05, "epoch": 0.6342578165575984, "percentage": 63.43, "elapsed_time": "1 day, 22:32:00", "remaining_time": "1 day, 2:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6107, "total_steps": 9627, "loss": 1.7593, "learning_rate": 2.9515705529913644e-05, "epoch": 0.6343616910771788, "percentage": 63.44, "elapsed_time": "1 day, 22:32:30", "remaining_time": "1 day, 2:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6108, "total_steps": 9627, "loss": 1.7383, "learning_rate": 2.9500822209537883e-05, "epoch": 0.6344655655967592, "percentage": 63.45, "elapsed_time": "1 day, 22:32:58", "remaining_time": "1 day, 2:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6109, "total_steps": 9627, "loss": 1.6363, "learning_rate": 2.9485941072164656e-05, "epoch": 0.6345694401163394, "percentage": 63.46, "elapsed_time": "1 day, 22:33:28", "remaining_time": "1 day, 2:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6110, "total_steps": 9627, "loss": 1.7249, "learning_rate": 2.9471062119378688e-05, "epoch": 0.6346733146359198, "percentage": 63.47, "elapsed_time": "1 day, 22:33:55", "remaining_time": "1 day, 2:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6111, "total_steps": 9627, "loss": 1.4506, "learning_rate": 2.9456185352764465e-05, "epoch": 0.6347771891555002, "percentage": 63.48, "elapsed_time": "1 day, 22:34:26", "remaining_time": "1 day, 2:47:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6112, "total_steps": 9627, "loss": 1.6051, "learning_rate": 2.944131077390627e-05, "epoch": 0.6348810636750805, "percentage": 63.49, "elapsed_time": "1 day, 22:34:53", "remaining_time": "1 day, 2:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6113, "total_steps": 9627, "loss": 1.7506, "learning_rate": 2.94264383843881e-05, "epoch": 0.6349849381946608, "percentage": 63.5, "elapsed_time": "1 day, 22:35:24", "remaining_time": "1 day, 2:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6114, "total_steps": 9627, "loss": 1.7382, "learning_rate": 2.9411568185793757e-05, "epoch": 0.6350888127142412, "percentage": 63.51, "elapsed_time": "1 day, 22:35:52", "remaining_time": "1 day, 2:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6115, "total_steps": 9627, "loss": 1.4555, "learning_rate": 2.939670017970683e-05, "epoch": 0.6351926872338215, "percentage": 63.52, "elapsed_time": "1 day, 22:36:22", "remaining_time": "1 day, 2:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6116, "total_steps": 9627, "loss": 1.7941, "learning_rate": 2.9381834367710616e-05, "epoch": 0.6352965617534019, "percentage": 63.53, "elapsed_time": "1 day, 22:36:50", "remaining_time": "1 day, 2:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6117, "total_steps": 9627, "loss": 1.7317, "learning_rate": 2.9366970751388196e-05, "epoch": 0.6354004362729823, "percentage": 63.54, "elapsed_time": "1 day, 22:37:20", "remaining_time": "1 day, 2:45:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6118, "total_steps": 9627, "loss": 1.652, "learning_rate": 2.9352109332322468e-05, "epoch": 0.6355043107925625, "percentage": 63.55, "elapsed_time": "1 day, 22:37:49", "remaining_time": "1 day, 2:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6119, "total_steps": 9627, "loss": 1.6144, "learning_rate": 2.9337250112096016e-05, "epoch": 0.6356081853121429, "percentage": 63.56, "elapsed_time": "1 day, 22:38:18", "remaining_time": "1 day, 2:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6120, "total_steps": 9627, "loss": 1.7013, "learning_rate": 2.9322393092291256e-05, "epoch": 0.6357120598317233, "percentage": 63.57, "elapsed_time": "1 day, 22:38:46", "remaining_time": "1 day, 2:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6121, "total_steps": 9627, "loss": 1.7454, "learning_rate": 2.9307538274490348e-05, "epoch": 0.6358159343513037, "percentage": 63.58, "elapsed_time": "1 day, 22:39:16", "remaining_time": "1 day, 2:43:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6122, "total_steps": 9627, "loss": 1.7023, "learning_rate": 2.9292685660275204e-05, "epoch": 0.635919808870884, "percentage": 63.59, "elapsed_time": "1 day, 22:39:44", "remaining_time": "1 day, 2:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6123, "total_steps": 9627, "loss": 1.7887, "learning_rate": 2.9277835251227514e-05, "epoch": 0.6360236833904643, "percentage": 63.6, "elapsed_time": "1 day, 22:40:13", "remaining_time": "1 day, 2:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6124, "total_steps": 9627, "loss": 1.8606, "learning_rate": 2.9262987048928725e-05, "epoch": 0.6361275579100447, "percentage": 63.61, "elapsed_time": "1 day, 22:40:43", "remaining_time": "1 day, 2:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6125, "total_steps": 9627, "loss": 1.5617, "learning_rate": 2.9248141054960076e-05, "epoch": 0.636231432429625, "percentage": 63.62, "elapsed_time": "1 day, 22:41:12", "remaining_time": "1 day, 2:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6126, "total_steps": 9627, "loss": 1.5637, "learning_rate": 2.9233297270902514e-05, "epoch": 0.6363353069492054, "percentage": 63.63, "elapsed_time": "1 day, 22:41:40", "remaining_time": "1 day, 2:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6127, "total_steps": 9627, "loss": 1.6716, "learning_rate": 2.921845569833681e-05, "epoch": 0.6364391814687858, "percentage": 63.64, "elapsed_time": "1 day, 22:42:10", "remaining_time": "1 day, 2:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6128, "total_steps": 9627, "loss": 1.5734, "learning_rate": 2.9203616338843486e-05, "epoch": 0.636543055988366, "percentage": 63.65, "elapsed_time": "1 day, 22:42:38", "remaining_time": "1 day, 2:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6129, "total_steps": 9627, "loss": 1.6421, "learning_rate": 2.9188779194002803e-05, "epoch": 0.6366469305079464, "percentage": 63.66, "elapsed_time": "1 day, 22:43:09", "remaining_time": "1 day, 2:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6130, "total_steps": 9627, "loss": 1.777, "learning_rate": 2.917394426539477e-05, "epoch": 0.6367508050275268, "percentage": 63.68, "elapsed_time": "1 day, 22:43:37", "remaining_time": "1 day, 2:39:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6131, "total_steps": 9627, "loss": 1.7351, "learning_rate": 2.915911155459927e-05, "epoch": 0.6368546795471071, "percentage": 63.69, "elapsed_time": "1 day, 22:44:07", "remaining_time": "1 day, 2:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6132, "total_steps": 9627, "loss": 1.7189, "learning_rate": 2.914428106319579e-05, "epoch": 0.6369585540666874, "percentage": 63.7, "elapsed_time": "1 day, 22:44:35", "remaining_time": "1 day, 2:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6133, "total_steps": 9627, "loss": 2.0055, "learning_rate": 2.912945279276371e-05, "epoch": 0.6370624285862678, "percentage": 63.71, "elapsed_time": "1 day, 22:45:05", "remaining_time": "1 day, 2:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6134, "total_steps": 9627, "loss": 1.8263, "learning_rate": 2.9114626744882128e-05, "epoch": 0.6371663031058481, "percentage": 63.72, "elapsed_time": "1 day, 22:45:33", "remaining_time": "1 day, 2:37:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6135, "total_steps": 9627, "loss": 1.7515, "learning_rate": 2.909980292112985e-05, "epoch": 0.6372701776254285, "percentage": 63.73, "elapsed_time": "1 day, 22:46:02", "remaining_time": "1 day, 2:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6136, "total_steps": 9627, "loss": 1.7123, "learning_rate": 2.9084981323085547e-05, "epoch": 0.6373740521450089, "percentage": 63.74, "elapsed_time": "1 day, 22:46:31", "remaining_time": "1 day, 2:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6137, "total_steps": 9627, "loss": 1.6792, "learning_rate": 2.90701619523276e-05, "epoch": 0.6374779266645891, "percentage": 63.75, "elapsed_time": "1 day, 22:47:00", "remaining_time": "1 day, 2:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6138, "total_steps": 9627, "loss": 1.6872, "learning_rate": 2.9055344810434137e-05, "epoch": 0.6375818011841695, "percentage": 63.76, "elapsed_time": "1 day, 22:47:30", "remaining_time": "1 day, 2:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6139, "total_steps": 9627, "loss": 1.908, "learning_rate": 2.904052989898308e-05, "epoch": 0.6376856757037499, "percentage": 63.77, "elapsed_time": "1 day, 22:48:00", "remaining_time": "1 day, 2:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6140, "total_steps": 9627, "loss": 1.6729, "learning_rate": 2.90257172195521e-05, "epoch": 0.6377895502233302, "percentage": 63.78, "elapsed_time": "1 day, 22:48:28", "remaining_time": "1 day, 2:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6141, "total_steps": 9627, "loss": 1.6487, "learning_rate": 2.9010906773718627e-05, "epoch": 0.6378934247429106, "percentage": 63.79, "elapsed_time": "1 day, 22:48:58", "remaining_time": "1 day, 2:34:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6142, "total_steps": 9627, "loss": 1.508, "learning_rate": 2.899609856305985e-05, "epoch": 0.6379972992624909, "percentage": 63.8, "elapsed_time": "1 day, 22:49:26", "remaining_time": "1 day, 2:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6143, "total_steps": 9627, "loss": 1.8111, "learning_rate": 2.8981292589152768e-05, "epoch": 0.6381011737820712, "percentage": 63.81, "elapsed_time": "1 day, 22:49:57", "remaining_time": "1 day, 2:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6144, "total_steps": 9627, "loss": 1.6826, "learning_rate": 2.8966488853574036e-05, "epoch": 0.6382050483016516, "percentage": 63.82, "elapsed_time": "1 day, 22:50:26", "remaining_time": "1 day, 2:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6145, "total_steps": 9627, "loss": 1.7693, "learning_rate": 2.8951687357900203e-05, "epoch": 0.638308922821232, "percentage": 63.83, "elapsed_time": "1 day, 22:50:54", "remaining_time": "1 day, 2:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6146, "total_steps": 9627, "loss": 1.883, "learning_rate": 2.8936888103707473e-05, "epoch": 0.6384127973408122, "percentage": 63.84, "elapsed_time": "1 day, 22:51:25", "remaining_time": "1 day, 2:32:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6147, "total_steps": 9627, "loss": 1.5675, "learning_rate": 2.8922091092571862e-05, "epoch": 0.6385166718603926, "percentage": 63.85, "elapsed_time": "1 day, 22:51:53", "remaining_time": "1 day, 2:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6148, "total_steps": 9627, "loss": 1.7282, "learning_rate": 2.8907296326069137e-05, "epoch": 0.638620546379973, "percentage": 63.86, "elapsed_time": "1 day, 22:52:23", "remaining_time": "1 day, 2:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6149, "total_steps": 9627, "loss": 1.6623, "learning_rate": 2.8892503805774806e-05, "epoch": 0.6387244208995534, "percentage": 63.87, "elapsed_time": "1 day, 22:52:52", "remaining_time": "1 day, 2:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6150, "total_steps": 9627, "loss": 1.6275, "learning_rate": 2.8877713533264217e-05, "epoch": 0.6388282954191337, "percentage": 63.88, "elapsed_time": "1 day, 22:53:21", "remaining_time": "1 day, 2:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6151, "total_steps": 9627, "loss": 1.6549, "learning_rate": 2.8862925510112327e-05, "epoch": 0.638932169938714, "percentage": 63.89, "elapsed_time": "1 day, 22:53:50", "remaining_time": "1 day, 2:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6152, "total_steps": 9627, "loss": 1.7372, "learning_rate": 2.884813973789402e-05, "epoch": 0.6390360444582944, "percentage": 63.9, "elapsed_time": "1 day, 22:54:20", "remaining_time": "1 day, 2:29:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6153, "total_steps": 9627, "loss": 1.5238, "learning_rate": 2.8833356218183843e-05, "epoch": 0.6391399189778747, "percentage": 63.91, "elapsed_time": "1 day, 22:54:49", "remaining_time": "1 day, 2:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6154, "total_steps": 9627, "loss": 1.8191, "learning_rate": 2.881857495255612e-05, "epoch": 0.6392437934974551, "percentage": 63.92, "elapsed_time": "1 day, 22:55:18", "remaining_time": "1 day, 2:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6155, "total_steps": 9627, "loss": 1.4469, "learning_rate": 2.8803795942584945e-05, "epoch": 0.6393476680170355, "percentage": 63.93, "elapsed_time": "1 day, 22:55:48", "remaining_time": "1 day, 2:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6156, "total_steps": 9627, "loss": 1.5771, "learning_rate": 2.8789019189844163e-05, "epoch": 0.6394515425366157, "percentage": 63.95, "elapsed_time": "1 day, 22:56:17", "remaining_time": "1 day, 2:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6157, "total_steps": 9627, "loss": 1.6283, "learning_rate": 2.877424469590739e-05, "epoch": 0.6395554170561961, "percentage": 63.96, "elapsed_time": "1 day, 22:56:46", "remaining_time": "1 day, 2:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6158, "total_steps": 9627, "loss": 1.6039, "learning_rate": 2.8759472462347965e-05, "epoch": 0.6396592915757765, "percentage": 63.97, "elapsed_time": "1 day, 22:57:16", "remaining_time": "1 day, 2:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6159, "total_steps": 9627, "loss": 1.6585, "learning_rate": 2.8744702490739077e-05, "epoch": 0.6397631660953568, "percentage": 63.98, "elapsed_time": "1 day, 22:57:45", "remaining_time": "1 day, 2:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6160, "total_steps": 9627, "loss": 1.6049, "learning_rate": 2.8729934782653545e-05, "epoch": 0.6398670406149372, "percentage": 63.99, "elapsed_time": "1 day, 22:58:15", "remaining_time": "1 day, 2:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6161, "total_steps": 9627, "loss": 1.4499, "learning_rate": 2.8715169339664062e-05, "epoch": 0.6399709151345175, "percentage": 64.0, "elapsed_time": "1 day, 22:58:44", "remaining_time": "1 day, 2:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6162, "total_steps": 9627, "loss": 1.7916, "learning_rate": 2.870040616334303e-05, "epoch": 0.6400747896540978, "percentage": 64.01, "elapsed_time": "1 day, 22:59:12", "remaining_time": "1 day, 2:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6163, "total_steps": 9627, "loss": 1.6107, "learning_rate": 2.8685645255262562e-05, "epoch": 0.6401786641736782, "percentage": 64.02, "elapsed_time": "1 day, 22:59:41", "remaining_time": "1 day, 2:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6164, "total_steps": 9627, "loss": 1.7303, "learning_rate": 2.867088661699464e-05, "epoch": 0.6402825386932586, "percentage": 64.03, "elapsed_time": "1 day, 23:00:10", "remaining_time": "1 day, 2:24:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6165, "total_steps": 9627, "loss": 1.5763, "learning_rate": 2.8656130250110913e-05, "epoch": 0.6403864132128388, "percentage": 64.04, "elapsed_time": "1 day, 23:00:41", "remaining_time": "1 day, 2:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6166, "total_steps": 9627, "loss": 1.6337, "learning_rate": 2.864137615618283e-05, "epoch": 0.6404902877324192, "percentage": 64.05, "elapsed_time": "1 day, 23:01:10", "remaining_time": "1 day, 2:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6167, "total_steps": 9627, "loss": 1.5719, "learning_rate": 2.862662433678158e-05, "epoch": 0.6405941622519996, "percentage": 64.06, "elapsed_time": "1 day, 23:01:39", "remaining_time": "1 day, 2:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6168, "total_steps": 9627, "loss": 1.4238, "learning_rate": 2.861187479347813e-05, "epoch": 0.6406980367715799, "percentage": 64.07, "elapsed_time": "1 day, 23:02:08", "remaining_time": "1 day, 2:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6169, "total_steps": 9627, "loss": 1.7344, "learning_rate": 2.8597127527843172e-05, "epoch": 0.6408019112911603, "percentage": 64.08, "elapsed_time": "1 day, 23:02:36", "remaining_time": "1 day, 2:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6170, "total_steps": 9627, "loss": 1.8152, "learning_rate": 2.858238254144716e-05, "epoch": 0.6409057858107406, "percentage": 64.09, "elapsed_time": "1 day, 23:03:05", "remaining_time": "1 day, 2:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6171, "total_steps": 9627, "loss": 1.612, "learning_rate": 2.8567639835860394e-05, "epoch": 0.6410096603303209, "percentage": 64.1, "elapsed_time": "1 day, 23:03:35", "remaining_time": "1 day, 2:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6172, "total_steps": 9627, "loss": 1.7688, "learning_rate": 2.8552899412652757e-05, "epoch": 0.6411135348499013, "percentage": 64.11, "elapsed_time": "1 day, 23:04:05", "remaining_time": "1 day, 2:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6173, "total_steps": 9627, "loss": 1.779, "learning_rate": 2.853816127339406e-05, "epoch": 0.6412174093694817, "percentage": 64.12, "elapsed_time": "1 day, 23:04:33", "remaining_time": "1 day, 2:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6174, "total_steps": 9627, "loss": 1.723, "learning_rate": 2.8523425419653784e-05, "epoch": 0.6413212838890621, "percentage": 64.13, "elapsed_time": "1 day, 23:05:03", "remaining_time": "1 day, 2:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6175, "total_steps": 9627, "loss": 1.74, "learning_rate": 2.8508691853001174e-05, "epoch": 0.6414251584086423, "percentage": 64.14, "elapsed_time": "1 day, 23:05:31", "remaining_time": "1 day, 2:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6176, "total_steps": 9627, "loss": 1.8088, "learning_rate": 2.8493960575005242e-05, "epoch": 0.6415290329282227, "percentage": 64.15, "elapsed_time": "1 day, 23:06:01", "remaining_time": "1 day, 2:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6177, "total_steps": 9627, "loss": 1.6215, "learning_rate": 2.8479231587234734e-05, "epoch": 0.6416329074478031, "percentage": 64.16, "elapsed_time": "1 day, 23:06:29", "remaining_time": "1 day, 2:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6178, "total_steps": 9627, "loss": 1.6694, "learning_rate": 2.8464504891258237e-05, "epoch": 0.6417367819673834, "percentage": 64.17, "elapsed_time": "1 day, 23:06:58", "remaining_time": "1 day, 2:18:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6179, "total_steps": 9627, "loss": 1.8489, "learning_rate": 2.8449780488643944e-05, "epoch": 0.6418406564869638, "percentage": 64.18, "elapsed_time": "1 day, 23:07:28", "remaining_time": "1 day, 2:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6180, "total_steps": 9627, "loss": 1.691, "learning_rate": 2.8435058380959956e-05, "epoch": 0.6419445310065441, "percentage": 64.19, "elapsed_time": "1 day, 23:07:59", "remaining_time": "1 day, 2:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6181, "total_steps": 9627, "loss": 1.7029, "learning_rate": 2.842033856977403e-05, "epoch": 0.6420484055261244, "percentage": 64.2, "elapsed_time": "1 day, 23:08:27", "remaining_time": "1 day, 2:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6182, "total_steps": 9627, "loss": 1.7289, "learning_rate": 2.840562105665372e-05, "epoch": 0.6421522800457048, "percentage": 64.22, "elapsed_time": "1 day, 23:08:56", "remaining_time": "1 day, 2:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6183, "total_steps": 9627, "loss": 1.8544, "learning_rate": 2.8390905843166326e-05, "epoch": 0.6422561545652852, "percentage": 64.23, "elapsed_time": "1 day, 23:09:26", "remaining_time": "1 day, 2:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6184, "total_steps": 9627, "loss": 1.6042, "learning_rate": 2.8376192930878898e-05, "epoch": 0.6423600290848654, "percentage": 64.24, "elapsed_time": "1 day, 23:09:55", "remaining_time": "1 day, 2:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6185, "total_steps": 9627, "loss": 1.7571, "learning_rate": 2.8361482321358256e-05, "epoch": 0.6424639036044458, "percentage": 64.25, "elapsed_time": "1 day, 23:10:23", "remaining_time": "1 day, 2:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6186, "total_steps": 9627, "loss": 1.7529, "learning_rate": 2.834677401617094e-05, "epoch": 0.6425677781240262, "percentage": 64.26, "elapsed_time": "1 day, 23:10:52", "remaining_time": "1 day, 2:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6187, "total_steps": 9627, "loss": 1.7456, "learning_rate": 2.833206801688333e-05, "epoch": 0.6426716526436065, "percentage": 64.27, "elapsed_time": "1 day, 23:11:22", "remaining_time": "1 day, 2:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6188, "total_steps": 9627, "loss": 1.5975, "learning_rate": 2.8317364325061412e-05, "epoch": 0.6427755271631869, "percentage": 64.28, "elapsed_time": "1 day, 23:11:51", "remaining_time": "1 day, 2:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6189, "total_steps": 9627, "loss": 1.6589, "learning_rate": 2.8302662942271098e-05, "epoch": 0.6428794016827672, "percentage": 64.29, "elapsed_time": "1 day, 23:12:20", "remaining_time": "1 day, 2:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6190, "total_steps": 9627, "loss": 1.7522, "learning_rate": 2.828796387007794e-05, "epoch": 0.6429832762023475, "percentage": 64.3, "elapsed_time": "1 day, 23:12:49", "remaining_time": "1 day, 2:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6191, "total_steps": 9627, "loss": 1.4194, "learning_rate": 2.8273267110047234e-05, "epoch": 0.6430871507219279, "percentage": 64.31, "elapsed_time": "1 day, 23:13:18", "remaining_time": "1 day, 2:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6192, "total_steps": 9627, "loss": 1.6241, "learning_rate": 2.8258572663744132e-05, "epoch": 0.6431910252415083, "percentage": 64.32, "elapsed_time": "1 day, 23:13:47", "remaining_time": "1 day, 2:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6193, "total_steps": 9627, "loss": 1.6012, "learning_rate": 2.824388053273344e-05, "epoch": 0.6432948997610886, "percentage": 64.33, "elapsed_time": "1 day, 23:14:17", "remaining_time": "1 day, 2:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6194, "total_steps": 9627, "loss": 1.5466, "learning_rate": 2.8229190718579777e-05, "epoch": 0.6433987742806689, "percentage": 64.34, "elapsed_time": "1 day, 23:14:45", "remaining_time": "1 day, 2:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6195, "total_steps": 9627, "loss": 1.6249, "learning_rate": 2.8214503222847477e-05, "epoch": 0.6435026488002493, "percentage": 64.35, "elapsed_time": "1 day, 23:15:16", "remaining_time": "1 day, 2:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6196, "total_steps": 9627, "loss": 1.8056, "learning_rate": 2.8199818047100656e-05, "epoch": 0.6436065233198296, "percentage": 64.36, "elapsed_time": "1 day, 23:15:44", "remaining_time": "1 day, 2:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6197, "total_steps": 9627, "loss": 1.9505, "learning_rate": 2.8185135192903163e-05, "epoch": 0.64371039783941, "percentage": 64.37, "elapsed_time": "1 day, 23:16:13", "remaining_time": "1 day, 2:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6198, "total_steps": 9627, "loss": 1.4729, "learning_rate": 2.8170454661818583e-05, "epoch": 0.6438142723589904, "percentage": 64.38, "elapsed_time": "1 day, 23:16:44", "remaining_time": "1 day, 2:09:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6199, "total_steps": 9627, "loss": 1.8712, "learning_rate": 2.815577645541033e-05, "epoch": 0.6439181468785707, "percentage": 64.39, "elapsed_time": "1 day, 23:17:12", "remaining_time": "1 day, 2:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6200, "total_steps": 9627, "loss": 1.5689, "learning_rate": 2.8141100575241498e-05, "epoch": 0.644022021398151, "percentage": 64.4, "elapsed_time": "1 day, 23:17:42", "remaining_time": "1 day, 2:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6201, "total_steps": 9627, "loss": 1.7155, "learning_rate": 2.8126427022874948e-05, "epoch": 0.6441258959177314, "percentage": 64.41, "elapsed_time": "1 day, 23:18:11", "remaining_time": "1 day, 2:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6202, "total_steps": 9627, "loss": 1.9476, "learning_rate": 2.811175579987329e-05, "epoch": 0.6442297704373118, "percentage": 64.42, "elapsed_time": "1 day, 23:18:40", "remaining_time": "1 day, 2:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6203, "total_steps": 9627, "loss": 1.6353, "learning_rate": 2.809708690779891e-05, "epoch": 0.644333644956892, "percentage": 64.43, "elapsed_time": "1 day, 23:19:10", "remaining_time": "1 day, 2:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6204, "total_steps": 9627, "loss": 1.5309, "learning_rate": 2.8082420348213922e-05, "epoch": 0.6444375194764724, "percentage": 64.44, "elapsed_time": "1 day, 23:19:39", "remaining_time": "1 day, 2:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6205, "total_steps": 9627, "loss": 1.5944, "learning_rate": 2.806775612268019e-05, "epoch": 0.6445413939960528, "percentage": 64.45, "elapsed_time": "1 day, 23:20:08", "remaining_time": "1 day, 2:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6206, "total_steps": 9627, "loss": 1.5079, "learning_rate": 2.8053094232759393e-05, "epoch": 0.6446452685156331, "percentage": 64.46, "elapsed_time": "1 day, 23:20:38", "remaining_time": "1 day, 2:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6207, "total_steps": 9627, "loss": 1.7176, "learning_rate": 2.8038434680012814e-05, "epoch": 0.6447491430352135, "percentage": 64.47, "elapsed_time": "1 day, 23:21:07", "remaining_time": "1 day, 2:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6208, "total_steps": 9627, "loss": 1.7649, "learning_rate": 2.8023777466001666e-05, "epoch": 0.6448530175547939, "percentage": 64.49, "elapsed_time": "1 day, 23:21:36", "remaining_time": "1 day, 2:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6209, "total_steps": 9627, "loss": 1.6787, "learning_rate": 2.8009122592286795e-05, "epoch": 0.6449568920743741, "percentage": 64.5, "elapsed_time": "1 day, 23:22:05", "remaining_time": "1 day, 2:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6210, "total_steps": 9627, "loss": 1.626, "learning_rate": 2.7994470060428834e-05, "epoch": 0.6450607665939545, "percentage": 64.51, "elapsed_time": "1 day, 23:22:34", "remaining_time": "1 day, 2:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6211, "total_steps": 9627, "loss": 1.6221, "learning_rate": 2.7979819871988166e-05, "epoch": 0.6451646411135349, "percentage": 64.52, "elapsed_time": "1 day, 23:23:05", "remaining_time": "1 day, 2:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6212, "total_steps": 9627, "loss": 1.6874, "learning_rate": 2.796517202852491e-05, "epoch": 0.6452685156331152, "percentage": 64.53, "elapsed_time": "1 day, 23:23:33", "remaining_time": "1 day, 2:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6213, "total_steps": 9627, "loss": 1.6113, "learning_rate": 2.795052653159896e-05, "epoch": 0.6453723901526955, "percentage": 64.54, "elapsed_time": "1 day, 23:24:02", "remaining_time": "1 day, 2:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6214, "total_steps": 9627, "loss": 1.5794, "learning_rate": 2.7935883382769918e-05, "epoch": 0.6454762646722759, "percentage": 64.55, "elapsed_time": "1 day, 23:24:32", "remaining_time": "1 day, 2:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6215, "total_steps": 9627, "loss": 1.716, "learning_rate": 2.7921242583597228e-05, "epoch": 0.6455801391918562, "percentage": 64.56, "elapsed_time": "1 day, 23:25:02", "remaining_time": "1 day, 2:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6216, "total_steps": 9627, "loss": 1.6549, "learning_rate": 2.7906604135639945e-05, "epoch": 0.6456840137114366, "percentage": 64.57, "elapsed_time": "1 day, 23:25:31", "remaining_time": "1 day, 2:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6217, "total_steps": 9627, "loss": 1.7255, "learning_rate": 2.7891968040457007e-05, "epoch": 0.645787888231017, "percentage": 64.58, "elapsed_time": "1 day, 23:26:01", "remaining_time": "1 day, 2:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6218, "total_steps": 9627, "loss": 1.993, "learning_rate": 2.7877334299607037e-05, "epoch": 0.6458917627505972, "percentage": 64.59, "elapsed_time": "1 day, 23:26:31", "remaining_time": "1 day, 2:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6219, "total_steps": 9627, "loss": 1.6315, "learning_rate": 2.7862702914648364e-05, "epoch": 0.6459956372701776, "percentage": 64.6, "elapsed_time": "1 day, 23:27:00", "remaining_time": "1 day, 2:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6220, "total_steps": 9627, "loss": 1.521, "learning_rate": 2.784807388713918e-05, "epoch": 0.646099511789758, "percentage": 64.61, "elapsed_time": "1 day, 23:27:30", "remaining_time": "1 day, 1:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6221, "total_steps": 9627, "loss": 1.6055, "learning_rate": 2.7833447218637332e-05, "epoch": 0.6462033863093383, "percentage": 64.62, "elapsed_time": "1 day, 23:28:00", "remaining_time": "1 day, 1:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6222, "total_steps": 9627, "loss": 1.6364, "learning_rate": 2.7818822910700442e-05, "epoch": 0.6463072608289187, "percentage": 64.63, "elapsed_time": "1 day, 23:28:28", "remaining_time": "1 day, 1:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6223, "total_steps": 9627, "loss": 1.6882, "learning_rate": 2.7804200964885897e-05, "epoch": 0.646411135348499, "percentage": 64.64, "elapsed_time": "1 day, 23:28:58", "remaining_time": "1 day, 1:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6224, "total_steps": 9627, "loss": 1.6535, "learning_rate": 2.7789581382750794e-05, "epoch": 0.6465150098680794, "percentage": 64.65, "elapsed_time": "1 day, 23:29:27", "remaining_time": "1 day, 1:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6225, "total_steps": 9627, "loss": 1.5526, "learning_rate": 2.777496416585207e-05, "epoch": 0.6466188843876597, "percentage": 64.66, "elapsed_time": "1 day, 23:29:58", "remaining_time": "1 day, 1:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6226, "total_steps": 9627, "loss": 1.6387, "learning_rate": 2.776034931574626e-05, "epoch": 0.6467227589072401, "percentage": 64.67, "elapsed_time": "1 day, 23:30:26", "remaining_time": "1 day, 1:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6227, "total_steps": 9627, "loss": 1.7418, "learning_rate": 2.7745736833989788e-05, "epoch": 0.6468266334268205, "percentage": 64.68, "elapsed_time": "1 day, 23:30:55", "remaining_time": "1 day, 1:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6228, "total_steps": 9627, "loss": 1.7758, "learning_rate": 2.7731126722138756e-05, "epoch": 0.6469305079464007, "percentage": 64.69, "elapsed_time": "1 day, 23:31:26", "remaining_time": "1 day, 1:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6229, "total_steps": 9627, "loss": 1.7876, "learning_rate": 2.7716518981749022e-05, "epoch": 0.6470343824659811, "percentage": 64.7, "elapsed_time": "1 day, 23:31:56", "remaining_time": "1 day, 1:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6230, "total_steps": 9627, "loss": 1.5814, "learning_rate": 2.77019136143762e-05, "epoch": 0.6471382569855615, "percentage": 64.71, "elapsed_time": "1 day, 23:32:25", "remaining_time": "1 day, 1:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6231, "total_steps": 9627, "loss": 1.6095, "learning_rate": 2.7687310621575646e-05, "epoch": 0.6472421315051418, "percentage": 64.72, "elapsed_time": "1 day, 23:32:53", "remaining_time": "1 day, 1:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6232, "total_steps": 9627, "loss": 1.5995, "learning_rate": 2.767271000490247e-05, "epoch": 0.6473460060247221, "percentage": 64.73, "elapsed_time": "1 day, 23:33:24", "remaining_time": "1 day, 1:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6233, "total_steps": 9627, "loss": 1.8424, "learning_rate": 2.7658111765911486e-05, "epoch": 0.6474498805443025, "percentage": 64.74, "elapsed_time": "1 day, 23:33:52", "remaining_time": "1 day, 1:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6234, "total_steps": 9627, "loss": 1.544, "learning_rate": 2.764351590615738e-05, "epoch": 0.6475537550638828, "percentage": 64.76, "elapsed_time": "1 day, 23:34:23", "remaining_time": "1 day, 1:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6235, "total_steps": 9627, "loss": 1.6898, "learning_rate": 2.762892242719439e-05, "epoch": 0.6476576295834632, "percentage": 64.77, "elapsed_time": "1 day, 23:34:51", "remaining_time": "1 day, 1:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6236, "total_steps": 9627, "loss": 1.4979, "learning_rate": 2.7614331330576694e-05, "epoch": 0.6477615041030436, "percentage": 64.78, "elapsed_time": "1 day, 23:35:22", "remaining_time": "1 day, 1:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6237, "total_steps": 9627, "loss": 1.8237, "learning_rate": 2.7599742617858088e-05, "epoch": 0.6478653786226238, "percentage": 64.79, "elapsed_time": "1 day, 23:35:51", "remaining_time": "1 day, 1:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6238, "total_steps": 9627, "loss": 1.482, "learning_rate": 2.7585156290592164e-05, "epoch": 0.6479692531422042, "percentage": 64.8, "elapsed_time": "1 day, 23:36:19", "remaining_time": "1 day, 1:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6239, "total_steps": 9627, "loss": 1.7348, "learning_rate": 2.7570572350332258e-05, "epoch": 0.6480731276617846, "percentage": 64.81, "elapsed_time": "1 day, 23:36:48", "remaining_time": "1 day, 1:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6240, "total_steps": 9627, "loss": 1.6357, "learning_rate": 2.7555990798631436e-05, "epoch": 0.6481770021813649, "percentage": 64.82, "elapsed_time": "1 day, 23:37:19", "remaining_time": "1 day, 1:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6241, "total_steps": 9627, "loss": 1.8034, "learning_rate": 2.7541411637042526e-05, "epoch": 0.6482808767009453, "percentage": 64.83, "elapsed_time": "1 day, 23:37:48", "remaining_time": "1 day, 1:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6242, "total_steps": 9627, "loss": 1.6212, "learning_rate": 2.752683486711807e-05, "epoch": 0.6483847512205256, "percentage": 64.84, "elapsed_time": "1 day, 23:38:17", "remaining_time": "1 day, 1:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6243, "total_steps": 9627, "loss": 1.5956, "learning_rate": 2.7512260490410448e-05, "epoch": 0.6484886257401059, "percentage": 64.85, "elapsed_time": "1 day, 23:38:47", "remaining_time": "1 day, 1:49:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6244, "total_steps": 9627, "loss": 1.5114, "learning_rate": 2.7497688508471625e-05, "epoch": 0.6485925002596863, "percentage": 64.86, "elapsed_time": "1 day, 23:39:16", "remaining_time": "1 day, 1:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6245, "total_steps": 9627, "loss": 1.4739, "learning_rate": 2.748311892285348e-05, "epoch": 0.6486963747792667, "percentage": 64.87, "elapsed_time": "1 day, 23:39:46", "remaining_time": "1 day, 1:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6246, "total_steps": 9627, "loss": 1.5095, "learning_rate": 2.746855173510754e-05, "epoch": 0.6488002492988469, "percentage": 64.88, "elapsed_time": "1 day, 23:40:14", "remaining_time": "1 day, 1:48:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6247, "total_steps": 9627, "loss": 1.8714, "learning_rate": 2.745398694678506e-05, "epoch": 0.6489041238184273, "percentage": 64.89, "elapsed_time": "1 day, 23:40:44", "remaining_time": "1 day, 1:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6248, "total_steps": 9627, "loss": 1.7226, "learning_rate": 2.7439424559437122e-05, "epoch": 0.6490079983380077, "percentage": 64.9, "elapsed_time": "1 day, 23:41:13", "remaining_time": "1 day, 1:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6249, "total_steps": 9627, "loss": 1.5442, "learning_rate": 2.7424864574614484e-05, "epoch": 0.649111872857588, "percentage": 64.91, "elapsed_time": "1 day, 23:41:42", "remaining_time": "1 day, 1:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6250, "total_steps": 9627, "loss": 1.713, "learning_rate": 2.7410306993867675e-05, "epoch": 0.6492157473771684, "percentage": 64.92, "elapsed_time": "1 day, 23:42:12", "remaining_time": "1 day, 1:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6251, "total_steps": 9627, "loss": 1.6123, "learning_rate": 2.7395751818746972e-05, "epoch": 0.6493196218967487, "percentage": 64.93, "elapsed_time": "1 day, 23:42:42", "remaining_time": "1 day, 1:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6252, "total_steps": 9627, "loss": 1.642, "learning_rate": 2.738119905080235e-05, "epoch": 0.6494234964163291, "percentage": 64.94, "elapsed_time": "1 day, 23:43:10", "remaining_time": "1 day, 1:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6253, "total_steps": 9627, "loss": 1.4608, "learning_rate": 2.7366648691583646e-05, "epoch": 0.6495273709359094, "percentage": 64.95, "elapsed_time": "1 day, 23:43:40", "remaining_time": "1 day, 1:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6254, "total_steps": 9627, "loss": 1.5948, "learning_rate": 2.735210074264027e-05, "epoch": 0.6496312454554898, "percentage": 64.96, "elapsed_time": "1 day, 23:44:09", "remaining_time": "1 day, 1:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6255, "total_steps": 9627, "loss": 1.5191, "learning_rate": 2.7337555205521514e-05, "epoch": 0.6497351199750702, "percentage": 64.97, "elapsed_time": "1 day, 23:44:40", "remaining_time": "1 day, 1:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6256, "total_steps": 9627, "loss": 1.5952, "learning_rate": 2.7323012081776368e-05, "epoch": 0.6498389944946504, "percentage": 64.98, "elapsed_time": "1 day, 23:45:09", "remaining_time": "1 day, 1:43:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6257, "total_steps": 9627, "loss": 1.644, "learning_rate": 2.7308471372953538e-05, "epoch": 0.6499428690142308, "percentage": 64.99, "elapsed_time": "1 day, 23:45:38", "remaining_time": "1 day, 1:43:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6258, "total_steps": 9627, "loss": 1.7363, "learning_rate": 2.7293933080601507e-05, "epoch": 0.6500467435338112, "percentage": 65.0, "elapsed_time": "1 day, 23:46:07", "remaining_time": "1 day, 1:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6259, "total_steps": 9627, "loss": 1.7536, "learning_rate": 2.727939720626849e-05, "epoch": 0.6501506180533915, "percentage": 65.02, "elapsed_time": "1 day, 23:46:37", "remaining_time": "1 day, 1:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6260, "total_steps": 9627, "loss": 1.8819, "learning_rate": 2.7264863751502446e-05, "epoch": 0.6502544925729719, "percentage": 65.03, "elapsed_time": "1 day, 23:47:06", "remaining_time": "1 day, 1:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6261, "total_steps": 9627, "loss": 1.6615, "learning_rate": 2.725033271785105e-05, "epoch": 0.6503583670925522, "percentage": 65.04, "elapsed_time": "1 day, 23:47:35", "remaining_time": "1 day, 1:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6262, "total_steps": 9627, "loss": 1.5312, "learning_rate": 2.7235804106861807e-05, "epoch": 0.6504622416121325, "percentage": 65.05, "elapsed_time": "1 day, 23:48:05", "remaining_time": "1 day, 1:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6263, "total_steps": 9627, "loss": 1.8898, "learning_rate": 2.7221277920081818e-05, "epoch": 0.6505661161317129, "percentage": 65.06, "elapsed_time": "1 day, 23:48:35", "remaining_time": "1 day, 1:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6264, "total_steps": 9627, "loss": 1.779, "learning_rate": 2.720675415905807e-05, "epoch": 0.6506699906512933, "percentage": 65.07, "elapsed_time": "1 day, 23:49:03", "remaining_time": "1 day, 1:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6265, "total_steps": 9627, "loss": 1.6765, "learning_rate": 2.7192232825337206e-05, "epoch": 0.6507738651708735, "percentage": 65.08, "elapsed_time": "1 day, 23:49:33", "remaining_time": "1 day, 1:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6266, "total_steps": 9627, "loss": 1.631, "learning_rate": 2.7177713920465643e-05, "epoch": 0.6508777396904539, "percentage": 65.09, "elapsed_time": "1 day, 23:50:03", "remaining_time": "1 day, 1:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6267, "total_steps": 9627, "loss": 1.5956, "learning_rate": 2.7163197445989518e-05, "epoch": 0.6509816142100343, "percentage": 65.1, "elapsed_time": "1 day, 23:50:33", "remaining_time": "1 day, 1:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6268, "total_steps": 9627, "loss": 1.5979, "learning_rate": 2.7148683403454746e-05, "epoch": 0.6510854887296146, "percentage": 65.11, "elapsed_time": "1 day, 23:51:01", "remaining_time": "1 day, 1:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6269, "total_steps": 9627, "loss": 1.546, "learning_rate": 2.7134171794406932e-05, "epoch": 0.651189363249195, "percentage": 65.12, "elapsed_time": "1 day, 23:51:31", "remaining_time": "1 day, 1:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6270, "total_steps": 9627, "loss": 1.7254, "learning_rate": 2.711966262039145e-05, "epoch": 0.6512932377687753, "percentage": 65.13, "elapsed_time": "1 day, 23:52:02", "remaining_time": "1 day, 1:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6271, "total_steps": 9627, "loss": 1.7585, "learning_rate": 2.710515588295346e-05, "epoch": 0.6513971122883556, "percentage": 65.14, "elapsed_time": "1 day, 23:52:30", "remaining_time": "1 day, 1:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6272, "total_steps": 9627, "loss": 1.5776, "learning_rate": 2.709065158363774e-05, "epoch": 0.651500986807936, "percentage": 65.15, "elapsed_time": "1 day, 23:53:01", "remaining_time": "1 day, 1:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6273, "total_steps": 9627, "loss": 1.7011, "learning_rate": 2.7076149723988954e-05, "epoch": 0.6516048613275164, "percentage": 65.16, "elapsed_time": "1 day, 23:53:30", "remaining_time": "1 day, 1:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6274, "total_steps": 9627, "loss": 1.7816, "learning_rate": 2.7061650305551424e-05, "epoch": 0.6517087358470967, "percentage": 65.17, "elapsed_time": "1 day, 23:54:00", "remaining_time": "1 day, 1:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6275, "total_steps": 9627, "loss": 1.8013, "learning_rate": 2.7047153329869167e-05, "epoch": 0.651812610366677, "percentage": 65.18, "elapsed_time": "1 day, 23:54:30", "remaining_time": "1 day, 1:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6276, "total_steps": 9627, "loss": 1.4257, "learning_rate": 2.7032658798486072e-05, "epoch": 0.6519164848862574, "percentage": 65.19, "elapsed_time": "1 day, 23:55:00", "remaining_time": "1 day, 1:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6277, "total_steps": 9627, "loss": 1.732, "learning_rate": 2.7018166712945635e-05, "epoch": 0.6520203594058378, "percentage": 65.2, "elapsed_time": "1 day, 23:55:28", "remaining_time": "1 day, 1:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6278, "total_steps": 9627, "loss": 1.7406, "learning_rate": 2.700367707479122e-05, "epoch": 0.6521242339254181, "percentage": 65.21, "elapsed_time": "1 day, 23:55:59", "remaining_time": "1 day, 1:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6279, "total_steps": 9627, "loss": 1.7469, "learning_rate": 2.6989189885565803e-05, "epoch": 0.6522281084449985, "percentage": 65.22, "elapsed_time": "1 day, 23:56:29", "remaining_time": "1 day, 1:33:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6280, "total_steps": 9627, "loss": 1.6946, "learning_rate": 2.697470514681214e-05, "epoch": 0.6523319829645788, "percentage": 65.23, "elapsed_time": "1 day, 23:56:57", "remaining_time": "1 day, 1:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6281, "total_steps": 9627, "loss": 1.5709, "learning_rate": 2.6960222860072826e-05, "epoch": 0.6524358574841591, "percentage": 65.24, "elapsed_time": "1 day, 23:57:27", "remaining_time": "1 day, 1:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6282, "total_steps": 9627, "loss": 1.4393, "learning_rate": 2.6945743026890012e-05, "epoch": 0.6525397320037395, "percentage": 65.25, "elapsed_time": "1 day, 23:57:56", "remaining_time": "1 day, 1:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6283, "total_steps": 9627, "loss": 1.68, "learning_rate": 2.693126564880576e-05, "epoch": 0.6526436065233199, "percentage": 65.26, "elapsed_time": "1 day, 23:58:26", "remaining_time": "1 day, 1:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6284, "total_steps": 9627, "loss": 1.6189, "learning_rate": 2.6916790727361773e-05, "epoch": 0.6527474810429001, "percentage": 65.27, "elapsed_time": "1 day, 23:58:56", "remaining_time": "1 day, 1:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6285, "total_steps": 9627, "loss": 1.8985, "learning_rate": 2.6902318264099517e-05, "epoch": 0.6528513555624805, "percentage": 65.29, "elapsed_time": "1 day, 23:59:25", "remaining_time": "1 day, 1:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6286, "total_steps": 9627, "loss": 1.7447, "learning_rate": 2.68878482605602e-05, "epoch": 0.6529552300820609, "percentage": 65.3, "elapsed_time": "1 day, 23:59:54", "remaining_time": "1 day, 1:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6287, "total_steps": 9627, "loss": 1.5522, "learning_rate": 2.6873380718284757e-05, "epoch": 0.6530591046016412, "percentage": 65.31, "elapsed_time": "2 days, 0:00:25", "remaining_time": "1 day, 1:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6288, "total_steps": 9627, "loss": 1.8171, "learning_rate": 2.6858915638813874e-05, "epoch": 0.6531629791212216, "percentage": 65.32, "elapsed_time": "2 days, 0:00:53", "remaining_time": "1 day, 1:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6289, "total_steps": 9627, "loss": 1.5586, "learning_rate": 2.6844453023687956e-05, "epoch": 0.653266853640802, "percentage": 65.33, "elapsed_time": "2 days, 0:01:22", "remaining_time": "1 day, 1:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6290, "total_steps": 9627, "loss": 1.8163, "learning_rate": 2.6829992874447196e-05, "epoch": 0.6533707281603822, "percentage": 65.34, "elapsed_time": "2 days, 0:01:52", "remaining_time": "1 day, 1:28:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6291, "total_steps": 9627, "loss": 1.4798, "learning_rate": 2.6815535192631437e-05, "epoch": 0.6534746026799626, "percentage": 65.35, "elapsed_time": "2 days, 0:02:20", "remaining_time": "1 day, 1:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6292, "total_steps": 9627, "loss": 1.7423, "learning_rate": 2.6801079979780343e-05, "epoch": 0.653578477199543, "percentage": 65.36, "elapsed_time": "2 days, 0:02:50", "remaining_time": "1 day, 1:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6293, "total_steps": 9627, "loss": 1.7352, "learning_rate": 2.6786627237433275e-05, "epoch": 0.6536823517191233, "percentage": 65.37, "elapsed_time": "2 days, 0:03:20", "remaining_time": "1 day, 1:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6294, "total_steps": 9627, "loss": 1.892, "learning_rate": 2.6772176967129336e-05, "epoch": 0.6537862262387036, "percentage": 65.38, "elapsed_time": "2 days, 0:03:49", "remaining_time": "1 day, 1:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6295, "total_steps": 9627, "loss": 1.7635, "learning_rate": 2.6757729170407368e-05, "epoch": 0.653890100758284, "percentage": 65.39, "elapsed_time": "2 days, 0:04:19", "remaining_time": "1 day, 1:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6296, "total_steps": 9627, "loss": 1.7023, "learning_rate": 2.6743283848805945e-05, "epoch": 0.6539939752778643, "percentage": 65.4, "elapsed_time": "2 days, 0:04:47", "remaining_time": "1 day, 1:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6297, "total_steps": 9627, "loss": 1.6528, "learning_rate": 2.672884100386338e-05, "epoch": 0.6540978497974447, "percentage": 65.41, "elapsed_time": "2 days, 0:05:17", "remaining_time": "1 day, 1:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6298, "total_steps": 9627, "loss": 1.7864, "learning_rate": 2.6714400637117708e-05, "epoch": 0.6542017243170251, "percentage": 65.42, "elapsed_time": "2 days, 0:05:46", "remaining_time": "1 day, 1:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6299, "total_steps": 9627, "loss": 1.7531, "learning_rate": 2.669996275010678e-05, "epoch": 0.6543055988366053, "percentage": 65.43, "elapsed_time": "2 days, 0:06:15", "remaining_time": "1 day, 1:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6300, "total_steps": 9627, "loss": 1.7993, "learning_rate": 2.6685527344368022e-05, "epoch": 0.6544094733561857, "percentage": 65.44, "elapsed_time": "2 days, 0:06:45", "remaining_time": "1 day, 1:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6301, "total_steps": 9627, "loss": 1.7012, "learning_rate": 2.667109442143877e-05, "epoch": 0.6545133478757661, "percentage": 65.45, "elapsed_time": "2 days, 0:07:14", "remaining_time": "1 day, 1:24:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6302, "total_steps": 9627, "loss": 1.6973, "learning_rate": 2.665666398285599e-05, "epoch": 0.6546172223953465, "percentage": 65.46, "elapsed_time": "2 days, 0:07:44", "remaining_time": "1 day, 1:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6303, "total_steps": 9627, "loss": 1.6828, "learning_rate": 2.6642236030156405e-05, "epoch": 0.6547210969149267, "percentage": 65.47, "elapsed_time": "2 days, 0:08:12", "remaining_time": "1 day, 1:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6304, "total_steps": 9627, "loss": 1.7191, "learning_rate": 2.6627810564876488e-05, "epoch": 0.6548249714345071, "percentage": 65.48, "elapsed_time": "2 days, 0:08:42", "remaining_time": "1 day, 1:22:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6305, "total_steps": 9627, "loss": 1.6014, "learning_rate": 2.6613387588552406e-05, "epoch": 0.6549288459540875, "percentage": 65.49, "elapsed_time": "2 days, 0:09:11", "remaining_time": "1 day, 1:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6306, "total_steps": 9627, "loss": 1.794, "learning_rate": 2.6598967102720174e-05, "epoch": 0.6550327204736678, "percentage": 65.5, "elapsed_time": "2 days, 0:09:40", "remaining_time": "1 day, 1:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6307, "total_steps": 9627, "loss": 1.697, "learning_rate": 2.658454910891539e-05, "epoch": 0.6551365949932482, "percentage": 65.51, "elapsed_time": "2 days, 0:10:09", "remaining_time": "1 day, 1:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6308, "total_steps": 9627, "loss": 1.5579, "learning_rate": 2.657013360867346e-05, "epoch": 0.6552404695128285, "percentage": 65.52, "elapsed_time": "2 days, 0:10:39", "remaining_time": "1 day, 1:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6309, "total_steps": 9627, "loss": 1.61, "learning_rate": 2.6555720603529578e-05, "epoch": 0.6553443440324088, "percentage": 65.53, "elapsed_time": "2 days, 0:11:09", "remaining_time": "1 day, 1:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6310, "total_steps": 9627, "loss": 1.4753, "learning_rate": 2.6541310095018533e-05, "epoch": 0.6554482185519892, "percentage": 65.54, "elapsed_time": "2 days, 0:11:39", "remaining_time": "1 day, 1:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6311, "total_steps": 9627, "loss": 1.7289, "learning_rate": 2.6526902084675008e-05, "epoch": 0.6555520930715696, "percentage": 65.56, "elapsed_time": "2 days, 0:12:07", "remaining_time": "1 day, 1:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6312, "total_steps": 9627, "loss": 1.5964, "learning_rate": 2.6512496574033307e-05, "epoch": 0.6556559675911499, "percentage": 65.57, "elapsed_time": "2 days, 0:12:37", "remaining_time": "1 day, 1:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6313, "total_steps": 9627, "loss": 1.5983, "learning_rate": 2.6498093564627515e-05, "epoch": 0.6557598421107302, "percentage": 65.58, "elapsed_time": "2 days, 0:13:07", "remaining_time": "1 day, 1:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6314, "total_steps": 9627, "loss": 1.719, "learning_rate": 2.6483693057991433e-05, "epoch": 0.6558637166303106, "percentage": 65.59, "elapsed_time": "2 days, 0:13:36", "remaining_time": "1 day, 1:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6315, "total_steps": 9627, "loss": 1.7625, "learning_rate": 2.646929505565861e-05, "epoch": 0.6559675911498909, "percentage": 65.6, "elapsed_time": "2 days, 0:14:05", "remaining_time": "1 day, 1:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6316, "total_steps": 9627, "loss": 1.6035, "learning_rate": 2.6454899559162316e-05, "epoch": 0.6560714656694713, "percentage": 65.61, "elapsed_time": "2 days, 0:14:34", "remaining_time": "1 day, 1:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6317, "total_steps": 9627, "loss": 1.8204, "learning_rate": 2.644050657003554e-05, "epoch": 0.6561753401890517, "percentage": 65.62, "elapsed_time": "2 days, 0:15:04", "remaining_time": "1 day, 1:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6318, "total_steps": 9627, "loss": 1.5586, "learning_rate": 2.642611608981108e-05, "epoch": 0.6562792147086319, "percentage": 65.63, "elapsed_time": "2 days, 0:15:33", "remaining_time": "1 day, 1:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6319, "total_steps": 9627, "loss": 1.9185, "learning_rate": 2.641172812002134e-05, "epoch": 0.6563830892282123, "percentage": 65.64, "elapsed_time": "2 days, 0:16:03", "remaining_time": "1 day, 1:16:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6320, "total_steps": 9627, "loss": 1.7196, "learning_rate": 2.6397342662198578e-05, "epoch": 0.6564869637477927, "percentage": 65.65, "elapsed_time": "2 days, 0:16:32", "remaining_time": "1 day, 1:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6321, "total_steps": 9627, "loss": 1.7506, "learning_rate": 2.638295971787471e-05, "epoch": 0.656590838267373, "percentage": 65.66, "elapsed_time": "2 days, 0:17:02", "remaining_time": "1 day, 1:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6322, "total_steps": 9627, "loss": 1.5984, "learning_rate": 2.6368579288581414e-05, "epoch": 0.6566947127869533, "percentage": 65.67, "elapsed_time": "2 days, 0:17:30", "remaining_time": "1 day, 1:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6323, "total_steps": 9627, "loss": 1.5823, "learning_rate": 2.635420137585009e-05, "epoch": 0.6567985873065337, "percentage": 65.68, "elapsed_time": "2 days, 0:17:59", "remaining_time": "1 day, 1:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6324, "total_steps": 9627, "loss": 1.8616, "learning_rate": 2.6339825981211873e-05, "epoch": 0.656902461826114, "percentage": 65.69, "elapsed_time": "2 days, 0:18:28", "remaining_time": "1 day, 1:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6325, "total_steps": 9627, "loss": 1.4848, "learning_rate": 2.632545310619764e-05, "epoch": 0.6570063363456944, "percentage": 65.7, "elapsed_time": "2 days, 0:18:59", "remaining_time": "1 day, 1:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6326, "total_steps": 9627, "loss": 1.4897, "learning_rate": 2.6311082752337957e-05, "epoch": 0.6571102108652748, "percentage": 65.71, "elapsed_time": "2 days, 0:19:27", "remaining_time": "1 day, 1:12:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6327, "total_steps": 9627, "loss": 1.5465, "learning_rate": 2.6296714921163224e-05, "epoch": 0.657214085384855, "percentage": 65.72, "elapsed_time": "2 days, 0:19:57", "remaining_time": "1 day, 1:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6328, "total_steps": 9627, "loss": 1.4289, "learning_rate": 2.6282349614203415e-05, "epoch": 0.6573179599044354, "percentage": 65.73, "elapsed_time": "2 days, 0:20:25", "remaining_time": "1 day, 1:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6329, "total_steps": 9627, "loss": 1.64, "learning_rate": 2.626798683298839e-05, "epoch": 0.6574218344240158, "percentage": 65.74, "elapsed_time": "2 days, 0:20:56", "remaining_time": "1 day, 1:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6330, "total_steps": 9627, "loss": 1.4736, "learning_rate": 2.6253626579047654e-05, "epoch": 0.6575257089435962, "percentage": 65.75, "elapsed_time": "2 days, 0:21:25", "remaining_time": "1 day, 1:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6331, "total_steps": 9627, "loss": 1.5444, "learning_rate": 2.6239268853910452e-05, "epoch": 0.6576295834631765, "percentage": 65.76, "elapsed_time": "2 days, 0:21:54", "remaining_time": "1 day, 1:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6332, "total_steps": 9627, "loss": 1.5782, "learning_rate": 2.6224913659105775e-05, "epoch": 0.6577334579827568, "percentage": 65.77, "elapsed_time": "2 days, 0:22:25", "remaining_time": "1 day, 1:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6333, "total_steps": 9627, "loss": 1.5784, "learning_rate": 2.621056099616233e-05, "epoch": 0.6578373325023372, "percentage": 65.78, "elapsed_time": "2 days, 0:22:55", "remaining_time": "1 day, 1:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6334, "total_steps": 9627, "loss": 1.6442, "learning_rate": 2.6196210866608606e-05, "epoch": 0.6579412070219175, "percentage": 65.79, "elapsed_time": "2 days, 0:23:25", "remaining_time": "1 day, 1:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6335, "total_steps": 9627, "loss": 1.6947, "learning_rate": 2.6181863271972735e-05, "epoch": 0.6580450815414979, "percentage": 65.8, "elapsed_time": "2 days, 0:23:54", "remaining_time": "1 day, 1:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6336, "total_steps": 9627, "loss": 1.6055, "learning_rate": 2.616751821378261e-05, "epoch": 0.6581489560610783, "percentage": 65.81, "elapsed_time": "2 days, 0:24:24", "remaining_time": "1 day, 1:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6337, "total_steps": 9627, "loss": 1.5574, "learning_rate": 2.6153175693565933e-05, "epoch": 0.6582528305806585, "percentage": 65.83, "elapsed_time": "2 days, 0:24:54", "remaining_time": "1 day, 1:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6338, "total_steps": 9627, "loss": 1.6478, "learning_rate": 2.6138835712850003e-05, "epoch": 0.6583567051002389, "percentage": 65.84, "elapsed_time": "2 days, 0:25:24", "remaining_time": "1 day, 1:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6339, "total_steps": 9627, "loss": 1.6545, "learning_rate": 2.6124498273161957e-05, "epoch": 0.6584605796198193, "percentage": 65.85, "elapsed_time": "2 days, 0:25:54", "remaining_time": "1 day, 1:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6340, "total_steps": 9627, "loss": 1.5861, "learning_rate": 2.6110163376028613e-05, "epoch": 0.6585644541393996, "percentage": 65.86, "elapsed_time": "2 days, 0:26:24", "remaining_time": "1 day, 1:06:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6341, "total_steps": 9627, "loss": 1.6366, "learning_rate": 2.6095831022976514e-05, "epoch": 0.65866832865898, "percentage": 65.87, "elapsed_time": "2 days, 0:26:54", "remaining_time": "1 day, 1:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6342, "total_steps": 9627, "loss": 1.6307, "learning_rate": 2.6081501215531955e-05, "epoch": 0.6587722031785603, "percentage": 65.88, "elapsed_time": "2 days, 0:27:24", "remaining_time": "1 day, 1:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6343, "total_steps": 9627, "loss": 1.6515, "learning_rate": 2.606717395522095e-05, "epoch": 0.6588760776981406, "percentage": 65.89, "elapsed_time": "2 days, 0:27:54", "remaining_time": "1 day, 1:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6344, "total_steps": 9627, "loss": 1.6791, "learning_rate": 2.6052849243569233e-05, "epoch": 0.658979952217721, "percentage": 65.9, "elapsed_time": "2 days, 0:28:24", "remaining_time": "1 day, 1:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6345, "total_steps": 9627, "loss": 1.7317, "learning_rate": 2.603852708210226e-05, "epoch": 0.6590838267373014, "percentage": 65.91, "elapsed_time": "2 days, 0:28:53", "remaining_time": "1 day, 1:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6346, "total_steps": 9627, "loss": 1.6033, "learning_rate": 2.6024207472345273e-05, "epoch": 0.6591877012568816, "percentage": 65.92, "elapsed_time": "2 days, 0:29:23", "remaining_time": "1 day, 1:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6347, "total_steps": 9627, "loss": 1.6101, "learning_rate": 2.6009890415823147e-05, "epoch": 0.659291575776462, "percentage": 65.93, "elapsed_time": "2 days, 0:29:53", "remaining_time": "1 day, 1:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6348, "total_steps": 9627, "loss": 1.5903, "learning_rate": 2.5995575914060576e-05, "epoch": 0.6593954502960424, "percentage": 65.94, "elapsed_time": "2 days, 0:30:23", "remaining_time": "1 day, 1:03:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6349, "total_steps": 9627, "loss": 1.663, "learning_rate": 2.5981263968581925e-05, "epoch": 0.6594993248156227, "percentage": 65.95, "elapsed_time": "2 days, 0:30:54", "remaining_time": "1 day, 1:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6350, "total_steps": 9627, "loss": 1.5257, "learning_rate": 2.5966954580911314e-05, "epoch": 0.6596031993352031, "percentage": 65.96, "elapsed_time": "2 days, 0:31:24", "remaining_time": "1 day, 1:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6351, "total_steps": 9627, "loss": 1.8657, "learning_rate": 2.5952647752572566e-05, "epoch": 0.6597070738547834, "percentage": 65.97, "elapsed_time": "2 days, 0:31:53", "remaining_time": "1 day, 1:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6352, "total_steps": 9627, "loss": 1.9287, "learning_rate": 2.5938343485089267e-05, "epoch": 0.6598109483743637, "percentage": 65.98, "elapsed_time": "2 days, 0:32:24", "remaining_time": "1 day, 1:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6353, "total_steps": 9627, "loss": 1.7726, "learning_rate": 2.5924041779984692e-05, "epoch": 0.6599148228939441, "percentage": 65.99, "elapsed_time": "2 days, 0:32:54", "remaining_time": "1 day, 1:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6354, "total_steps": 9627, "loss": 1.6406, "learning_rate": 2.5909742638781852e-05, "epoch": 0.6600186974135245, "percentage": 66.0, "elapsed_time": "2 days, 0:33:24", "remaining_time": "1 day, 1:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6355, "total_steps": 9627, "loss": 1.6795, "learning_rate": 2.5895446063003526e-05, "epoch": 0.6601225719331049, "percentage": 66.01, "elapsed_time": "2 days, 0:33:55", "remaining_time": "1 day, 1:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6356, "total_steps": 9627, "loss": 1.6828, "learning_rate": 2.5881152054172193e-05, "epoch": 0.6602264464526851, "percentage": 66.02, "elapsed_time": "2 days, 0:34:25", "remaining_time": "1 day, 0:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6357, "total_steps": 9627, "loss": 1.6548, "learning_rate": 2.586686061380999e-05, "epoch": 0.6603303209722655, "percentage": 66.03, "elapsed_time": "2 days, 0:34:55", "remaining_time": "1 day, 0:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6358, "total_steps": 9627, "loss": 1.5247, "learning_rate": 2.5852571743438908e-05, "epoch": 0.6604341954918459, "percentage": 66.04, "elapsed_time": "2 days, 0:35:25", "remaining_time": "1 day, 0:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6359, "total_steps": 9627, "loss": 1.6892, "learning_rate": 2.583828544458058e-05, "epoch": 0.6605380700114262, "percentage": 66.05, "elapsed_time": "2 days, 0:35:55", "remaining_time": "1 day, 0:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6360, "total_steps": 9627, "loss": 1.6188, "learning_rate": 2.582400171875638e-05, "epoch": 0.6606419445310066, "percentage": 66.06, "elapsed_time": "2 days, 0:36:26", "remaining_time": "1 day, 0:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6361, "total_steps": 9627, "loss": 1.4864, "learning_rate": 2.5809720567487395e-05, "epoch": 0.6607458190505869, "percentage": 66.07, "elapsed_time": "2 days, 0:36:56", "remaining_time": "1 day, 0:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6362, "total_steps": 9627, "loss": 1.7432, "learning_rate": 2.5795441992294523e-05, "epoch": 0.6608496935701672, "percentage": 66.08, "elapsed_time": "2 days, 0:37:26", "remaining_time": "1 day, 0:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6363, "total_steps": 9627, "loss": 1.8233, "learning_rate": 2.578116599469825e-05, "epoch": 0.6609535680897476, "percentage": 66.1, "elapsed_time": "2 days, 0:37:56", "remaining_time": "1 day, 0:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6364, "total_steps": 9627, "loss": 1.7842, "learning_rate": 2.576689257621887e-05, "epoch": 0.661057442609328, "percentage": 66.11, "elapsed_time": "2 days, 0:38:26", "remaining_time": "1 day, 0:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6365, "total_steps": 9627, "loss": 1.4591, "learning_rate": 2.5752621738376447e-05, "epoch": 0.6611613171289082, "percentage": 66.12, "elapsed_time": "2 days, 0:38:56", "remaining_time": "1 day, 0:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6366, "total_steps": 9627, "loss": 1.527, "learning_rate": 2.5738353482690624e-05, "epoch": 0.6612651916484886, "percentage": 66.13, "elapsed_time": "2 days, 0:39:28", "remaining_time": "1 day, 0:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6367, "total_steps": 9627, "loss": 1.7582, "learning_rate": 2.5724087810680937e-05, "epoch": 0.661369066168069, "percentage": 66.14, "elapsed_time": "2 days, 0:39:57", "remaining_time": "1 day, 0:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6368, "total_steps": 9627, "loss": 1.7625, "learning_rate": 2.570982472386653e-05, "epoch": 0.6614729406876493, "percentage": 66.15, "elapsed_time": "2 days, 0:40:27", "remaining_time": "1 day, 0:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6369, "total_steps": 9627, "loss": 1.6903, "learning_rate": 2.569556422376632e-05, "epoch": 0.6615768152072297, "percentage": 66.16, "elapsed_time": "2 days, 0:40:57", "remaining_time": "1 day, 0:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6370, "total_steps": 9627, "loss": 1.6276, "learning_rate": 2.5681306311898945e-05, "epoch": 0.66168068972681, "percentage": 66.17, "elapsed_time": "2 days, 0:41:29", "remaining_time": "1 day, 0:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6371, "total_steps": 9627, "loss": 1.7003, "learning_rate": 2.566705098978275e-05, "epoch": 0.6617845642463903, "percentage": 66.18, "elapsed_time": "2 days, 0:41:59", "remaining_time": "1 day, 0:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6372, "total_steps": 9627, "loss": 1.6817, "learning_rate": 2.5652798258935825e-05, "epoch": 0.6618884387659707, "percentage": 66.19, "elapsed_time": "2 days, 0:42:30", "remaining_time": "1 day, 0:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6373, "total_steps": 9627, "loss": 1.7853, "learning_rate": 2.5638548120875945e-05, "epoch": 0.6619923132855511, "percentage": 66.2, "elapsed_time": "2 days, 0:43:00", "remaining_time": "1 day, 0:52:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6374, "total_steps": 9627, "loss": 1.7259, "learning_rate": 2.5624300577120703e-05, "epoch": 0.6620961878051314, "percentage": 66.21, "elapsed_time": "2 days, 0:43:30", "remaining_time": "1 day, 0:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6375, "total_steps": 9627, "loss": 1.6924, "learning_rate": 2.5610055629187275e-05, "epoch": 0.6622000623247117, "percentage": 66.22, "elapsed_time": "2 days, 0:44:00", "remaining_time": "1 day, 0:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6376, "total_steps": 9627, "loss": 1.8033, "learning_rate": 2.559581327859269e-05, "epoch": 0.6623039368442921, "percentage": 66.23, "elapsed_time": "2 days, 0:44:31", "remaining_time": "1 day, 0:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6377, "total_steps": 9627, "loss": 1.9298, "learning_rate": 2.558157352685363e-05, "epoch": 0.6624078113638724, "percentage": 66.24, "elapsed_time": "2 days, 0:45:01", "remaining_time": "1 day, 0:50:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6378, "total_steps": 9627, "loss": 1.6374, "learning_rate": 2.5567336375486528e-05, "epoch": 0.6625116858834528, "percentage": 66.25, "elapsed_time": "2 days, 0:45:30", "remaining_time": "1 day, 0:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6379, "total_steps": 9627, "loss": 1.6823, "learning_rate": 2.555310182600751e-05, "epoch": 0.6626155604030332, "percentage": 66.26, "elapsed_time": "2 days, 0:46:02", "remaining_time": "1 day, 0:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6380, "total_steps": 9627, "loss": 1.7883, "learning_rate": 2.5538869879932438e-05, "epoch": 0.6627194349226135, "percentage": 66.27, "elapsed_time": "2 days, 0:46:32", "remaining_time": "1 day, 0:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6381, "total_steps": 9627, "loss": 1.8058, "learning_rate": 2.5524640538776955e-05, "epoch": 0.6628233094421938, "percentage": 66.28, "elapsed_time": "2 days, 0:47:01", "remaining_time": "1 day, 0:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6382, "total_steps": 9627, "loss": 1.6395, "learning_rate": 2.551041380405631e-05, "epoch": 0.6629271839617742, "percentage": 66.29, "elapsed_time": "2 days, 0:47:32", "remaining_time": "1 day, 0:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6383, "total_steps": 9627, "loss": 1.6788, "learning_rate": 2.5496189677285574e-05, "epoch": 0.6630310584813546, "percentage": 66.3, "elapsed_time": "2 days, 0:48:02", "remaining_time": "1 day, 0:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6384, "total_steps": 9627, "loss": 1.8964, "learning_rate": 2.548196815997953e-05, "epoch": 0.6631349330009348, "percentage": 66.31, "elapsed_time": "2 days, 0:48:34", "remaining_time": "1 day, 0:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6385, "total_steps": 9627, "loss": 1.7551, "learning_rate": 2.546774925365259e-05, "epoch": 0.6632388075205152, "percentage": 66.32, "elapsed_time": "2 days, 0:49:04", "remaining_time": "1 day, 0:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6386, "total_steps": 9627, "loss": 1.6075, "learning_rate": 2.5453532959819017e-05, "epoch": 0.6633426820400956, "percentage": 66.33, "elapsed_time": "2 days, 0:49:35", "remaining_time": "1 day, 0:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6387, "total_steps": 9627, "loss": 1.8376, "learning_rate": 2.5439319279992708e-05, "epoch": 0.6634465565596759, "percentage": 66.34, "elapsed_time": "2 days, 0:50:05", "remaining_time": "1 day, 0:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6388, "total_steps": 9627, "loss": 1.6351, "learning_rate": 2.5425108215687314e-05, "epoch": 0.6635504310792563, "percentage": 66.36, "elapsed_time": "2 days, 0:50:35", "remaining_time": "1 day, 0:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6389, "total_steps": 9627, "loss": 1.7869, "learning_rate": 2.5410899768416186e-05, "epoch": 0.6636543055988366, "percentage": 66.37, "elapsed_time": "2 days, 0:51:05", "remaining_time": "1 day, 0:45:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6390, "total_steps": 9627, "loss": 1.5495, "learning_rate": 2.5396693939692474e-05, "epoch": 0.6637581801184169, "percentage": 66.38, "elapsed_time": "2 days, 0:51:36", "remaining_time": "1 day, 0:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6391, "total_steps": 9627, "loss": 1.641, "learning_rate": 2.5382490731028918e-05, "epoch": 0.6638620546379973, "percentage": 66.39, "elapsed_time": "2 days, 0:52:07", "remaining_time": "1 day, 0:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6392, "total_steps": 9627, "loss": 1.7506, "learning_rate": 2.5368290143938062e-05, "epoch": 0.6639659291575777, "percentage": 66.4, "elapsed_time": "2 days, 0:52:37", "remaining_time": "1 day, 0:44:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6393, "total_steps": 9627, "loss": 1.7111, "learning_rate": 2.5354092179932204e-05, "epoch": 0.664069803677158, "percentage": 66.41, "elapsed_time": "2 days, 0:53:09", "remaining_time": "1 day, 0:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6394, "total_steps": 9627, "loss": 1.6557, "learning_rate": 2.533989684052325e-05, "epoch": 0.6641736781967383, "percentage": 66.42, "elapsed_time": "2 days, 0:53:39", "remaining_time": "1 day, 0:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6395, "total_steps": 9627, "loss": 1.5773, "learning_rate": 2.5325704127222937e-05, "epoch": 0.6642775527163187, "percentage": 66.43, "elapsed_time": "2 days, 0:54:09", "remaining_time": "1 day, 0:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6396, "total_steps": 9627, "loss": 1.8766, "learning_rate": 2.5311514041542678e-05, "epoch": 0.664381427235899, "percentage": 66.44, "elapsed_time": "2 days, 0:54:39", "remaining_time": "1 day, 0:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6397, "total_steps": 9627, "loss": 1.582, "learning_rate": 2.529732658499359e-05, "epoch": 0.6644853017554794, "percentage": 66.45, "elapsed_time": "2 days, 0:55:11", "remaining_time": "1 day, 0:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6398, "total_steps": 9627, "loss": 1.6379, "learning_rate": 2.5283141759086537e-05, "epoch": 0.6645891762750598, "percentage": 66.46, "elapsed_time": "2 days, 0:55:41", "remaining_time": "1 day, 0:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6399, "total_steps": 9627, "loss": 1.4214, "learning_rate": 2.5268959565332086e-05, "epoch": 0.66469305079464, "percentage": 66.47, "elapsed_time": "2 days, 0:56:11", "remaining_time": "1 day, 0:41:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6400, "total_steps": 9627, "loss": 1.6518, "learning_rate": 2.525478000524053e-05, "epoch": 0.6647969253142204, "percentage": 66.48, "elapsed_time": "2 days, 0:56:41", "remaining_time": "1 day, 0:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6401, "total_steps": 9627, "loss": 1.578, "learning_rate": 2.5240603080321863e-05, "epoch": 0.6649007998338008, "percentage": 66.49, "elapsed_time": "2 days, 0:57:12", "remaining_time": "1 day, 0:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6402, "total_steps": 9627, "loss": 2.0138, "learning_rate": 2.5226428792085875e-05, "epoch": 0.6650046743533811, "percentage": 66.5, "elapsed_time": "2 days, 0:57:42", "remaining_time": "1 day, 0:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6403, "total_steps": 9627, "loss": 1.5924, "learning_rate": 2.5212257142041938e-05, "epoch": 0.6651085488729614, "percentage": 66.51, "elapsed_time": "2 days, 0:58:12", "remaining_time": "1 day, 0:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6404, "total_steps": 9627, "loss": 1.7202, "learning_rate": 2.5198088131699294e-05, "epoch": 0.6652124233925418, "percentage": 66.52, "elapsed_time": "2 days, 0:58:43", "remaining_time": "1 day, 0:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6405, "total_steps": 9627, "loss": 1.8716, "learning_rate": 2.5183921762566797e-05, "epoch": 0.6653162979121221, "percentage": 66.53, "elapsed_time": "2 days, 0:59:14", "remaining_time": "1 day, 0:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6406, "total_steps": 9627, "loss": 1.6601, "learning_rate": 2.5169758036153056e-05, "epoch": 0.6654201724317025, "percentage": 66.54, "elapsed_time": "2 days, 0:59:44", "remaining_time": "1 day, 0:38:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6407, "total_steps": 9627, "loss": 1.7759, "learning_rate": 2.5155596953966397e-05, "epoch": 0.6655240469512829, "percentage": 66.55, "elapsed_time": "2 days, 1:00:13", "remaining_time": "1 day, 0:37:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6408, "total_steps": 9627, "loss": 1.4598, "learning_rate": 2.514143851751486e-05, "epoch": 0.6656279214708632, "percentage": 66.56, "elapsed_time": "2 days, 1:00:44", "remaining_time": "1 day, 0:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6409, "total_steps": 9627, "loss": 1.5706, "learning_rate": 2.512728272830625e-05, "epoch": 0.6657317959904435, "percentage": 66.57, "elapsed_time": "2 days, 1:01:14", "remaining_time": "1 day, 0:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6410, "total_steps": 9627, "loss": 1.7148, "learning_rate": 2.511312958784797e-05, "epoch": 0.6658356705100239, "percentage": 66.58, "elapsed_time": "2 days, 1:01:44", "remaining_time": "1 day, 0:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6411, "total_steps": 9627, "loss": 1.561, "learning_rate": 2.5098979097647297e-05, "epoch": 0.6659395450296043, "percentage": 66.59, "elapsed_time": "2 days, 1:02:14", "remaining_time": "1 day, 0:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6412, "total_steps": 9627, "loss": 1.602, "learning_rate": 2.508483125921113e-05, "epoch": 0.6660434195491846, "percentage": 66.6, "elapsed_time": "2 days, 1:02:43", "remaining_time": "1 day, 0:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6413, "total_steps": 9627, "loss": 1.9113, "learning_rate": 2.507068607404604e-05, "epoch": 0.6661472940687649, "percentage": 66.61, "elapsed_time": "2 days, 1:03:13", "remaining_time": "1 day, 0:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6414, "total_steps": 9627, "loss": 1.5093, "learning_rate": 2.5056543543658452e-05, "epoch": 0.6662511685883453, "percentage": 66.63, "elapsed_time": "2 days, 1:03:43", "remaining_time": "1 day, 0:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6415, "total_steps": 9627, "loss": 1.5901, "learning_rate": 2.5042403669554416e-05, "epoch": 0.6663550431079256, "percentage": 66.64, "elapsed_time": "2 days, 1:04:12", "remaining_time": "1 day, 0:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6416, "total_steps": 9627, "loss": 1.6606, "learning_rate": 2.5028266453239703e-05, "epoch": 0.666458917627506, "percentage": 66.65, "elapsed_time": "2 days, 1:04:42", "remaining_time": "1 day, 0:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6417, "total_steps": 9627, "loss": 1.6371, "learning_rate": 2.501413189621983e-05, "epoch": 0.6665627921470864, "percentage": 66.66, "elapsed_time": "2 days, 1:05:12", "remaining_time": "1 day, 0:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6418, "total_steps": 9627, "loss": 1.7512, "learning_rate": 2.500000000000001e-05, "epoch": 0.6666666666666666, "percentage": 66.67, "elapsed_time": "2 days, 1:05:42", "remaining_time": "1 day, 0:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6419, "total_steps": 9627, "loss": 1.6877, "learning_rate": 2.4985870766085185e-05, "epoch": 0.666770541186247, "percentage": 66.68, "elapsed_time": "2 days, 1:06:12", "remaining_time": "1 day, 0:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6420, "total_steps": 9627, "loss": 1.6417, "learning_rate": 2.4971744195979985e-05, "epoch": 0.6668744157058274, "percentage": 66.69, "elapsed_time": "2 days, 1:06:42", "remaining_time": "1 day, 0:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6421, "total_steps": 9627, "loss": 1.7746, "learning_rate": 2.4957620291188844e-05, "epoch": 0.6669782902254077, "percentage": 66.7, "elapsed_time": "2 days, 1:07:12", "remaining_time": "1 day, 0:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6422, "total_steps": 9627, "loss": 1.5985, "learning_rate": 2.4943499053215756e-05, "epoch": 0.667082164744988, "percentage": 66.71, "elapsed_time": "2 days, 1:07:41", "remaining_time": "1 day, 0:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6423, "total_steps": 9627, "loss": 1.7645, "learning_rate": 2.4929380483564602e-05, "epoch": 0.6671860392645684, "percentage": 66.72, "elapsed_time": "2 days, 1:08:12", "remaining_time": "1 day, 0:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6424, "total_steps": 9627, "loss": 1.5833, "learning_rate": 2.4915264583738858e-05, "epoch": 0.6672899137841487, "percentage": 66.73, "elapsed_time": "2 days, 1:08:42", "remaining_time": "1 day, 0:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6425, "total_steps": 9627, "loss": 1.6876, "learning_rate": 2.490115135524177e-05, "epoch": 0.6673937883037291, "percentage": 66.74, "elapsed_time": "2 days, 1:09:11", "remaining_time": "1 day, 0:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6426, "total_steps": 9627, "loss": 1.7356, "learning_rate": 2.488704079957629e-05, "epoch": 0.6674976628233095, "percentage": 66.75, "elapsed_time": "2 days, 1:09:42", "remaining_time": "1 day, 0:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6427, "total_steps": 9627, "loss": 1.6506, "learning_rate": 2.487293291824507e-05, "epoch": 0.6676015373428897, "percentage": 66.76, "elapsed_time": "2 days, 1:10:11", "remaining_time": "1 day, 0:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6428, "total_steps": 9627, "loss": 1.8314, "learning_rate": 2.4858827712750494e-05, "epoch": 0.6677054118624701, "percentage": 66.77, "elapsed_time": "2 days, 1:10:42", "remaining_time": "1 day, 0:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6429, "total_steps": 9627, "loss": 1.6845, "learning_rate": 2.484472518459464e-05, "epoch": 0.6678092863820505, "percentage": 66.78, "elapsed_time": "2 days, 1:11:11", "remaining_time": "1 day, 0:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6430, "total_steps": 9627, "loss": 1.4303, "learning_rate": 2.483062533527938e-05, "epoch": 0.6679131609016308, "percentage": 66.79, "elapsed_time": "2 days, 1:11:40", "remaining_time": "1 day, 0:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6431, "total_steps": 9627, "loss": 1.7178, "learning_rate": 2.4816528166306146e-05, "epoch": 0.6680170354212112, "percentage": 66.8, "elapsed_time": "2 days, 1:12:11", "remaining_time": "1 day, 0:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6432, "total_steps": 9627, "loss": 1.69, "learning_rate": 2.4802433679176247e-05, "epoch": 0.6681209099407915, "percentage": 66.81, "elapsed_time": "2 days, 1:12:41", "remaining_time": "1 day, 0:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6433, "total_steps": 9627, "loss": 1.6254, "learning_rate": 2.4788341875390614e-05, "epoch": 0.6682247844603719, "percentage": 66.82, "elapsed_time": "2 days, 1:13:10", "remaining_time": "1 day, 0:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6434, "total_steps": 9627, "loss": 1.6673, "learning_rate": 2.4774252756449912e-05, "epoch": 0.6683286589799522, "percentage": 66.83, "elapsed_time": "2 days, 1:13:40", "remaining_time": "1 day, 0:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6435, "total_steps": 9627, "loss": 1.8226, "learning_rate": 2.4760166323854524e-05, "epoch": 0.6684325334995326, "percentage": 66.84, "elapsed_time": "2 days, 1:14:10", "remaining_time": "1 day, 0:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6436, "total_steps": 9627, "loss": 1.6372, "learning_rate": 2.4746082579104518e-05, "epoch": 0.668536408019113, "percentage": 66.85, "elapsed_time": "2 days, 1:14:40", "remaining_time": "1 day, 0:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6437, "total_steps": 9627, "loss": 1.5601, "learning_rate": 2.4732001523699772e-05, "epoch": 0.6686402825386932, "percentage": 66.86, "elapsed_time": "2 days, 1:15:10", "remaining_time": "1 day, 0:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6438, "total_steps": 9627, "loss": 1.5854, "learning_rate": 2.471792315913973e-05, "epoch": 0.6687441570582736, "percentage": 66.87, "elapsed_time": "2 days, 1:15:39", "remaining_time": "1 day, 0:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6439, "total_steps": 9627, "loss": 1.5502, "learning_rate": 2.470384748692368e-05, "epoch": 0.668848031577854, "percentage": 66.88, "elapsed_time": "2 days, 1:16:09", "remaining_time": "1 day, 0:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6440, "total_steps": 9627, "loss": 1.836, "learning_rate": 2.468977450855058e-05, "epoch": 0.6689519060974343, "percentage": 66.9, "elapsed_time": "2 days, 1:16:39", "remaining_time": "1 day, 0:23:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6441, "total_steps": 9627, "loss": 1.6872, "learning_rate": 2.4675704225519018e-05, "epoch": 0.6690557806170147, "percentage": 66.91, "elapsed_time": "2 days, 1:17:09", "remaining_time": "1 day, 0:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6442, "total_steps": 9627, "loss": 1.5706, "learning_rate": 2.4661636639327444e-05, "epoch": 0.669159655136595, "percentage": 66.92, "elapsed_time": "2 days, 1:17:38", "remaining_time": "1 day, 0:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6443, "total_steps": 9627, "loss": 1.7595, "learning_rate": 2.4647571751473924e-05, "epoch": 0.6692635296561753, "percentage": 66.93, "elapsed_time": "2 days, 1:18:09", "remaining_time": "1 day, 0:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6444, "total_steps": 9627, "loss": 1.5921, "learning_rate": 2.4633509563456252e-05, "epoch": 0.6693674041757557, "percentage": 66.94, "elapsed_time": "2 days, 1:18:39", "remaining_time": "1 day, 0:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6445, "total_steps": 9627, "loss": 1.9157, "learning_rate": 2.461945007677195e-05, "epoch": 0.6694712786953361, "percentage": 66.95, "elapsed_time": "2 days, 1:19:09", "remaining_time": "1 day, 0:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6446, "total_steps": 9627, "loss": 1.7016, "learning_rate": 2.4605393292918234e-05, "epoch": 0.6695751532149163, "percentage": 66.96, "elapsed_time": "2 days, 1:19:39", "remaining_time": "1 day, 0:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6447, "total_steps": 9627, "loss": 1.5405, "learning_rate": 2.459133921339205e-05, "epoch": 0.6696790277344967, "percentage": 66.97, "elapsed_time": "2 days, 1:20:09", "remaining_time": "1 day, 0:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6448, "total_steps": 9627, "loss": 1.7017, "learning_rate": 2.4577287839690022e-05, "epoch": 0.6697829022540771, "percentage": 66.98, "elapsed_time": "2 days, 1:20:39", "remaining_time": "1 day, 0:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6449, "total_steps": 9627, "loss": 1.8029, "learning_rate": 2.456323917330857e-05, "epoch": 0.6698867767736574, "percentage": 66.99, "elapsed_time": "2 days, 1:21:08", "remaining_time": "1 day, 0:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6450, "total_steps": 9627, "loss": 1.6008, "learning_rate": 2.4549193215743706e-05, "epoch": 0.6699906512932378, "percentage": 67.0, "elapsed_time": "2 days, 1:21:39", "remaining_time": "1 day, 0:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6451, "total_steps": 9627, "loss": 1.667, "learning_rate": 2.453514996849125e-05, "epoch": 0.6700945258128181, "percentage": 67.01, "elapsed_time": "2 days, 1:22:09", "remaining_time": "1 day, 0:18:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6452, "total_steps": 9627, "loss": 1.5254, "learning_rate": 2.452110943304669e-05, "epoch": 0.6701984003323984, "percentage": 67.02, "elapsed_time": "2 days, 1:22:39", "remaining_time": "1 day, 0:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6453, "total_steps": 9627, "loss": 1.5862, "learning_rate": 2.450707161090523e-05, "epoch": 0.6703022748519788, "percentage": 67.03, "elapsed_time": "2 days, 1:23:09", "remaining_time": "1 day, 0:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6454, "total_steps": 9627, "loss": 1.7249, "learning_rate": 2.4493036503561795e-05, "epoch": 0.6704061493715592, "percentage": 67.04, "elapsed_time": "2 days, 1:23:38", "remaining_time": "1 day, 0:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6455, "total_steps": 9627, "loss": 1.5667, "learning_rate": 2.4479004112511012e-05, "epoch": 0.6705100238911395, "percentage": 67.05, "elapsed_time": "2 days, 1:24:08", "remaining_time": "1 day, 0:16:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6456, "total_steps": 9627, "loss": 1.7565, "learning_rate": 2.4464974439247213e-05, "epoch": 0.6706138984107198, "percentage": 67.06, "elapsed_time": "2 days, 1:24:37", "remaining_time": "1 day, 0:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6457, "total_steps": 9627, "loss": 1.6019, "learning_rate": 2.4450947485264442e-05, "epoch": 0.6707177729303002, "percentage": 67.07, "elapsed_time": "2 days, 1:25:07", "remaining_time": "1 day, 0:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6458, "total_steps": 9627, "loss": 1.6025, "learning_rate": 2.4436923252056486e-05, "epoch": 0.6708216474498806, "percentage": 67.08, "elapsed_time": "2 days, 1:25:37", "remaining_time": "1 day, 0:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6459, "total_steps": 9627, "loss": 1.8032, "learning_rate": 2.442290174111681e-05, "epoch": 0.6709255219694609, "percentage": 67.09, "elapsed_time": "2 days, 1:26:07", "remaining_time": "1 day, 0:14:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6460, "total_steps": 9627, "loss": 1.844, "learning_rate": 2.440888295393859e-05, "epoch": 0.6710293964890413, "percentage": 67.1, "elapsed_time": "2 days, 1:26:37", "remaining_time": "1 day, 0:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6461, "total_steps": 9627, "loss": 1.5926, "learning_rate": 2.4394866892014716e-05, "epoch": 0.6711332710086216, "percentage": 67.11, "elapsed_time": "2 days, 1:27:07", "remaining_time": "1 day, 0:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6462, "total_steps": 9627, "loss": 1.5847, "learning_rate": 2.438085355683779e-05, "epoch": 0.6712371455282019, "percentage": 67.12, "elapsed_time": "2 days, 1:27:36", "remaining_time": "1 day, 0:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6463, "total_steps": 9627, "loss": 1.5292, "learning_rate": 2.436684294990012e-05, "epoch": 0.6713410200477823, "percentage": 67.13, "elapsed_time": "2 days, 1:28:06", "remaining_time": "1 day, 0:13:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6464, "total_steps": 9627, "loss": 1.6891, "learning_rate": 2.4352835072693713e-05, "epoch": 0.6714448945673627, "percentage": 67.14, "elapsed_time": "2 days, 1:28:36", "remaining_time": "1 day, 0:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6465, "total_steps": 9627, "loss": 1.8254, "learning_rate": 2.4338829926710356e-05, "epoch": 0.6715487690869429, "percentage": 67.15, "elapsed_time": "2 days, 1:29:06", "remaining_time": "1 day, 0:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6466, "total_steps": 9627, "loss": 1.5315, "learning_rate": 2.4324827513441406e-05, "epoch": 0.6716526436065233, "percentage": 67.17, "elapsed_time": "2 days, 1:29:36", "remaining_time": "1 day, 0:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6467, "total_steps": 9627, "loss": 1.6046, "learning_rate": 2.431082783437807e-05, "epoch": 0.6717565181261037, "percentage": 67.18, "elapsed_time": "2 days, 1:30:05", "remaining_time": "1 day, 0:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6468, "total_steps": 9627, "loss": 1.7201, "learning_rate": 2.4296830891011206e-05, "epoch": 0.671860392645684, "percentage": 67.19, "elapsed_time": "2 days, 1:30:34", "remaining_time": "1 day, 0:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6469, "total_steps": 9627, "loss": 1.5979, "learning_rate": 2.4282836684831324e-05, "epoch": 0.6719642671652644, "percentage": 67.2, "elapsed_time": "2 days, 1:31:05", "remaining_time": "1 day, 0:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6470, "total_steps": 9627, "loss": 1.6024, "learning_rate": 2.426884521732875e-05, "epoch": 0.6720681416848447, "percentage": 67.21, "elapsed_time": "2 days, 1:31:34", "remaining_time": "1 day, 0:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6471, "total_steps": 9627, "loss": 1.4421, "learning_rate": 2.425485648999345e-05, "epoch": 0.672172016204425, "percentage": 67.22, "elapsed_time": "2 days, 1:32:04", "remaining_time": "1 day, 0:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6472, "total_steps": 9627, "loss": 1.7063, "learning_rate": 2.4240870504315117e-05, "epoch": 0.6722758907240054, "percentage": 67.23, "elapsed_time": "2 days, 1:32:33", "remaining_time": "1 day, 0:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6473, "total_steps": 9627, "loss": 1.6469, "learning_rate": 2.4226887261783143e-05, "epoch": 0.6723797652435858, "percentage": 67.24, "elapsed_time": "2 days, 1:33:04", "remaining_time": "1 day, 0:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6474, "total_steps": 9627, "loss": 1.6914, "learning_rate": 2.4212906763886638e-05, "epoch": 0.672483639763166, "percentage": 67.25, "elapsed_time": "2 days, 1:33:33", "remaining_time": "1 day, 0:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6475, "total_steps": 9627, "loss": 1.5814, "learning_rate": 2.4198929012114413e-05, "epoch": 0.6725875142827464, "percentage": 67.26, "elapsed_time": "2 days, 1:34:02", "remaining_time": "1 day, 0:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6476, "total_steps": 9627, "loss": 1.6704, "learning_rate": 2.4184954007954978e-05, "epoch": 0.6726913888023268, "percentage": 67.27, "elapsed_time": "2 days, 1:34:33", "remaining_time": "1 day, 0:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6477, "total_steps": 9627, "loss": 1.7766, "learning_rate": 2.417098175289661e-05, "epoch": 0.6727952633219071, "percentage": 67.28, "elapsed_time": "2 days, 1:35:03", "remaining_time": "1 day, 0:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6478, "total_steps": 9627, "loss": 1.5764, "learning_rate": 2.4157012248427173e-05, "epoch": 0.6728991378414875, "percentage": 67.29, "elapsed_time": "2 days, 1:35:32", "remaining_time": "1 day, 0:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6479, "total_steps": 9627, "loss": 1.7778, "learning_rate": 2.414304549603437e-05, "epoch": 0.6730030123610679, "percentage": 67.3, "elapsed_time": "2 days, 1:36:03", "remaining_time": "1 day, 0:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6480, "total_steps": 9627, "loss": 1.7988, "learning_rate": 2.4129081497205535e-05, "epoch": 0.6731068868806481, "percentage": 67.31, "elapsed_time": "2 days, 1:36:33", "remaining_time": "1 day, 0:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6481, "total_steps": 9627, "loss": 1.636, "learning_rate": 2.4115120253427715e-05, "epoch": 0.6732107614002285, "percentage": 67.32, "elapsed_time": "2 days, 1:37:02", "remaining_time": "1 day, 0:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6482, "total_steps": 9627, "loss": 1.6532, "learning_rate": 2.4101161766187673e-05, "epoch": 0.6733146359198089, "percentage": 67.33, "elapsed_time": "2 days, 1:37:33", "remaining_time": "1 day, 0:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6483, "total_steps": 9627, "loss": 1.5258, "learning_rate": 2.4087206036971872e-05, "epoch": 0.6734185104393893, "percentage": 67.34, "elapsed_time": "2 days, 1:38:03", "remaining_time": "1 day, 0:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6484, "total_steps": 9627, "loss": 1.6615, "learning_rate": 2.4073253067266532e-05, "epoch": 0.6735223849589695, "percentage": 67.35, "elapsed_time": "2 days, 1:38:32", "remaining_time": "1 day, 0:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6485, "total_steps": 9627, "loss": 1.7412, "learning_rate": 2.4059302858557475e-05, "epoch": 0.6736262594785499, "percentage": 67.36, "elapsed_time": "2 days, 1:39:01", "remaining_time": "1 day, 0:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6486, "total_steps": 9627, "loss": 1.6766, "learning_rate": 2.4045355412330328e-05, "epoch": 0.6737301339981303, "percentage": 67.37, "elapsed_time": "2 days, 1:39:32", "remaining_time": "1 day, 0:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6487, "total_steps": 9627, "loss": 1.6006, "learning_rate": 2.403141073007038e-05, "epoch": 0.6738340085177106, "percentage": 67.38, "elapsed_time": "2 days, 1:40:01", "remaining_time": "1 day, 0:02:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6488, "total_steps": 9627, "loss": 1.6916, "learning_rate": 2.401746881326263e-05, "epoch": 0.673937883037291, "percentage": 67.39, "elapsed_time": "2 days, 1:40:32", "remaining_time": "1 day, 0:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6489, "total_steps": 9627, "loss": 1.7378, "learning_rate": 2.400352966339177e-05, "epoch": 0.6740417575568713, "percentage": 67.4, "elapsed_time": "2 days, 1:41:01", "remaining_time": "1 day, 0:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6490, "total_steps": 9627, "loss": 1.6959, "learning_rate": 2.398959328194223e-05, "epoch": 0.6741456320764516, "percentage": 67.41, "elapsed_time": "2 days, 1:41:32", "remaining_time": "1 day, 0:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6491, "total_steps": 9627, "loss": 1.7088, "learning_rate": 2.3975659670398117e-05, "epoch": 0.674249506596032, "percentage": 67.42, "elapsed_time": "2 days, 1:42:02", "remaining_time": "1 day, 0:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6492, "total_steps": 9627, "loss": 1.4458, "learning_rate": 2.3961728830243224e-05, "epoch": 0.6743533811156124, "percentage": 67.44, "elapsed_time": "2 days, 1:42:31", "remaining_time": "1 day, 0:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6493, "total_steps": 9627, "loss": 1.68, "learning_rate": 2.3947800762961147e-05, "epoch": 0.6744572556351927, "percentage": 67.45, "elapsed_time": "2 days, 1:43:02", "remaining_time": "23:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6494, "total_steps": 9627, "loss": 1.4526, "learning_rate": 2.3933875470035038e-05, "epoch": 0.674561130154773, "percentage": 67.46, "elapsed_time": "2 days, 1:43:31", "remaining_time": "23:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6495, "total_steps": 9627, "loss": 1.6881, "learning_rate": 2.391995295294788e-05, "epoch": 0.6746650046743534, "percentage": 67.47, "elapsed_time": "2 days, 1:44:02", "remaining_time": "23:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6496, "total_steps": 9627, "loss": 1.8923, "learning_rate": 2.3906033213182328e-05, "epoch": 0.6747688791939337, "percentage": 67.48, "elapsed_time": "2 days, 1:44:33", "remaining_time": "23:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6497, "total_steps": 9627, "loss": 1.6732, "learning_rate": 2.3892116252220653e-05, "epoch": 0.6748727537135141, "percentage": 67.49, "elapsed_time": "2 days, 1:45:02", "remaining_time": "23:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6498, "total_steps": 9627, "loss": 1.5638, "learning_rate": 2.3878202071544977e-05, "epoch": 0.6749766282330945, "percentage": 67.5, "elapsed_time": "2 days, 1:45:32", "remaining_time": "23:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6499, "total_steps": 9627, "loss": 1.7186, "learning_rate": 2.3864290672637012e-05, "epoch": 0.6750805027526747, "percentage": 67.51, "elapsed_time": "2 days, 1:46:01", "remaining_time": "23:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6500, "total_steps": 9627, "loss": 1.621, "learning_rate": 2.3850382056978228e-05, "epoch": 0.6751843772722551, "percentage": 67.52, "elapsed_time": "2 days, 1:46:31", "remaining_time": "23:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6501, "total_steps": 9627, "loss": 1.5422, "learning_rate": 2.3836476226049775e-05, "epoch": 0.6752882517918355, "percentage": 67.53, "elapsed_time": "2 days, 1:47:02", "remaining_time": "23:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6502, "total_steps": 9627, "loss": 1.7677, "learning_rate": 2.3822573181332526e-05, "epoch": 0.6753921263114158, "percentage": 67.54, "elapsed_time": "2 days, 1:47:31", "remaining_time": "23:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6503, "total_steps": 9627, "loss": 1.7901, "learning_rate": 2.380867292430704e-05, "epoch": 0.6754960008309961, "percentage": 67.55, "elapsed_time": "2 days, 1:48:00", "remaining_time": "23:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6504, "total_steps": 9627, "loss": 1.708, "learning_rate": 2.3794775456453573e-05, "epoch": 0.6755998753505765, "percentage": 67.56, "elapsed_time": "2 days, 1:48:31", "remaining_time": "23:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6505, "total_steps": 9627, "loss": 1.5471, "learning_rate": 2.378088077925214e-05, "epoch": 0.6757037498701568, "percentage": 67.57, "elapsed_time": "2 days, 1:49:00", "remaining_time": "23:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6506, "total_steps": 9627, "loss": 1.8363, "learning_rate": 2.3766988894182357e-05, "epoch": 0.6758076243897372, "percentage": 67.58, "elapsed_time": "2 days, 1:49:31", "remaining_time": "23:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6507, "total_steps": 9627, "loss": 2.0124, "learning_rate": 2.3753099802723643e-05, "epoch": 0.6759114989093176, "percentage": 67.59, "elapsed_time": "2 days, 1:50:01", "remaining_time": "23:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6508, "total_steps": 9627, "loss": 1.698, "learning_rate": 2.3739213506355073e-05, "epoch": 0.6760153734288978, "percentage": 67.6, "elapsed_time": "2 days, 1:50:31", "remaining_time": "23:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6509, "total_steps": 9627, "loss": 1.8448, "learning_rate": 2.372533000655542e-05, "epoch": 0.6761192479484782, "percentage": 67.61, "elapsed_time": "2 days, 1:51:00", "remaining_time": "23:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6510, "total_steps": 9627, "loss": 1.6932, "learning_rate": 2.3711449304803175e-05, "epoch": 0.6762231224680586, "percentage": 67.62, "elapsed_time": "2 days, 1:51:31", "remaining_time": "23:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6511, "total_steps": 9627, "loss": 1.6501, "learning_rate": 2.3697571402576497e-05, "epoch": 0.676326996987639, "percentage": 67.63, "elapsed_time": "2 days, 1:52:01", "remaining_time": "23:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6512, "total_steps": 9627, "loss": 1.4518, "learning_rate": 2.3683696301353337e-05, "epoch": 0.6764308715072193, "percentage": 67.64, "elapsed_time": "2 days, 1:52:30", "remaining_time": "23:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6513, "total_steps": 9627, "loss": 1.6496, "learning_rate": 2.3669824002611207e-05, "epoch": 0.6765347460267996, "percentage": 67.65, "elapsed_time": "2 days, 1:52:59", "remaining_time": "23:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6514, "total_steps": 9627, "loss": 1.6076, "learning_rate": 2.3655954507827456e-05, "epoch": 0.67663862054638, "percentage": 67.66, "elapsed_time": "2 days, 1:53:29", "remaining_time": "23:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6515, "total_steps": 9627, "loss": 1.7109, "learning_rate": 2.364208781847906e-05, "epoch": 0.6767424950659603, "percentage": 67.67, "elapsed_time": "2 days, 1:53:59", "remaining_time": "23:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6516, "total_steps": 9627, "loss": 1.6478, "learning_rate": 2.3628223936042708e-05, "epoch": 0.6768463695855407, "percentage": 67.68, "elapsed_time": "2 days, 1:54:29", "remaining_time": "23:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6517, "total_steps": 9627, "loss": 1.5394, "learning_rate": 2.3614362861994803e-05, "epoch": 0.6769502441051211, "percentage": 67.7, "elapsed_time": "2 days, 1:54:58", "remaining_time": "23:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6518, "total_steps": 9627, "loss": 1.8076, "learning_rate": 2.3600504597811436e-05, "epoch": 0.6770541186247013, "percentage": 67.71, "elapsed_time": "2 days, 1:55:28", "remaining_time": "23:48:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6519, "total_steps": 9627, "loss": 1.718, "learning_rate": 2.3586649144968404e-05, "epoch": 0.6771579931442817, "percentage": 67.72, "elapsed_time": "2 days, 1:55:58", "remaining_time": "23:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6520, "total_steps": 9627, "loss": 1.4616, "learning_rate": 2.357279650494119e-05, "epoch": 0.6772618676638621, "percentage": 67.73, "elapsed_time": "2 days, 1:56:28", "remaining_time": "23:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6521, "total_steps": 9627, "loss": 1.6517, "learning_rate": 2.3558946679205046e-05, "epoch": 0.6773657421834424, "percentage": 67.74, "elapsed_time": "2 days, 1:56:57", "remaining_time": "23:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6522, "total_steps": 9627, "loss": 1.5593, "learning_rate": 2.3545099669234792e-05, "epoch": 0.6774696167030227, "percentage": 67.75, "elapsed_time": "2 days, 1:57:27", "remaining_time": "23:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6523, "total_steps": 9627, "loss": 1.7158, "learning_rate": 2.3531255476505086e-05, "epoch": 0.6775734912226031, "percentage": 67.76, "elapsed_time": "2 days, 1:57:58", "remaining_time": "23:46:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6524, "total_steps": 9627, "loss": 1.8144, "learning_rate": 2.3517414102490232e-05, "epoch": 0.6776773657421834, "percentage": 67.77, "elapsed_time": "2 days, 1:58:28", "remaining_time": "23:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6525, "total_steps": 9627, "loss": 1.8248, "learning_rate": 2.350357554866416e-05, "epoch": 0.6777812402617638, "percentage": 67.78, "elapsed_time": "2 days, 1:58:58", "remaining_time": "23:45:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6526, "total_steps": 9627, "loss": 1.7912, "learning_rate": 2.3489739816500635e-05, "epoch": 0.6778851147813442, "percentage": 67.79, "elapsed_time": "2 days, 1:59:27", "remaining_time": "23:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6527, "total_steps": 9627, "loss": 1.7446, "learning_rate": 2.3475906907473027e-05, "epoch": 0.6779889893009244, "percentage": 67.8, "elapsed_time": "2 days, 1:59:57", "remaining_time": "23:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6528, "total_steps": 9627, "loss": 1.6939, "learning_rate": 2.3462076823054442e-05, "epoch": 0.6780928638205048, "percentage": 67.81, "elapsed_time": "2 days, 2:00:27", "remaining_time": "23:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6529, "total_steps": 9627, "loss": 1.7973, "learning_rate": 2.3448249564717666e-05, "epoch": 0.6781967383400852, "percentage": 67.82, "elapsed_time": "2 days, 2:00:57", "remaining_time": "23:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6530, "total_steps": 9627, "loss": 1.6438, "learning_rate": 2.3434425133935207e-05, "epoch": 0.6783006128596655, "percentage": 67.83, "elapsed_time": "2 days, 2:01:27", "remaining_time": "23:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6531, "total_steps": 9627, "loss": 1.7301, "learning_rate": 2.3420603532179246e-05, "epoch": 0.6784044873792459, "percentage": 67.84, "elapsed_time": "2 days, 2:01:57", "remaining_time": "23:43:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6532, "total_steps": 9627, "loss": 1.7364, "learning_rate": 2.3406784760921667e-05, "epoch": 0.6785083618988262, "percentage": 67.85, "elapsed_time": "2 days, 2:02:27", "remaining_time": "23:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6533, "total_steps": 9627, "loss": 1.608, "learning_rate": 2.339296882163411e-05, "epoch": 0.6786122364184065, "percentage": 67.86, "elapsed_time": "2 days, 2:02:56", "remaining_time": "23:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6534, "total_steps": 9627, "loss": 1.8397, "learning_rate": 2.3379155715787792e-05, "epoch": 0.6787161109379869, "percentage": 67.87, "elapsed_time": "2 days, 2:03:26", "remaining_time": "23:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6535, "total_steps": 9627, "loss": 1.9061, "learning_rate": 2.3365345444853763e-05, "epoch": 0.6788199854575673, "percentage": 67.88, "elapsed_time": "2 days, 2:03:57", "remaining_time": "23:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6536, "total_steps": 9627, "loss": 1.6904, "learning_rate": 2.3351538010302688e-05, "epoch": 0.6789238599771477, "percentage": 67.89, "elapsed_time": "2 days, 2:04:26", "remaining_time": "23:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6537, "total_steps": 9627, "loss": 1.6176, "learning_rate": 2.333773341360494e-05, "epoch": 0.6790277344967279, "percentage": 67.9, "elapsed_time": "2 days, 2:04:56", "remaining_time": "23:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6538, "total_steps": 9627, "loss": 1.7018, "learning_rate": 2.3323931656230614e-05, "epoch": 0.6791316090163083, "percentage": 67.91, "elapsed_time": "2 days, 2:05:27", "remaining_time": "23:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6539, "total_steps": 9627, "loss": 1.6211, "learning_rate": 2.331013273964947e-05, "epoch": 0.6792354835358887, "percentage": 67.92, "elapsed_time": "2 days, 2:05:57", "remaining_time": "23:39:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6540, "total_steps": 9627, "loss": 1.6159, "learning_rate": 2.3296336665331032e-05, "epoch": 0.679339358055469, "percentage": 67.93, "elapsed_time": "2 days, 2:06:26", "remaining_time": "23:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6541, "total_steps": 9627, "loss": 1.6425, "learning_rate": 2.3282543434744407e-05, "epoch": 0.6794432325750493, "percentage": 67.94, "elapsed_time": "2 days, 2:06:56", "remaining_time": "23:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6542, "total_steps": 9627, "loss": 1.6235, "learning_rate": 2.3268753049358522e-05, "epoch": 0.6795471070946297, "percentage": 67.95, "elapsed_time": "2 days, 2:07:25", "remaining_time": "23:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6543, "total_steps": 9627, "loss": 1.8103, "learning_rate": 2.3254965510641928e-05, "epoch": 0.67965098161421, "percentage": 67.97, "elapsed_time": "2 days, 2:07:56", "remaining_time": "23:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6544, "total_steps": 9627, "loss": 1.6595, "learning_rate": 2.3241180820062885e-05, "epoch": 0.6797548561337904, "percentage": 67.98, "elapsed_time": "2 days, 2:08:25", "remaining_time": "23:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6545, "total_steps": 9627, "loss": 1.586, "learning_rate": 2.3227398979089353e-05, "epoch": 0.6798587306533708, "percentage": 67.99, "elapsed_time": "2 days, 2:08:56", "remaining_time": "23:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6546, "total_steps": 9627, "loss": 1.4932, "learning_rate": 2.3213619989189006e-05, "epoch": 0.679962605172951, "percentage": 68.0, "elapsed_time": "2 days, 2:09:25", "remaining_time": "23:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6547, "total_steps": 9627, "loss": 1.6931, "learning_rate": 2.319984385182918e-05, "epoch": 0.6800664796925314, "percentage": 68.01, "elapsed_time": "2 days, 2:09:55", "remaining_time": "23:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6548, "total_steps": 9627, "loss": 1.5665, "learning_rate": 2.318607056847692e-05, "epoch": 0.6801703542121118, "percentage": 68.02, "elapsed_time": "2 days, 2:10:25", "remaining_time": "23:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6549, "total_steps": 9627, "loss": 1.7028, "learning_rate": 2.3172300140599024e-05, "epoch": 0.6802742287316921, "percentage": 68.03, "elapsed_time": "2 days, 2:10:55", "remaining_time": "23:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6550, "total_steps": 9627, "loss": 1.5754, "learning_rate": 2.315853256966186e-05, "epoch": 0.6803781032512725, "percentage": 68.04, "elapsed_time": "2 days, 2:11:25", "remaining_time": "23:34:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6551, "total_steps": 9627, "loss": 1.8211, "learning_rate": 2.314476785713163e-05, "epoch": 0.6804819777708528, "percentage": 68.05, "elapsed_time": "2 days, 2:11:55", "remaining_time": "23:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6552, "total_steps": 9627, "loss": 1.5858, "learning_rate": 2.3131006004474152e-05, "epoch": 0.6805858522904331, "percentage": 68.06, "elapsed_time": "2 days, 2:12:25", "remaining_time": "23:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6553, "total_steps": 9627, "loss": 1.9818, "learning_rate": 2.3117247013154918e-05, "epoch": 0.6806897268100135, "percentage": 68.07, "elapsed_time": "2 days, 2:12:55", "remaining_time": "23:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6554, "total_steps": 9627, "loss": 1.519, "learning_rate": 2.31034908846392e-05, "epoch": 0.6807936013295939, "percentage": 68.08, "elapsed_time": "2 days, 2:13:24", "remaining_time": "23:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6555, "total_steps": 9627, "loss": 1.6836, "learning_rate": 2.3089737620391906e-05, "epoch": 0.6808974758491741, "percentage": 68.09, "elapsed_time": "2 days, 2:13:54", "remaining_time": "23:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6556, "total_steps": 9627, "loss": 1.6183, "learning_rate": 2.307598722187765e-05, "epoch": 0.6810013503687545, "percentage": 68.1, "elapsed_time": "2 days, 2:14:24", "remaining_time": "23:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6557, "total_steps": 9627, "loss": 1.7593, "learning_rate": 2.306223969056073e-05, "epoch": 0.6811052248883349, "percentage": 68.11, "elapsed_time": "2 days, 2:14:54", "remaining_time": "23:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6558, "total_steps": 9627, "loss": 1.5302, "learning_rate": 2.3048495027905166e-05, "epoch": 0.6812090994079152, "percentage": 68.12, "elapsed_time": "2 days, 2:15:24", "remaining_time": "23:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6559, "total_steps": 9627, "loss": 1.5051, "learning_rate": 2.303475323537465e-05, "epoch": 0.6813129739274956, "percentage": 68.13, "elapsed_time": "2 days, 2:15:54", "remaining_time": "23:30:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6560, "total_steps": 9627, "loss": 1.9087, "learning_rate": 2.302101431443256e-05, "epoch": 0.681416848447076, "percentage": 68.14, "elapsed_time": "2 days, 2:16:23", "remaining_time": "23:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6561, "total_steps": 9627, "loss": 1.6909, "learning_rate": 2.300727826654202e-05, "epoch": 0.6815207229666563, "percentage": 68.15, "elapsed_time": "2 days, 2:16:53", "remaining_time": "23:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6562, "total_steps": 9627, "loss": 1.6303, "learning_rate": 2.299354509316579e-05, "epoch": 0.6816245974862366, "percentage": 68.16, "elapsed_time": "2 days, 2:17:24", "remaining_time": "23:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6563, "total_steps": 9627, "loss": 1.8708, "learning_rate": 2.297981479576635e-05, "epoch": 0.681728472005817, "percentage": 68.17, "elapsed_time": "2 days, 2:17:53", "remaining_time": "23:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6564, "total_steps": 9627, "loss": 1.6224, "learning_rate": 2.2966087375805874e-05, "epoch": 0.6818323465253974, "percentage": 68.18, "elapsed_time": "2 days, 2:18:22", "remaining_time": "23:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6565, "total_steps": 9627, "loss": 1.5744, "learning_rate": 2.2952362834746216e-05, "epoch": 0.6819362210449776, "percentage": 68.19, "elapsed_time": "2 days, 2:18:53", "remaining_time": "23:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6566, "total_steps": 9627, "loss": 1.5341, "learning_rate": 2.2938641174048936e-05, "epoch": 0.682040095564558, "percentage": 68.2, "elapsed_time": "2 days, 2:19:23", "remaining_time": "23:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6567, "total_steps": 9627, "loss": 1.8871, "learning_rate": 2.2924922395175268e-05, "epoch": 0.6821439700841384, "percentage": 68.21, "elapsed_time": "2 days, 2:19:53", "remaining_time": "23:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6568, "total_steps": 9627, "loss": 1.8006, "learning_rate": 2.2911206499586207e-05, "epoch": 0.6822478446037187, "percentage": 68.22, "elapsed_time": "2 days, 2:20:22", "remaining_time": "23:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6569, "total_steps": 9627, "loss": 1.6603, "learning_rate": 2.2897493488742317e-05, "epoch": 0.6823517191232991, "percentage": 68.24, "elapsed_time": "2 days, 2:20:53", "remaining_time": "23:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6570, "total_steps": 9627, "loss": 1.5109, "learning_rate": 2.2883783364103976e-05, "epoch": 0.6824555936428794, "percentage": 68.25, "elapsed_time": "2 days, 2:21:23", "remaining_time": "23:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6571, "total_steps": 9627, "loss": 1.7607, "learning_rate": 2.2870076127131196e-05, "epoch": 0.6825594681624597, "percentage": 68.26, "elapsed_time": "2 days, 2:21:52", "remaining_time": "23:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6572, "total_steps": 9627, "loss": 1.7517, "learning_rate": 2.2856371779283692e-05, "epoch": 0.6826633426820401, "percentage": 68.27, "elapsed_time": "2 days, 2:22:23", "remaining_time": "23:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6573, "total_steps": 9627, "loss": 1.7537, "learning_rate": 2.2842670322020858e-05, "epoch": 0.6827672172016205, "percentage": 68.28, "elapsed_time": "2 days, 2:22:52", "remaining_time": "23:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6574, "total_steps": 9627, "loss": 1.5869, "learning_rate": 2.2828971756801802e-05, "epoch": 0.6828710917212008, "percentage": 68.29, "elapsed_time": "2 days, 2:23:23", "remaining_time": "23:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6575, "total_steps": 9627, "loss": 1.5199, "learning_rate": 2.2815276085085313e-05, "epoch": 0.6829749662407811, "percentage": 68.3, "elapsed_time": "2 days, 2:23:52", "remaining_time": "23:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6576, "total_steps": 9627, "loss": 1.6698, "learning_rate": 2.2801583308329848e-05, "epoch": 0.6830788407603615, "percentage": 68.31, "elapsed_time": "2 days, 2:24:23", "remaining_time": "23:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6577, "total_steps": 9627, "loss": 1.582, "learning_rate": 2.2787893427993646e-05, "epoch": 0.6831827152799418, "percentage": 68.32, "elapsed_time": "2 days, 2:24:52", "remaining_time": "23:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6578, "total_steps": 9627, "loss": 1.4429, "learning_rate": 2.2774206445534495e-05, "epoch": 0.6832865897995222, "percentage": 68.33, "elapsed_time": "2 days, 2:25:23", "remaining_time": "23:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6579, "total_steps": 9627, "loss": 1.5655, "learning_rate": 2.2760522362410003e-05, "epoch": 0.6833904643191026, "percentage": 68.34, "elapsed_time": "2 days, 2:25:52", "remaining_time": "23:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6580, "total_steps": 9627, "loss": 1.6493, "learning_rate": 2.274684118007743e-05, "epoch": 0.6834943388386828, "percentage": 68.35, "elapsed_time": "2 days, 2:26:22", "remaining_time": "23:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6581, "total_steps": 9627, "loss": 1.4814, "learning_rate": 2.2733162899993642e-05, "epoch": 0.6835982133582632, "percentage": 68.36, "elapsed_time": "2 days, 2:26:52", "remaining_time": "23:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6582, "total_steps": 9627, "loss": 1.5412, "learning_rate": 2.271948752361534e-05, "epoch": 0.6837020878778436, "percentage": 68.37, "elapsed_time": "2 days, 2:27:22", "remaining_time": "23:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6583, "total_steps": 9627, "loss": 1.6233, "learning_rate": 2.2705815052398816e-05, "epoch": 0.6838059623974239, "percentage": 68.38, "elapsed_time": "2 days, 2:27:52", "remaining_time": "23:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6584, "total_steps": 9627, "loss": 1.6233, "learning_rate": 2.2692145487800093e-05, "epoch": 0.6839098369170042, "percentage": 68.39, "elapsed_time": "2 days, 2:28:21", "remaining_time": "23:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6585, "total_steps": 9627, "loss": 1.8792, "learning_rate": 2.2678478831274858e-05, "epoch": 0.6840137114365846, "percentage": 68.4, "elapsed_time": "2 days, 2:28:51", "remaining_time": "23:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6586, "total_steps": 9627, "loss": 1.6535, "learning_rate": 2.266481508427852e-05, "epoch": 0.6841175859561649, "percentage": 68.41, "elapsed_time": "2 days, 2:29:21", "remaining_time": "23:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6587, "total_steps": 9627, "loss": 1.5587, "learning_rate": 2.2651154248266145e-05, "epoch": 0.6842214604757453, "percentage": 68.42, "elapsed_time": "2 days, 2:29:51", "remaining_time": "23:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6588, "total_steps": 9627, "loss": 1.6661, "learning_rate": 2.2637496324692496e-05, "epoch": 0.6843253349953257, "percentage": 68.43, "elapsed_time": "2 days, 2:30:21", "remaining_time": "23:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6589, "total_steps": 9627, "loss": 1.7157, "learning_rate": 2.2623841315012072e-05, "epoch": 0.684429209514906, "percentage": 68.44, "elapsed_time": "2 days, 2:30:51", "remaining_time": "23:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6590, "total_steps": 9627, "loss": 1.7036, "learning_rate": 2.2610189220679007e-05, "epoch": 0.6845330840344863, "percentage": 68.45, "elapsed_time": "2 days, 2:31:20", "remaining_time": "23:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6591, "total_steps": 9627, "loss": 1.6208, "learning_rate": 2.2596540043147142e-05, "epoch": 0.6846369585540667, "percentage": 68.46, "elapsed_time": "2 days, 2:31:51", "remaining_time": "23:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6592, "total_steps": 9627, "loss": 1.8271, "learning_rate": 2.2582893783870006e-05, "epoch": 0.6847408330736471, "percentage": 68.47, "elapsed_time": "2 days, 2:32:21", "remaining_time": "23:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6593, "total_steps": 9627, "loss": 1.638, "learning_rate": 2.256925044430082e-05, "epoch": 0.6848447075932274, "percentage": 68.48, "elapsed_time": "2 days, 2:32:51", "remaining_time": "23:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6594, "total_steps": 9627, "loss": 1.5826, "learning_rate": 2.2555610025892498e-05, "epoch": 0.6849485821128077, "percentage": 68.49, "elapsed_time": "2 days, 2:33:21", "remaining_time": "23:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6595, "total_steps": 9627, "loss": 1.5875, "learning_rate": 2.254197253009761e-05, "epoch": 0.6850524566323881, "percentage": 68.51, "elapsed_time": "2 days, 2:33:51", "remaining_time": "23:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6596, "total_steps": 9627, "loss": 1.6933, "learning_rate": 2.2528337958368507e-05, "epoch": 0.6851563311519684, "percentage": 68.52, "elapsed_time": "2 days, 2:34:20", "remaining_time": "23:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6597, "total_steps": 9627, "loss": 1.5773, "learning_rate": 2.2514706312157085e-05, "epoch": 0.6852602056715488, "percentage": 68.53, "elapsed_time": "2 days, 2:34:50", "remaining_time": "23:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6598, "total_steps": 9627, "loss": 1.6426, "learning_rate": 2.2501077592915065e-05, "epoch": 0.6853640801911292, "percentage": 68.54, "elapsed_time": "2 days, 2:35:20", "remaining_time": "23:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6599, "total_steps": 9627, "loss": 1.5363, "learning_rate": 2.2487451802093784e-05, "epoch": 0.6854679547107094, "percentage": 68.55, "elapsed_time": "2 days, 2:35:50", "remaining_time": "23:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6600, "total_steps": 9627, "loss": 1.5895, "learning_rate": 2.2473828941144276e-05, "epoch": 0.6855718292302898, "percentage": 68.56, "elapsed_time": "2 days, 2:36:20", "remaining_time": "23:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6601, "total_steps": 9627, "loss": 1.6797, "learning_rate": 2.246020901151728e-05, "epoch": 0.6856757037498702, "percentage": 68.57, "elapsed_time": "2 days, 2:36:49", "remaining_time": "23:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6602, "total_steps": 9627, "loss": 1.6592, "learning_rate": 2.24465920146632e-05, "epoch": 0.6857795782694505, "percentage": 68.58, "elapsed_time": "2 days, 2:37:19", "remaining_time": "23:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6603, "total_steps": 9627, "loss": 1.7151, "learning_rate": 2.2432977952032148e-05, "epoch": 0.6858834527890308, "percentage": 68.59, "elapsed_time": "2 days, 2:37:49", "remaining_time": "23:11:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6604, "total_steps": 9627, "loss": 1.8579, "learning_rate": 2.2419366825073894e-05, "epoch": 0.6859873273086112, "percentage": 68.6, "elapsed_time": "2 days, 2:38:19", "remaining_time": "23:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6605, "total_steps": 9627, "loss": 1.57, "learning_rate": 2.2405758635237973e-05, "epoch": 0.6860912018281915, "percentage": 68.61, "elapsed_time": "2 days, 2:38:49", "remaining_time": "23:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6606, "total_steps": 9627, "loss": 1.7868, "learning_rate": 2.2392153383973473e-05, "epoch": 0.6861950763477719, "percentage": 68.62, "elapsed_time": "2 days, 2:39:19", "remaining_time": "23:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6607, "total_steps": 9627, "loss": 1.7668, "learning_rate": 2.2378551072729314e-05, "epoch": 0.6862989508673523, "percentage": 68.63, "elapsed_time": "2 days, 2:39:48", "remaining_time": "23:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6608, "total_steps": 9627, "loss": 1.7325, "learning_rate": 2.2364951702954025e-05, "epoch": 0.6864028253869325, "percentage": 68.64, "elapsed_time": "2 days, 2:40:18", "remaining_time": "23:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6609, "total_steps": 9627, "loss": 1.8742, "learning_rate": 2.235135527609578e-05, "epoch": 0.6865066999065129, "percentage": 68.65, "elapsed_time": "2 days, 2:40:48", "remaining_time": "23:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6610, "total_steps": 9627, "loss": 1.5874, "learning_rate": 2.233776179360255e-05, "epoch": 0.6866105744260933, "percentage": 68.66, "elapsed_time": "2 days, 2:41:19", "remaining_time": "23:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6611, "total_steps": 9627, "loss": 1.8026, "learning_rate": 2.2324171256921918e-05, "epoch": 0.6867144489456736, "percentage": 68.67, "elapsed_time": "2 days, 2:41:48", "remaining_time": "23:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6612, "total_steps": 9627, "loss": 1.68, "learning_rate": 2.2310583667501163e-05, "epoch": 0.686818323465254, "percentage": 68.68, "elapsed_time": "2 days, 2:42:20", "remaining_time": "23:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6613, "total_steps": 9627, "loss": 1.5025, "learning_rate": 2.2296999026787262e-05, "epoch": 0.6869221979848343, "percentage": 68.69, "elapsed_time": "2 days, 2:42:50", "remaining_time": "23:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6614, "total_steps": 9627, "loss": 1.6217, "learning_rate": 2.2283417336226853e-05, "epoch": 0.6870260725044147, "percentage": 68.7, "elapsed_time": "2 days, 2:43:19", "remaining_time": "23:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6615, "total_steps": 9627, "loss": 1.5827, "learning_rate": 2.2269838597266342e-05, "epoch": 0.687129947023995, "percentage": 68.71, "elapsed_time": "2 days, 2:43:50", "remaining_time": "23:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6616, "total_steps": 9627, "loss": 1.7894, "learning_rate": 2.2256262811351676e-05, "epoch": 0.6872338215435754, "percentage": 68.72, "elapsed_time": "2 days, 2:44:21", "remaining_time": "23:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6617, "total_steps": 9627, "loss": 1.5107, "learning_rate": 2.2242689979928632e-05, "epoch": 0.6873376960631558, "percentage": 68.73, "elapsed_time": "2 days, 2:44:51", "remaining_time": "23:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6618, "total_steps": 9627, "loss": 1.6793, "learning_rate": 2.222912010444259e-05, "epoch": 0.687441570582736, "percentage": 68.74, "elapsed_time": "2 days, 2:45:21", "remaining_time": "23:04:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6619, "total_steps": 9627, "loss": 1.6067, "learning_rate": 2.2215553186338635e-05, "epoch": 0.6875454451023164, "percentage": 68.75, "elapsed_time": "2 days, 2:45:50", "remaining_time": "23:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6620, "total_steps": 9627, "loss": 1.6807, "learning_rate": 2.2201989227061535e-05, "epoch": 0.6876493196218968, "percentage": 68.76, "elapsed_time": "2 days, 2:46:20", "remaining_time": "23:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6621, "total_steps": 9627, "loss": 1.5434, "learning_rate": 2.2188428228055756e-05, "epoch": 0.6877531941414771, "percentage": 68.78, "elapsed_time": "2 days, 2:46:50", "remaining_time": "23:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6622, "total_steps": 9627, "loss": 1.6909, "learning_rate": 2.2174870190765428e-05, "epoch": 0.6878570686610574, "percentage": 68.79, "elapsed_time": "2 days, 2:47:20", "remaining_time": "23:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6623, "total_steps": 9627, "loss": 1.7252, "learning_rate": 2.2161315116634362e-05, "epoch": 0.6879609431806378, "percentage": 68.8, "elapsed_time": "2 days, 2:47:50", "remaining_time": "23:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6624, "total_steps": 9627, "loss": 1.7813, "learning_rate": 2.2147763007106126e-05, "epoch": 0.6880648177002181, "percentage": 68.81, "elapsed_time": "2 days, 2:48:20", "remaining_time": "23:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6625, "total_steps": 9627, "loss": 1.7338, "learning_rate": 2.213421386362383e-05, "epoch": 0.6881686922197985, "percentage": 68.82, "elapsed_time": "2 days, 2:48:51", "remaining_time": "23:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6626, "total_steps": 9627, "loss": 1.7215, "learning_rate": 2.212066768763042e-05, "epoch": 0.6882725667393789, "percentage": 68.83, "elapsed_time": "2 days, 2:49:21", "remaining_time": "23:01:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6627, "total_steps": 9627, "loss": 1.5899, "learning_rate": 2.2107124480568435e-05, "epoch": 0.6883764412589591, "percentage": 68.84, "elapsed_time": "2 days, 2:49:51", "remaining_time": "23:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6628, "total_steps": 9627, "loss": 1.6213, "learning_rate": 2.2093584243880116e-05, "epoch": 0.6884803157785395, "percentage": 68.85, "elapsed_time": "2 days, 2:50:21", "remaining_time": "23:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6629, "total_steps": 9627, "loss": 1.5516, "learning_rate": 2.20800469790074e-05, "epoch": 0.6885841902981199, "percentage": 68.86, "elapsed_time": "2 days, 2:50:52", "remaining_time": "22:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6630, "total_steps": 9627, "loss": 1.6291, "learning_rate": 2.2066512687391898e-05, "epoch": 0.6886880648177002, "percentage": 68.87, "elapsed_time": "2 days, 2:51:21", "remaining_time": "22:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6631, "total_steps": 9627, "loss": 1.819, "learning_rate": 2.20529813704749e-05, "epoch": 0.6887919393372806, "percentage": 68.88, "elapsed_time": "2 days, 2:51:52", "remaining_time": "22:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6632, "total_steps": 9627, "loss": 1.7297, "learning_rate": 2.2039453029697378e-05, "epoch": 0.6888958138568609, "percentage": 68.89, "elapsed_time": "2 days, 2:52:22", "remaining_time": "22:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6633, "total_steps": 9627, "loss": 1.6097, "learning_rate": 2.202592766650004e-05, "epoch": 0.6889996883764412, "percentage": 68.9, "elapsed_time": "2 days, 2:52:52", "remaining_time": "22:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6634, "total_steps": 9627, "loss": 1.4958, "learning_rate": 2.2012405282323166e-05, "epoch": 0.6891035628960216, "percentage": 68.91, "elapsed_time": "2 days, 2:53:21", "remaining_time": "22:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6635, "total_steps": 9627, "loss": 1.5057, "learning_rate": 2.1998885878606835e-05, "epoch": 0.689207437415602, "percentage": 68.92, "elapsed_time": "2 days, 2:53:53", "remaining_time": "22:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6636, "total_steps": 9627, "loss": 1.614, "learning_rate": 2.1985369456790757e-05, "epoch": 0.6893113119351822, "percentage": 68.93, "elapsed_time": "2 days, 2:54:22", "remaining_time": "22:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6637, "total_steps": 9627, "loss": 1.8599, "learning_rate": 2.1971856018314274e-05, "epoch": 0.6894151864547626, "percentage": 68.94, "elapsed_time": "2 days, 2:54:52", "remaining_time": "22:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6638, "total_steps": 9627, "loss": 1.6569, "learning_rate": 2.1958345564616515e-05, "epoch": 0.689519060974343, "percentage": 68.95, "elapsed_time": "2 days, 2:55:22", "remaining_time": "22:55:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6639, "total_steps": 9627, "loss": 1.6422, "learning_rate": 2.1944838097136205e-05, "epoch": 0.6896229354939234, "percentage": 68.96, "elapsed_time": "2 days, 2:55:52", "remaining_time": "22:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6640, "total_steps": 9627, "loss": 1.8098, "learning_rate": 2.1931333617311833e-05, "epoch": 0.6897268100135037, "percentage": 68.97, "elapsed_time": "2 days, 2:56:21", "remaining_time": "22:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6641, "total_steps": 9627, "loss": 1.6439, "learning_rate": 2.1917832126581467e-05, "epoch": 0.689830684533084, "percentage": 68.98, "elapsed_time": "2 days, 2:56:52", "remaining_time": "22:54:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6642, "total_steps": 9627, "loss": 1.6079, "learning_rate": 2.1904333626382918e-05, "epoch": 0.6899345590526644, "percentage": 68.99, "elapsed_time": "2 days, 2:57:22", "remaining_time": "22:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6643, "total_steps": 9627, "loss": 1.6243, "learning_rate": 2.189083811815371e-05, "epoch": 0.6900384335722447, "percentage": 69.0, "elapsed_time": "2 days, 2:57:53", "remaining_time": "22:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6644, "total_steps": 9627, "loss": 1.8424, "learning_rate": 2.187734560333095e-05, "epoch": 0.6901423080918251, "percentage": 69.01, "elapsed_time": "2 days, 2:58:24", "remaining_time": "22:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6645, "total_steps": 9627, "loss": 1.5472, "learning_rate": 2.186385608335154e-05, "epoch": 0.6902461826114055, "percentage": 69.02, "elapsed_time": "2 days, 2:58:53", "remaining_time": "22:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6646, "total_steps": 9627, "loss": 1.5287, "learning_rate": 2.1850369559651984e-05, "epoch": 0.6903500571309857, "percentage": 69.04, "elapsed_time": "2 days, 2:59:23", "remaining_time": "22:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6647, "total_steps": 9627, "loss": 1.5671, "learning_rate": 2.1836886033668495e-05, "epoch": 0.6904539316505661, "percentage": 69.05, "elapsed_time": "2 days, 2:59:53", "remaining_time": "22:51:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6648, "total_steps": 9627, "loss": 1.6821, "learning_rate": 2.1823405506836962e-05, "epoch": 0.6905578061701465, "percentage": 69.06, "elapsed_time": "2 days, 3:00:23", "remaining_time": "22:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6649, "total_steps": 9627, "loss": 1.6621, "learning_rate": 2.180992798059296e-05, "epoch": 0.6906616806897268, "percentage": 69.07, "elapsed_time": "2 days, 3:00:54", "remaining_time": "22:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6650, "total_steps": 9627, "loss": 1.5388, "learning_rate": 2.1796453456371735e-05, "epoch": 0.6907655552093072, "percentage": 69.08, "elapsed_time": "2 days, 3:01:24", "remaining_time": "22:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6651, "total_steps": 9627, "loss": 1.5155, "learning_rate": 2.17829819356082e-05, "epoch": 0.6908694297288875, "percentage": 69.09, "elapsed_time": "2 days, 3:01:54", "remaining_time": "22:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6652, "total_steps": 9627, "loss": 1.768, "learning_rate": 2.1769513419737024e-05, "epoch": 0.6909733042484678, "percentage": 69.1, "elapsed_time": "2 days, 3:02:24", "remaining_time": "22:49:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6653, "total_steps": 9627, "loss": 1.6215, "learning_rate": 2.1756047910192428e-05, "epoch": 0.6910771787680482, "percentage": 69.11, "elapsed_time": "2 days, 3:02:55", "remaining_time": "22:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6654, "total_steps": 9627, "loss": 1.7715, "learning_rate": 2.1742585408408438e-05, "epoch": 0.6911810532876286, "percentage": 69.12, "elapsed_time": "2 days, 3:03:25", "remaining_time": "22:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6655, "total_steps": 9627, "loss": 1.7967, "learning_rate": 2.1729125915818684e-05, "epoch": 0.6912849278072088, "percentage": 69.13, "elapsed_time": "2 days, 3:03:55", "remaining_time": "22:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6656, "total_steps": 9627, "loss": 1.6482, "learning_rate": 2.17156694338565e-05, "epoch": 0.6913888023267892, "percentage": 69.14, "elapsed_time": "2 days, 3:04:25", "remaining_time": "22:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6657, "total_steps": 9627, "loss": 1.6526, "learning_rate": 2.1702215963954893e-05, "epoch": 0.6914926768463696, "percentage": 69.15, "elapsed_time": "2 days, 3:04:55", "remaining_time": "22:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6658, "total_steps": 9627, "loss": 1.3809, "learning_rate": 2.1688765507546556e-05, "epoch": 0.6915965513659499, "percentage": 69.16, "elapsed_time": "2 days, 3:05:27", "remaining_time": "22:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6659, "total_steps": 9627, "loss": 1.6426, "learning_rate": 2.1675318066063855e-05, "epoch": 0.6917004258855303, "percentage": 69.17, "elapsed_time": "2 days, 3:05:56", "remaining_time": "22:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6660, "total_steps": 9627, "loss": 1.6819, "learning_rate": 2.166187364093882e-05, "epoch": 0.6918043004051107, "percentage": 69.18, "elapsed_time": "2 days, 3:06:27", "remaining_time": "22:46:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6661, "total_steps": 9627, "loss": 1.8221, "learning_rate": 2.1648432233603232e-05, "epoch": 0.6919081749246909, "percentage": 69.19, "elapsed_time": "2 days, 3:06:57", "remaining_time": "22:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6662, "total_steps": 9627, "loss": 1.707, "learning_rate": 2.1634993845488426e-05, "epoch": 0.6920120494442713, "percentage": 69.2, "elapsed_time": "2 days, 3:07:27", "remaining_time": "22:45:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6663, "total_steps": 9627, "loss": 1.6048, "learning_rate": 2.162155847802554e-05, "epoch": 0.6921159239638517, "percentage": 69.21, "elapsed_time": "2 days, 3:07:57", "remaining_time": "22:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6664, "total_steps": 9627, "loss": 1.8689, "learning_rate": 2.1608126132645317e-05, "epoch": 0.6922197984834321, "percentage": 69.22, "elapsed_time": "2 days, 3:08:27", "remaining_time": "22:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6665, "total_steps": 9627, "loss": 1.7781, "learning_rate": 2.1594696810778193e-05, "epoch": 0.6923236730030123, "percentage": 69.23, "elapsed_time": "2 days, 3:08:58", "remaining_time": "22:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6666, "total_steps": 9627, "loss": 1.71, "learning_rate": 2.1581270513854283e-05, "epoch": 0.6924275475225927, "percentage": 69.24, "elapsed_time": "2 days, 3:09:28", "remaining_time": "22:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6667, "total_steps": 9627, "loss": 1.7161, "learning_rate": 2.156784724330338e-05, "epoch": 0.6925314220421731, "percentage": 69.25, "elapsed_time": "2 days, 3:09:58", "remaining_time": "22:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6668, "total_steps": 9627, "loss": 1.5071, "learning_rate": 2.1554427000555e-05, "epoch": 0.6926352965617534, "percentage": 69.26, "elapsed_time": "2 days, 3:10:29", "remaining_time": "22:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6669, "total_steps": 9627, "loss": 1.9258, "learning_rate": 2.154100978703824e-05, "epoch": 0.6927391710813338, "percentage": 69.27, "elapsed_time": "2 days, 3:10:59", "remaining_time": "22:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6670, "total_steps": 9627, "loss": 1.4963, "learning_rate": 2.1527595604181933e-05, "epoch": 0.6928430456009141, "percentage": 69.28, "elapsed_time": "2 days, 3:11:28", "remaining_time": "22:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6671, "total_steps": 9627, "loss": 1.745, "learning_rate": 2.151418445341463e-05, "epoch": 0.6929469201204944, "percentage": 69.29, "elapsed_time": "2 days, 3:12:01", "remaining_time": "22:41:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6672, "total_steps": 9627, "loss": 1.6489, "learning_rate": 2.1500776336164456e-05, "epoch": 0.6930507946400748, "percentage": 69.31, "elapsed_time": "2 days, 3:12:30", "remaining_time": "22:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6673, "total_steps": 9627, "loss": 1.8266, "learning_rate": 2.1487371253859316e-05, "epoch": 0.6931546691596552, "percentage": 69.32, "elapsed_time": "2 days, 3:13:00", "remaining_time": "22:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6674, "total_steps": 9627, "loss": 1.6169, "learning_rate": 2.1473969207926737e-05, "epoch": 0.6932585436792355, "percentage": 69.33, "elapsed_time": "2 days, 3:13:30", "remaining_time": "22:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6675, "total_steps": 9627, "loss": 1.7495, "learning_rate": 2.1460570199793917e-05, "epoch": 0.6933624181988158, "percentage": 69.34, "elapsed_time": "2 days, 3:14:01", "remaining_time": "22:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6676, "total_steps": 9627, "loss": 1.7681, "learning_rate": 2.1447174230887757e-05, "epoch": 0.6934662927183962, "percentage": 69.35, "elapsed_time": "2 days, 3:14:31", "remaining_time": "22:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6677, "total_steps": 9627, "loss": 1.665, "learning_rate": 2.143378130263482e-05, "epoch": 0.6935701672379765, "percentage": 69.36, "elapsed_time": "2 days, 3:15:02", "remaining_time": "22:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6678, "total_steps": 9627, "loss": 1.6799, "learning_rate": 2.142039141646135e-05, "epoch": 0.6936740417575569, "percentage": 69.37, "elapsed_time": "2 days, 3:15:33", "remaining_time": "22:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6679, "total_steps": 9627, "loss": 1.6812, "learning_rate": 2.140700457379325e-05, "epoch": 0.6937779162771373, "percentage": 69.38, "elapsed_time": "2 days, 3:16:02", "remaining_time": "22:37:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6680, "total_steps": 9627, "loss": 1.7876, "learning_rate": 2.1393620776056163e-05, "epoch": 0.6938817907967175, "percentage": 69.39, "elapsed_time": "2 days, 3:16:32", "remaining_time": "22:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6681, "total_steps": 9627, "loss": 1.3614, "learning_rate": 2.1380240024675285e-05, "epoch": 0.6939856653162979, "percentage": 69.4, "elapsed_time": "2 days, 3:17:02", "remaining_time": "22:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6682, "total_steps": 9627, "loss": 1.7599, "learning_rate": 2.136686232107562e-05, "epoch": 0.6940895398358783, "percentage": 69.41, "elapsed_time": "2 days, 3:17:34", "remaining_time": "22:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6683, "total_steps": 9627, "loss": 1.663, "learning_rate": 2.1353487666681777e-05, "epoch": 0.6941934143554586, "percentage": 69.42, "elapsed_time": "2 days, 3:18:04", "remaining_time": "22:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6684, "total_steps": 9627, "loss": 1.8039, "learning_rate": 2.134011606291804e-05, "epoch": 0.6942972888750389, "percentage": 69.43, "elapsed_time": "2 days, 3:18:34", "remaining_time": "22:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6685, "total_steps": 9627, "loss": 1.7361, "learning_rate": 2.132674751120839e-05, "epoch": 0.6944011633946193, "percentage": 69.44, "elapsed_time": "2 days, 3:19:04", "remaining_time": "22:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6686, "total_steps": 9627, "loss": 1.5977, "learning_rate": 2.131338201297647e-05, "epoch": 0.6945050379141996, "percentage": 69.45, "elapsed_time": "2 days, 3:19:35", "remaining_time": "22:34:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6687, "total_steps": 9627, "loss": 1.9488, "learning_rate": 2.1300019569645596e-05, "epoch": 0.69460891243378, "percentage": 69.46, "elapsed_time": "2 days, 3:20:05", "remaining_time": "22:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6688, "total_steps": 9627, "loss": 1.7338, "learning_rate": 2.1286660182638756e-05, "epoch": 0.6947127869533604, "percentage": 69.47, "elapsed_time": "2 days, 3:20:34", "remaining_time": "22:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6689, "total_steps": 9627, "loss": 1.5402, "learning_rate": 2.1273303853378674e-05, "epoch": 0.6948166614729406, "percentage": 69.48, "elapsed_time": "2 days, 3:21:05", "remaining_time": "22:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6690, "total_steps": 9627, "loss": 1.6692, "learning_rate": 2.125995058328763e-05, "epoch": 0.694920535992521, "percentage": 69.49, "elapsed_time": "2 days, 3:21:35", "remaining_time": "22:32:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6691, "total_steps": 9627, "loss": 1.7801, "learning_rate": 2.124660037378765e-05, "epoch": 0.6950244105121014, "percentage": 69.5, "elapsed_time": "2 days, 3:22:05", "remaining_time": "22:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6692, "total_steps": 9627, "loss": 1.5115, "learning_rate": 2.1233253226300465e-05, "epoch": 0.6951282850316818, "percentage": 69.51, "elapsed_time": "2 days, 3:22:35", "remaining_time": "22:31:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6693, "total_steps": 9627, "loss": 1.8221, "learning_rate": 2.1219909142247424e-05, "epoch": 0.695232159551262, "percentage": 69.52, "elapsed_time": "2 days, 3:23:05", "remaining_time": "22:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6694, "total_steps": 9627, "loss": 1.6134, "learning_rate": 2.1206568123049564e-05, "epoch": 0.6953360340708424, "percentage": 69.53, "elapsed_time": "2 days, 3:23:35", "remaining_time": "22:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6695, "total_steps": 9627, "loss": 1.5809, "learning_rate": 2.119323017012759e-05, "epoch": 0.6954399085904228, "percentage": 69.54, "elapsed_time": "2 days, 3:24:05", "remaining_time": "22:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6696, "total_steps": 9627, "loss": 1.5416, "learning_rate": 2.1179895284901924e-05, "epoch": 0.6955437831100031, "percentage": 69.55, "elapsed_time": "2 days, 3:24:36", "remaining_time": "22:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6697, "total_steps": 9627, "loss": 1.5112, "learning_rate": 2.1166563468792594e-05, "epoch": 0.6956476576295835, "percentage": 69.56, "elapsed_time": "2 days, 3:25:07", "remaining_time": "22:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6698, "total_steps": 9627, "loss": 1.6208, "learning_rate": 2.1153234723219328e-05, "epoch": 0.6957515321491639, "percentage": 69.58, "elapsed_time": "2 days, 3:25:36", "remaining_time": "22:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6699, "total_steps": 9627, "loss": 1.7745, "learning_rate": 2.1139909049601587e-05, "epoch": 0.6958554066687441, "percentage": 69.59, "elapsed_time": "2 days, 3:26:06", "remaining_time": "22:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6700, "total_steps": 9627, "loss": 1.5898, "learning_rate": 2.1126586449358375e-05, "epoch": 0.6959592811883245, "percentage": 69.6, "elapsed_time": "2 days, 3:26:36", "remaining_time": "22:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6701, "total_steps": 9627, "loss": 1.7258, "learning_rate": 2.111326692390851e-05, "epoch": 0.6960631557079049, "percentage": 69.61, "elapsed_time": "2 days, 3:27:06", "remaining_time": "22:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6702, "total_steps": 9627, "loss": 1.6533, "learning_rate": 2.1099950474670387e-05, "epoch": 0.6961670302274852, "percentage": 69.62, "elapsed_time": "2 days, 3:27:36", "remaining_time": "22:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6703, "total_steps": 9627, "loss": 1.5623, "learning_rate": 2.1086637103062107e-05, "epoch": 0.6962709047470655, "percentage": 69.63, "elapsed_time": "2 days, 3:28:07", "remaining_time": "22:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6704, "total_steps": 9627, "loss": 1.6596, "learning_rate": 2.1073326810501448e-05, "epoch": 0.6963747792666459, "percentage": 69.64, "elapsed_time": "2 days, 3:28:37", "remaining_time": "22:26:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6705, "total_steps": 9627, "loss": 1.5612, "learning_rate": 2.1060019598405843e-05, "epoch": 0.6964786537862262, "percentage": 69.65, "elapsed_time": "2 days, 3:29:07", "remaining_time": "22:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6706, "total_steps": 9627, "loss": 1.5457, "learning_rate": 2.1046715468192414e-05, "epoch": 0.6965825283058066, "percentage": 69.66, "elapsed_time": "2 days, 3:29:37", "remaining_time": "22:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6707, "total_steps": 9627, "loss": 1.7415, "learning_rate": 2.1033414421277924e-05, "epoch": 0.696686402825387, "percentage": 69.67, "elapsed_time": "2 days, 3:30:08", "remaining_time": "22:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6708, "total_steps": 9627, "loss": 1.5627, "learning_rate": 2.1020116459078887e-05, "epoch": 0.6967902773449672, "percentage": 69.68, "elapsed_time": "2 days, 3:30:37", "remaining_time": "22:24:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6709, "total_steps": 9627, "loss": 1.6067, "learning_rate": 2.1006821583011356e-05, "epoch": 0.6968941518645476, "percentage": 69.69, "elapsed_time": "2 days, 3:31:07", "remaining_time": "22:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6710, "total_steps": 9627, "loss": 1.5778, "learning_rate": 2.099352979449119e-05, "epoch": 0.696998026384128, "percentage": 69.7, "elapsed_time": "2 days, 3:31:37", "remaining_time": "22:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6711, "total_steps": 9627, "loss": 1.685, "learning_rate": 2.0980241094933845e-05, "epoch": 0.6971019009037083, "percentage": 69.71, "elapsed_time": "2 days, 3:32:07", "remaining_time": "22:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6712, "total_steps": 9627, "loss": 1.2405, "learning_rate": 2.0966955485754457e-05, "epoch": 0.6972057754232887, "percentage": 69.72, "elapsed_time": "2 days, 3:32:38", "remaining_time": "22:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6713, "total_steps": 9627, "loss": 1.4806, "learning_rate": 2.0953672968367844e-05, "epoch": 0.697309649942869, "percentage": 69.73, "elapsed_time": "2 days, 3:33:09", "remaining_time": "22:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6714, "total_steps": 9627, "loss": 1.4771, "learning_rate": 2.094039354418849e-05, "epoch": 0.6974135244624493, "percentage": 69.74, "elapsed_time": "2 days, 3:33:38", "remaining_time": "22:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6715, "total_steps": 9627, "loss": 1.8148, "learning_rate": 2.0927117214630547e-05, "epoch": 0.6975173989820297, "percentage": 69.75, "elapsed_time": "2 days, 3:34:09", "remaining_time": "22:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6716, "total_steps": 9627, "loss": 1.7156, "learning_rate": 2.0913843981107835e-05, "epoch": 0.6976212735016101, "percentage": 69.76, "elapsed_time": "2 days, 3:34:38", "remaining_time": "22:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6717, "total_steps": 9627, "loss": 1.6558, "learning_rate": 2.0900573845033865e-05, "epoch": 0.6977251480211905, "percentage": 69.77, "elapsed_time": "2 days, 3:35:08", "remaining_time": "22:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6718, "total_steps": 9627, "loss": 1.5849, "learning_rate": 2.0887306807821822e-05, "epoch": 0.6978290225407707, "percentage": 69.78, "elapsed_time": "2 days, 3:35:38", "remaining_time": "22:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6719, "total_steps": 9627, "loss": 1.5836, "learning_rate": 2.0874042870884475e-05, "epoch": 0.6979328970603511, "percentage": 69.79, "elapsed_time": "2 days, 3:36:08", "remaining_time": "22:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6720, "total_steps": 9627, "loss": 1.7748, "learning_rate": 2.086078203563439e-05, "epoch": 0.6980367715799315, "percentage": 69.8, "elapsed_time": "2 days, 3:36:38", "remaining_time": "22:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6721, "total_steps": 9627, "loss": 1.7206, "learning_rate": 2.0847524303483728e-05, "epoch": 0.6981406460995118, "percentage": 69.81, "elapsed_time": "2 days, 3:37:08", "remaining_time": "22:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6722, "total_steps": 9627, "loss": 1.7428, "learning_rate": 2.0834269675844326e-05, "epoch": 0.6982445206190921, "percentage": 69.82, "elapsed_time": "2 days, 3:37:38", "remaining_time": "22:18:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6723, "total_steps": 9627, "loss": 1.7212, "learning_rate": 2.0821018154127686e-05, "epoch": 0.6983483951386725, "percentage": 69.83, "elapsed_time": "2 days, 3:38:07", "remaining_time": "22:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6724, "total_steps": 9627, "loss": 1.326, "learning_rate": 2.0807769739745043e-05, "epoch": 0.6984522696582528, "percentage": 69.85, "elapsed_time": "2 days, 3:38:38", "remaining_time": "22:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6725, "total_steps": 9627, "loss": 1.6675, "learning_rate": 2.0794524434107192e-05, "epoch": 0.6985561441778332, "percentage": 69.86, "elapsed_time": "2 days, 3:39:09", "remaining_time": "22:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6726, "total_steps": 9627, "loss": 1.6125, "learning_rate": 2.0781282238624666e-05, "epoch": 0.6986600186974136, "percentage": 69.87, "elapsed_time": "2 days, 3:39:39", "remaining_time": "22:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6727, "total_steps": 9627, "loss": 1.567, "learning_rate": 2.07680431547077e-05, "epoch": 0.6987638932169938, "percentage": 69.88, "elapsed_time": "2 days, 3:40:08", "remaining_time": "22:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6728, "total_steps": 9627, "loss": 1.6608, "learning_rate": 2.0754807183766084e-05, "epoch": 0.6988677677365742, "percentage": 69.89, "elapsed_time": "2 days, 3:40:39", "remaining_time": "22:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6729, "total_steps": 9627, "loss": 1.672, "learning_rate": 2.07415743272094e-05, "epoch": 0.6989716422561546, "percentage": 69.9, "elapsed_time": "2 days, 3:41:09", "remaining_time": "22:15:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6730, "total_steps": 9627, "loss": 1.6127, "learning_rate": 2.0728344586446825e-05, "epoch": 0.6990755167757349, "percentage": 69.91, "elapsed_time": "2 days, 3:41:40", "remaining_time": "22:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6731, "total_steps": 9627, "loss": 1.604, "learning_rate": 2.0715117962887224e-05, "epoch": 0.6991793912953153, "percentage": 69.92, "elapsed_time": "2 days, 3:42:09", "remaining_time": "22:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6732, "total_steps": 9627, "loss": 1.6413, "learning_rate": 2.070189445793913e-05, "epoch": 0.6992832658148956, "percentage": 69.93, "elapsed_time": "2 days, 3:42:40", "remaining_time": "22:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6733, "total_steps": 9627, "loss": 1.6768, "learning_rate": 2.068867407301074e-05, "epoch": 0.6993871403344759, "percentage": 69.94, "elapsed_time": "2 days, 3:43:11", "remaining_time": "22:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6734, "total_steps": 9627, "loss": 1.6151, "learning_rate": 2.0675456809509925e-05, "epoch": 0.6994910148540563, "percentage": 69.95, "elapsed_time": "2 days, 3:43:40", "remaining_time": "22:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6735, "total_steps": 9627, "loss": 1.6619, "learning_rate": 2.06622426688442e-05, "epoch": 0.6995948893736367, "percentage": 69.96, "elapsed_time": "2 days, 3:44:11", "remaining_time": "22:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6736, "total_steps": 9627, "loss": 1.7536, "learning_rate": 2.064903165242083e-05, "epoch": 0.699698763893217, "percentage": 69.97, "elapsed_time": "2 days, 3:44:41", "remaining_time": "22:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6737, "total_steps": 9627, "loss": 1.8067, "learning_rate": 2.06358237616466e-05, "epoch": 0.6998026384127973, "percentage": 69.98, "elapsed_time": "2 days, 3:45:13", "remaining_time": "22:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6738, "total_steps": 9627, "loss": 1.6172, "learning_rate": 2.062261899792811e-05, "epoch": 0.6999065129323777, "percentage": 69.99, "elapsed_time": "2 days, 3:45:43", "remaining_time": "22:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6739, "total_steps": 9627, "loss": 1.7188, "learning_rate": 2.0609417362671545e-05, "epoch": 0.700010387451958, "percentage": 70.0, "elapsed_time": "2 days, 3:46:14", "remaining_time": "22:11:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6740, "total_steps": 9627, "loss": 1.5628, "learning_rate": 2.0596218857282778e-05, "epoch": 0.7001142619715384, "percentage": 70.01, "elapsed_time": "2 days, 3:46:44", "remaining_time": "22:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6741, "total_steps": 9627, "loss": 1.6419, "learning_rate": 2.058302348316734e-05, "epoch": 0.7002181364911187, "percentage": 70.02, "elapsed_time": "2 days, 3:47:16", "remaining_time": "22:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6742, "total_steps": 9627, "loss": 1.5731, "learning_rate": 2.0569831241730425e-05, "epoch": 0.7003220110106991, "percentage": 70.03, "elapsed_time": "2 days, 3:47:46", "remaining_time": "22:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6743, "total_steps": 9627, "loss": 1.6441, "learning_rate": 2.0556642134376953e-05, "epoch": 0.7004258855302794, "percentage": 70.04, "elapsed_time": "2 days, 3:48:17", "remaining_time": "22:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6744, "total_steps": 9627, "loss": 1.7277, "learning_rate": 2.0543456162511386e-05, "epoch": 0.7005297600498598, "percentage": 70.05, "elapsed_time": "2 days, 3:48:48", "remaining_time": "22:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6745, "total_steps": 9627, "loss": 1.4717, "learning_rate": 2.053027332753799e-05, "epoch": 0.7006336345694402, "percentage": 70.06, "elapsed_time": "2 days, 3:49:18", "remaining_time": "22:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6746, "total_steps": 9627, "loss": 1.619, "learning_rate": 2.0517093630860633e-05, "epoch": 0.7007375090890204, "percentage": 70.07, "elapsed_time": "2 days, 3:49:48", "remaining_time": "22:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6747, "total_steps": 9627, "loss": 1.5183, "learning_rate": 2.050391707388279e-05, "epoch": 0.7008413836086008, "percentage": 70.08, "elapsed_time": "2 days, 3:50:20", "remaining_time": "22:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6748, "total_steps": 9627, "loss": 1.7367, "learning_rate": 2.049074365800772e-05, "epoch": 0.7009452581281812, "percentage": 70.09, "elapsed_time": "2 days, 3:50:50", "remaining_time": "22:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6749, "total_steps": 9627, "loss": 1.8808, "learning_rate": 2.0477573384638266e-05, "epoch": 0.7010491326477615, "percentage": 70.1, "elapsed_time": "2 days, 3:51:20", "remaining_time": "22:06:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6750, "total_steps": 9627, "loss": 1.6206, "learning_rate": 2.0464406255176966e-05, "epoch": 0.7011530071673419, "percentage": 70.12, "elapsed_time": "2 days, 3:51:51", "remaining_time": "22:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6751, "total_steps": 9627, "loss": 1.6493, "learning_rate": 2.045124227102601e-05, "epoch": 0.7012568816869222, "percentage": 70.13, "elapsed_time": "2 days, 3:52:21", "remaining_time": "22:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6752, "total_steps": 9627, "loss": 1.6487, "learning_rate": 2.043808143358727e-05, "epoch": 0.7013607562065025, "percentage": 70.14, "elapsed_time": "2 days, 3:52:52", "remaining_time": "22:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6753, "total_steps": 9627, "loss": 1.7022, "learning_rate": 2.0424923744262258e-05, "epoch": 0.7014646307260829, "percentage": 70.15, "elapsed_time": "2 days, 3:53:22", "remaining_time": "22:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6754, "total_steps": 9627, "loss": 1.7152, "learning_rate": 2.041176920445216e-05, "epoch": 0.7015685052456633, "percentage": 70.16, "elapsed_time": "2 days, 3:53:52", "remaining_time": "22:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6755, "total_steps": 9627, "loss": 1.5213, "learning_rate": 2.0398617815557875e-05, "epoch": 0.7016723797652435, "percentage": 70.17, "elapsed_time": "2 days, 3:54:22", "remaining_time": "22:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6756, "total_steps": 9627, "loss": 1.4975, "learning_rate": 2.038546957897986e-05, "epoch": 0.7017762542848239, "percentage": 70.18, "elapsed_time": "2 days, 3:54:53", "remaining_time": "22:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6757, "total_steps": 9627, "loss": 1.5669, "learning_rate": 2.037232449611835e-05, "epoch": 0.7018801288044043, "percentage": 70.19, "elapsed_time": "2 days, 3:55:23", "remaining_time": "22:03:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6758, "total_steps": 9627, "loss": 1.7064, "learning_rate": 2.0359182568373176e-05, "epoch": 0.7019840033239846, "percentage": 70.2, "elapsed_time": "2 days, 3:55:53", "remaining_time": "22:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6759, "total_steps": 9627, "loss": 1.5934, "learning_rate": 2.0346043797143854e-05, "epoch": 0.702087877843565, "percentage": 70.21, "elapsed_time": "2 days, 3:56:23", "remaining_time": "22:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6760, "total_steps": 9627, "loss": 1.6623, "learning_rate": 2.0332908183829556e-05, "epoch": 0.7021917523631453, "percentage": 70.22, "elapsed_time": "2 days, 3:56:53", "remaining_time": "22:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6761, "total_steps": 9627, "loss": 1.8849, "learning_rate": 2.031977572982912e-05, "epoch": 0.7022956268827256, "percentage": 70.23, "elapsed_time": "2 days, 3:57:23", "remaining_time": "22:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6762, "total_steps": 9627, "loss": 1.7985, "learning_rate": 2.030664643654106e-05, "epoch": 0.702399501402306, "percentage": 70.24, "elapsed_time": "2 days, 3:57:54", "remaining_time": "22:01:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6763, "total_steps": 9627, "loss": 1.5767, "learning_rate": 2.0293520305363522e-05, "epoch": 0.7025033759218864, "percentage": 70.25, "elapsed_time": "2 days, 3:58:24", "remaining_time": "22:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6764, "total_steps": 9627, "loss": 1.7073, "learning_rate": 2.028039733769438e-05, "epoch": 0.7026072504414667, "percentage": 70.26, "elapsed_time": "2 days, 3:58:55", "remaining_time": "22:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6765, "total_steps": 9627, "loss": 1.3946, "learning_rate": 2.0267277534931066e-05, "epoch": 0.702711124961047, "percentage": 70.27, "elapsed_time": "2 days, 3:59:25", "remaining_time": "21:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6766, "total_steps": 9627, "loss": 1.7273, "learning_rate": 2.0254160898470792e-05, "epoch": 0.7028149994806274, "percentage": 70.28, "elapsed_time": "2 days, 3:59:55", "remaining_time": "21:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6767, "total_steps": 9627, "loss": 1.4529, "learning_rate": 2.024104742971035e-05, "epoch": 0.7029188740002077, "percentage": 70.29, "elapsed_time": "2 days, 4:00:24", "remaining_time": "21:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6768, "total_steps": 9627, "loss": 1.4317, "learning_rate": 2.0227937130046237e-05, "epoch": 0.7030227485197881, "percentage": 70.3, "elapsed_time": "2 days, 4:00:55", "remaining_time": "21:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6769, "total_steps": 9627, "loss": 1.659, "learning_rate": 2.0214830000874586e-05, "epoch": 0.7031266230393685, "percentage": 70.31, "elapsed_time": "2 days, 4:01:26", "remaining_time": "21:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6770, "total_steps": 9627, "loss": 1.7416, "learning_rate": 2.0201726043591186e-05, "epoch": 0.7032304975589488, "percentage": 70.32, "elapsed_time": "2 days, 4:01:56", "remaining_time": "21:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6771, "total_steps": 9627, "loss": 1.6191, "learning_rate": 2.018862525959156e-05, "epoch": 0.7033343720785291, "percentage": 70.33, "elapsed_time": "2 days, 4:02:25", "remaining_time": "21:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6772, "total_steps": 9627, "loss": 1.6096, "learning_rate": 2.017552765027077e-05, "epoch": 0.7034382465981095, "percentage": 70.34, "elapsed_time": "2 days, 4:02:57", "remaining_time": "21:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6773, "total_steps": 9627, "loss": 1.7234, "learning_rate": 2.0162433217023667e-05, "epoch": 0.7035421211176899, "percentage": 70.35, "elapsed_time": "2 days, 4:03:27", "remaining_time": "21:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6774, "total_steps": 9627, "loss": 1.5358, "learning_rate": 2.0149341961244704e-05, "epoch": 0.7036459956372701, "percentage": 70.36, "elapsed_time": "2 days, 4:03:57", "remaining_time": "21:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6775, "total_steps": 9627, "loss": 1.592, "learning_rate": 2.0136253884327937e-05, "epoch": 0.7037498701568505, "percentage": 70.37, "elapsed_time": "2 days, 4:04:27", "remaining_time": "21:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6776, "total_steps": 9627, "loss": 1.6287, "learning_rate": 2.0123168987667206e-05, "epoch": 0.7038537446764309, "percentage": 70.39, "elapsed_time": "2 days, 4:04:58", "remaining_time": "21:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6777, "total_steps": 9627, "loss": 1.6935, "learning_rate": 2.011008727265593e-05, "epoch": 0.7039576191960112, "percentage": 70.4, "elapsed_time": "2 days, 4:05:28", "remaining_time": "21:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6778, "total_steps": 9627, "loss": 1.8375, "learning_rate": 2.009700874068721e-05, "epoch": 0.7040614937155916, "percentage": 70.41, "elapsed_time": "2 days, 4:05:57", "remaining_time": "21:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6779, "total_steps": 9627, "loss": 1.6755, "learning_rate": 2.0083933393153808e-05, "epoch": 0.704165368235172, "percentage": 70.42, "elapsed_time": "2 days, 4:06:27", "remaining_time": "21:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6780, "total_steps": 9627, "loss": 1.6924, "learning_rate": 2.007086123144814e-05, "epoch": 0.7042692427547522, "percentage": 70.43, "elapsed_time": "2 days, 4:06:58", "remaining_time": "21:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6781, "total_steps": 9627, "loss": 1.8002, "learning_rate": 2.00577922569623e-05, "epoch": 0.7043731172743326, "percentage": 70.44, "elapsed_time": "2 days, 4:07:28", "remaining_time": "21:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6782, "total_steps": 9627, "loss": 1.6296, "learning_rate": 2.0044726471088005e-05, "epoch": 0.704476991793913, "percentage": 70.45, "elapsed_time": "2 days, 4:07:58", "remaining_time": "21:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6783, "total_steps": 9627, "loss": 1.7662, "learning_rate": 2.0031663875216717e-05, "epoch": 0.7045808663134933, "percentage": 70.46, "elapsed_time": "2 days, 4:08:28", "remaining_time": "21:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6784, "total_steps": 9627, "loss": 1.5681, "learning_rate": 2.0018604470739434e-05, "epoch": 0.7046847408330736, "percentage": 70.47, "elapsed_time": "2 days, 4:08:58", "remaining_time": "21:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6785, "total_steps": 9627, "loss": 1.6114, "learning_rate": 2.000554825904692e-05, "epoch": 0.704788615352654, "percentage": 70.48, "elapsed_time": "2 days, 4:09:29", "remaining_time": "21:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6786, "total_steps": 9627, "loss": 1.6702, "learning_rate": 1.9992495241529556e-05, "epoch": 0.7048924898722343, "percentage": 70.49, "elapsed_time": "2 days, 4:09:58", "remaining_time": "21:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6787, "total_steps": 9627, "loss": 1.7412, "learning_rate": 1.997944541957738e-05, "epoch": 0.7049963643918147, "percentage": 70.5, "elapsed_time": "2 days, 4:10:30", "remaining_time": "21:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6788, "total_steps": 9627, "loss": 1.7816, "learning_rate": 1.99663987945801e-05, "epoch": 0.7051002389113951, "percentage": 70.51, "elapsed_time": "2 days, 4:10:59", "remaining_time": "21:49:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6789, "total_steps": 9627, "loss": 1.6678, "learning_rate": 1.9953355367927075e-05, "epoch": 0.7052041134309753, "percentage": 70.52, "elapsed_time": "2 days, 4:11:30", "remaining_time": "21:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6790, "total_steps": 9627, "loss": 1.6948, "learning_rate": 1.9940315141007327e-05, "epoch": 0.7053079879505557, "percentage": 70.53, "elapsed_time": "2 days, 4:11:59", "remaining_time": "21:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6791, "total_steps": 9627, "loss": 1.6762, "learning_rate": 1.992727811520953e-05, "epoch": 0.7054118624701361, "percentage": 70.54, "elapsed_time": "2 days, 4:12:31", "remaining_time": "21:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6792, "total_steps": 9627, "loss": 1.495, "learning_rate": 1.991424429192207e-05, "epoch": 0.7055157369897164, "percentage": 70.55, "elapsed_time": "2 days, 4:13:01", "remaining_time": "21:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6793, "total_steps": 9627, "loss": 1.6277, "learning_rate": 1.9901213672532875e-05, "epoch": 0.7056196115092968, "percentage": 70.56, "elapsed_time": "2 days, 4:13:31", "remaining_time": "21:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6794, "total_steps": 9627, "loss": 1.6252, "learning_rate": 1.988818625842967e-05, "epoch": 0.7057234860288771, "percentage": 70.57, "elapsed_time": "2 days, 4:14:02", "remaining_time": "21:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6795, "total_steps": 9627, "loss": 1.5978, "learning_rate": 1.9875162050999747e-05, "epoch": 0.7058273605484575, "percentage": 70.58, "elapsed_time": "2 days, 4:14:32", "remaining_time": "21:46:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6796, "total_steps": 9627, "loss": 1.521, "learning_rate": 1.986214105163008e-05, "epoch": 0.7059312350680378, "percentage": 70.59, "elapsed_time": "2 days, 4:15:02", "remaining_time": "21:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6797, "total_steps": 9627, "loss": 1.7809, "learning_rate": 1.9849123261707305e-05, "epoch": 0.7060351095876182, "percentage": 70.6, "elapsed_time": "2 days, 4:15:33", "remaining_time": "21:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6798, "total_steps": 9627, "loss": 1.6883, "learning_rate": 1.98361086826177e-05, "epoch": 0.7061389841071986, "percentage": 70.61, "elapsed_time": "2 days, 4:16:04", "remaining_time": "21:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6799, "total_steps": 9627, "loss": 1.6939, "learning_rate": 1.9823097315747267e-05, "epoch": 0.7062428586267788, "percentage": 70.62, "elapsed_time": "2 days, 4:16:35", "remaining_time": "21:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6800, "total_steps": 9627, "loss": 1.6935, "learning_rate": 1.9810089162481548e-05, "epoch": 0.7063467331463592, "percentage": 70.63, "elapsed_time": "2 days, 4:17:05", "remaining_time": "21:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6801, "total_steps": 9627, "loss": 1.8802, "learning_rate": 1.9797084224205857e-05, "epoch": 0.7064506076659396, "percentage": 70.65, "elapsed_time": "2 days, 4:17:36", "remaining_time": "21:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6802, "total_steps": 9627, "loss": 1.7329, "learning_rate": 1.978408250230513e-05, "epoch": 0.7065544821855199, "percentage": 70.66, "elapsed_time": "2 days, 4:18:06", "remaining_time": "21:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6803, "total_steps": 9627, "loss": 1.5892, "learning_rate": 1.977108399816388e-05, "epoch": 0.7066583567051002, "percentage": 70.67, "elapsed_time": "2 days, 4:18:37", "remaining_time": "21:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6804, "total_steps": 9627, "loss": 1.5868, "learning_rate": 1.975808871316641e-05, "epoch": 0.7067622312246806, "percentage": 70.68, "elapsed_time": "2 days, 4:19:07", "remaining_time": "21:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6805, "total_steps": 9627, "loss": 1.7898, "learning_rate": 1.97450966486966e-05, "epoch": 0.7068661057442609, "percentage": 70.69, "elapsed_time": "2 days, 4:19:38", "remaining_time": "21:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6806, "total_steps": 9627, "loss": 1.662, "learning_rate": 1.9732107806137996e-05, "epoch": 0.7069699802638413, "percentage": 70.7, "elapsed_time": "2 days, 4:20:08", "remaining_time": "21:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6807, "total_steps": 9627, "loss": 1.5625, "learning_rate": 1.971912218687381e-05, "epoch": 0.7070738547834217, "percentage": 70.71, "elapsed_time": "2 days, 4:20:39", "remaining_time": "21:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6808, "total_steps": 9627, "loss": 1.4567, "learning_rate": 1.9706139792286915e-05, "epoch": 0.7071777293030019, "percentage": 70.72, "elapsed_time": "2 days, 4:21:11", "remaining_time": "21:40:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6809, "total_steps": 9627, "loss": 1.6887, "learning_rate": 1.9693160623759826e-05, "epoch": 0.7072816038225823, "percentage": 70.73, "elapsed_time": "2 days, 4:21:41", "remaining_time": "21:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6810, "total_steps": 9627, "loss": 1.7088, "learning_rate": 1.968018468267472e-05, "epoch": 0.7073854783421627, "percentage": 70.74, "elapsed_time": "2 days, 4:22:12", "remaining_time": "21:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6811, "total_steps": 9627, "loss": 1.5636, "learning_rate": 1.9667211970413468e-05, "epoch": 0.707489352861743, "percentage": 70.75, "elapsed_time": "2 days, 4:22:43", "remaining_time": "21:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6812, "total_steps": 9627, "loss": 1.5771, "learning_rate": 1.96542424883575e-05, "epoch": 0.7075932273813234, "percentage": 70.76, "elapsed_time": "2 days, 4:23:14", "remaining_time": "21:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6813, "total_steps": 9627, "loss": 1.8045, "learning_rate": 1.9641276237888023e-05, "epoch": 0.7076971019009037, "percentage": 70.77, "elapsed_time": "2 days, 4:23:44", "remaining_time": "21:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6814, "total_steps": 9627, "loss": 1.7703, "learning_rate": 1.9628313220385818e-05, "epoch": 0.707800976420484, "percentage": 70.78, "elapsed_time": "2 days, 4:24:15", "remaining_time": "21:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6815, "total_steps": 9627, "loss": 1.4605, "learning_rate": 1.961535343723135e-05, "epoch": 0.7079048509400644, "percentage": 70.79, "elapsed_time": "2 days, 4:24:46", "remaining_time": "21:37:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6816, "total_steps": 9627, "loss": 1.6786, "learning_rate": 1.960239688980473e-05, "epoch": 0.7080087254596448, "percentage": 70.8, "elapsed_time": "2 days, 4:25:17", "remaining_time": "21:37:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6817, "total_steps": 9627, "loss": 1.5045, "learning_rate": 1.958944357948573e-05, "epoch": 0.708112599979225, "percentage": 70.81, "elapsed_time": "2 days, 4:25:48", "remaining_time": "21:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6818, "total_steps": 9627, "loss": 1.653, "learning_rate": 1.9576493507653776e-05, "epoch": 0.7082164744988054, "percentage": 70.82, "elapsed_time": "2 days, 4:26:19", "remaining_time": "21:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6819, "total_steps": 9627, "loss": 1.7776, "learning_rate": 1.9563546675687932e-05, "epoch": 0.7083203490183858, "percentage": 70.83, "elapsed_time": "2 days, 4:26:49", "remaining_time": "21:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6820, "total_steps": 9627, "loss": 1.5983, "learning_rate": 1.9550603084966973e-05, "epoch": 0.7084242235379662, "percentage": 70.84, "elapsed_time": "2 days, 4:27:21", "remaining_time": "21:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6821, "total_steps": 9627, "loss": 1.7198, "learning_rate": 1.9537662736869272e-05, "epoch": 0.7085280980575465, "percentage": 70.85, "elapsed_time": "2 days, 4:27:52", "remaining_time": "21:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6822, "total_steps": 9627, "loss": 1.6711, "learning_rate": 1.9524725632772878e-05, "epoch": 0.7086319725771268, "percentage": 70.86, "elapsed_time": "2 days, 4:28:22", "remaining_time": "21:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6823, "total_steps": 9627, "loss": 1.8374, "learning_rate": 1.9511791774055482e-05, "epoch": 0.7087358470967072, "percentage": 70.87, "elapsed_time": "2 days, 4:28:54", "remaining_time": "21:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6824, "total_steps": 9627, "loss": 1.6595, "learning_rate": 1.9498861162094446e-05, "epoch": 0.7088397216162875, "percentage": 70.88, "elapsed_time": "2 days, 4:29:24", "remaining_time": "21:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6825, "total_steps": 9627, "loss": 1.5316, "learning_rate": 1.948593379826678e-05, "epoch": 0.7089435961358679, "percentage": 70.89, "elapsed_time": "2 days, 4:29:56", "remaining_time": "21:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6826, "total_steps": 9627, "loss": 1.5832, "learning_rate": 1.947300968394913e-05, "epoch": 0.7090474706554483, "percentage": 70.9, "elapsed_time": "2 days, 4:30:26", "remaining_time": "21:32:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6827, "total_steps": 9627, "loss": 1.6259, "learning_rate": 1.946008882051786e-05, "epoch": 0.7091513451750285, "percentage": 70.92, "elapsed_time": "2 days, 4:30:58", "remaining_time": "21:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6828, "total_steps": 9627, "loss": 1.6728, "learning_rate": 1.9447171209348875e-05, "epoch": 0.7092552196946089, "percentage": 70.93, "elapsed_time": "2 days, 4:31:28", "remaining_time": "21:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6829, "total_steps": 9627, "loss": 1.5225, "learning_rate": 1.943425685181785e-05, "epoch": 0.7093590942141893, "percentage": 70.94, "elapsed_time": "2 days, 4:31:59", "remaining_time": "21:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6830, "total_steps": 9627, "loss": 1.6512, "learning_rate": 1.9421345749300073e-05, "epoch": 0.7094629687337696, "percentage": 70.95, "elapsed_time": "2 days, 4:32:31", "remaining_time": "21:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6831, "total_steps": 9627, "loss": 1.6372, "learning_rate": 1.940843790317041e-05, "epoch": 0.70956684325335, "percentage": 70.96, "elapsed_time": "2 days, 4:33:02", "remaining_time": "21:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6832, "total_steps": 9627, "loss": 1.5949, "learning_rate": 1.939553331480351e-05, "epoch": 0.7096707177729303, "percentage": 70.97, "elapsed_time": "2 days, 4:33:33", "remaining_time": "21:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6833, "total_steps": 9627, "loss": 1.682, "learning_rate": 1.9382631985573586e-05, "epoch": 0.7097745922925106, "percentage": 70.98, "elapsed_time": "2 days, 4:34:02", "remaining_time": "21:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6834, "total_steps": 9627, "loss": 1.5583, "learning_rate": 1.9369733916854526e-05, "epoch": 0.709878466812091, "percentage": 70.99, "elapsed_time": "2 days, 4:34:35", "remaining_time": "21:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6835, "total_steps": 9627, "loss": 1.6265, "learning_rate": 1.935683911001988e-05, "epoch": 0.7099823413316714, "percentage": 71.0, "elapsed_time": "2 days, 4:35:05", "remaining_time": "21:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6836, "total_steps": 9627, "loss": 1.7359, "learning_rate": 1.934394756644285e-05, "epoch": 0.7100862158512516, "percentage": 71.01, "elapsed_time": "2 days, 4:35:37", "remaining_time": "21:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6837, "total_steps": 9627, "loss": 1.6238, "learning_rate": 1.9331059287496274e-05, "epoch": 0.710190090370832, "percentage": 71.02, "elapsed_time": "2 days, 4:36:08", "remaining_time": "21:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6838, "total_steps": 9627, "loss": 1.7365, "learning_rate": 1.9318174274552638e-05, "epoch": 0.7102939648904124, "percentage": 71.03, "elapsed_time": "2 days, 4:36:38", "remaining_time": "21:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6839, "total_steps": 9627, "loss": 1.7917, "learning_rate": 1.930529252898415e-05, "epoch": 0.7103978394099927, "percentage": 71.04, "elapsed_time": "2 days, 4:37:10", "remaining_time": "21:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6840, "total_steps": 9627, "loss": 1.7213, "learning_rate": 1.929241405216254e-05, "epoch": 0.7105017139295731, "percentage": 71.05, "elapsed_time": "2 days, 4:37:40", "remaining_time": "21:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6841, "total_steps": 9627, "loss": 1.5519, "learning_rate": 1.9279538845459327e-05, "epoch": 0.7106055884491534, "percentage": 71.06, "elapsed_time": "2 days, 4:38:12", "remaining_time": "21:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6842, "total_steps": 9627, "loss": 1.505, "learning_rate": 1.92666669102456e-05, "epoch": 0.7107094629687337, "percentage": 71.07, "elapsed_time": "2 days, 4:38:43", "remaining_time": "21:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6843, "total_steps": 9627, "loss": 1.678, "learning_rate": 1.9253798247892113e-05, "epoch": 0.7108133374883141, "percentage": 71.08, "elapsed_time": "2 days, 4:39:13", "remaining_time": "21:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6844, "total_steps": 9627, "loss": 1.8031, "learning_rate": 1.924093285976929e-05, "epoch": 0.7109172120078945, "percentage": 71.09, "elapsed_time": "2 days, 4:39:45", "remaining_time": "21:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6845, "total_steps": 9627, "loss": 1.7211, "learning_rate": 1.9228070747247185e-05, "epoch": 0.7110210865274748, "percentage": 71.1, "elapsed_time": "2 days, 4:40:17", "remaining_time": "21:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6846, "total_steps": 9627, "loss": 1.7405, "learning_rate": 1.9215211911695512e-05, "epoch": 0.7111249610470551, "percentage": 71.11, "elapsed_time": "2 days, 4:40:48", "remaining_time": "21:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6847, "total_steps": 9627, "loss": 1.6972, "learning_rate": 1.9202356354483624e-05, "epoch": 0.7112288355666355, "percentage": 71.12, "elapsed_time": "2 days, 4:41:20", "remaining_time": "21:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6848, "total_steps": 9627, "loss": 1.7432, "learning_rate": 1.9189504076980567e-05, "epoch": 0.7113327100862159, "percentage": 71.13, "elapsed_time": "2 days, 4:41:50", "remaining_time": "21:23:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6849, "total_steps": 9627, "loss": 1.6582, "learning_rate": 1.9176655080555e-05, "epoch": 0.7114365846057962, "percentage": 71.14, "elapsed_time": "2 days, 4:42:21", "remaining_time": "21:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6850, "total_steps": 9627, "loss": 1.6672, "learning_rate": 1.9163809366575235e-05, "epoch": 0.7115404591253766, "percentage": 71.15, "elapsed_time": "2 days, 4:42:53", "remaining_time": "21:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6851, "total_steps": 9627, "loss": 1.7137, "learning_rate": 1.9150966936409242e-05, "epoch": 0.7116443336449569, "percentage": 71.16, "elapsed_time": "2 days, 4:43:24", "remaining_time": "21:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6852, "total_steps": 9627, "loss": 1.5847, "learning_rate": 1.9138127791424637e-05, "epoch": 0.7117482081645372, "percentage": 71.17, "elapsed_time": "2 days, 4:43:55", "remaining_time": "21:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6853, "total_steps": 9627, "loss": 1.7037, "learning_rate": 1.912529193298869e-05, "epoch": 0.7118520826841176, "percentage": 71.19, "elapsed_time": "2 days, 4:44:28", "remaining_time": "21:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6854, "total_steps": 9627, "loss": 1.5538, "learning_rate": 1.91124593624683e-05, "epoch": 0.711955957203698, "percentage": 71.2, "elapsed_time": "2 days, 4:44:58", "remaining_time": "21:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6855, "total_steps": 9627, "loss": 1.4787, "learning_rate": 1.9099630081230095e-05, "epoch": 0.7120598317232782, "percentage": 71.21, "elapsed_time": "2 days, 4:45:30", "remaining_time": "21:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6856, "total_steps": 9627, "loss": 1.831, "learning_rate": 1.908680409064022e-05, "epoch": 0.7121637062428586, "percentage": 71.22, "elapsed_time": "2 days, 4:46:02", "remaining_time": "21:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6857, "total_steps": 9627, "loss": 1.9043, "learning_rate": 1.9073981392064587e-05, "epoch": 0.712267580762439, "percentage": 71.23, "elapsed_time": "2 days, 4:46:31", "remaining_time": "21:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6858, "total_steps": 9627, "loss": 1.7122, "learning_rate": 1.9061161986868732e-05, "epoch": 0.7123714552820193, "percentage": 71.24, "elapsed_time": "2 days, 4:47:03", "remaining_time": "21:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6859, "total_steps": 9627, "loss": 1.6308, "learning_rate": 1.9048345876417752e-05, "epoch": 0.7124753298015997, "percentage": 71.25, "elapsed_time": "2 days, 4:47:34", "remaining_time": "21:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6860, "total_steps": 9627, "loss": 1.658, "learning_rate": 1.9035533062076522e-05, "epoch": 0.71257920432118, "percentage": 71.26, "elapsed_time": "2 days, 4:48:04", "remaining_time": "21:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6861, "total_steps": 9627, "loss": 1.5886, "learning_rate": 1.9022723545209487e-05, "epoch": 0.7126830788407603, "percentage": 71.27, "elapsed_time": "2 days, 4:48:37", "remaining_time": "21:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6862, "total_steps": 9627, "loss": 1.5387, "learning_rate": 1.9009917327180766e-05, "epoch": 0.7127869533603407, "percentage": 71.28, "elapsed_time": "2 days, 4:49:07", "remaining_time": "21:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6863, "total_steps": 9627, "loss": 1.7033, "learning_rate": 1.8997114409354116e-05, "epoch": 0.7128908278799211, "percentage": 71.29, "elapsed_time": "2 days, 4:49:40", "remaining_time": "21:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6864, "total_steps": 9627, "loss": 1.6542, "learning_rate": 1.898431479309295e-05, "epoch": 0.7129947023995014, "percentage": 71.3, "elapsed_time": "2 days, 4:50:10", "remaining_time": "21:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6865, "total_steps": 9627, "loss": 1.6021, "learning_rate": 1.8971518479760324e-05, "epoch": 0.7130985769190817, "percentage": 71.31, "elapsed_time": "2 days, 4:50:41", "remaining_time": "21:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6866, "total_steps": 9627, "loss": 1.9381, "learning_rate": 1.8958725470718937e-05, "epoch": 0.7132024514386621, "percentage": 71.32, "elapsed_time": "2 days, 4:51:11", "remaining_time": "21:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6867, "total_steps": 9627, "loss": 1.6968, "learning_rate": 1.8945935767331186e-05, "epoch": 0.7133063259582424, "percentage": 71.33, "elapsed_time": "2 days, 4:51:43", "remaining_time": "21:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6868, "total_steps": 9627, "loss": 1.6144, "learning_rate": 1.893314937095901e-05, "epoch": 0.7134102004778228, "percentage": 71.34, "elapsed_time": "2 days, 4:52:14", "remaining_time": "21:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6869, "total_steps": 9627, "loss": 1.723, "learning_rate": 1.8920366282964115e-05, "epoch": 0.7135140749974032, "percentage": 71.35, "elapsed_time": "2 days, 4:52:45", "remaining_time": "21:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6870, "total_steps": 9627, "loss": 1.5267, "learning_rate": 1.8907586504707773e-05, "epoch": 0.7136179495169834, "percentage": 71.36, "elapsed_time": "2 days, 4:53:16", "remaining_time": "21:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6871, "total_steps": 9627, "loss": 1.53, "learning_rate": 1.8894810037550947e-05, "epoch": 0.7137218240365638, "percentage": 71.37, "elapsed_time": "2 days, 4:53:47", "remaining_time": "21:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6872, "total_steps": 9627, "loss": 1.6174, "learning_rate": 1.888203688285422e-05, "epoch": 0.7138256985561442, "percentage": 71.38, "elapsed_time": "2 days, 4:54:17", "remaining_time": "21:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6873, "total_steps": 9627, "loss": 1.7112, "learning_rate": 1.8869267041977817e-05, "epoch": 0.7139295730757246, "percentage": 71.39, "elapsed_time": "2 days, 4:54:49", "remaining_time": "21:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6874, "total_steps": 9627, "loss": 1.6291, "learning_rate": 1.8856500516281684e-05, "epoch": 0.7140334475953048, "percentage": 71.4, "elapsed_time": "2 days, 4:55:20", "remaining_time": "21:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6875, "total_steps": 9627, "loss": 1.4871, "learning_rate": 1.8843737307125275e-05, "epoch": 0.7141373221148852, "percentage": 71.41, "elapsed_time": "2 days, 4:55:52", "remaining_time": "21:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6876, "total_steps": 9627, "loss": 1.4438, "learning_rate": 1.883097741586784e-05, "epoch": 0.7142411966344656, "percentage": 71.42, "elapsed_time": "2 days, 4:56:23", "remaining_time": "21:10:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6877, "total_steps": 9627, "loss": 1.6393, "learning_rate": 1.8818220843868178e-05, "epoch": 0.7143450711540459, "percentage": 71.43, "elapsed_time": "2 days, 4:56:53", "remaining_time": "21:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6878, "total_steps": 9627, "loss": 1.7655, "learning_rate": 1.8805467592484772e-05, "epoch": 0.7144489456736263, "percentage": 71.44, "elapsed_time": "2 days, 4:57:25", "remaining_time": "21:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6879, "total_steps": 9627, "loss": 1.9356, "learning_rate": 1.8792717663075738e-05, "epoch": 0.7145528201932067, "percentage": 71.46, "elapsed_time": "2 days, 4:57:57", "remaining_time": "21:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6880, "total_steps": 9627, "loss": 1.5515, "learning_rate": 1.8779971056998846e-05, "epoch": 0.7146566947127869, "percentage": 71.47, "elapsed_time": "2 days, 4:58:27", "remaining_time": "21:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6881, "total_steps": 9627, "loss": 1.7381, "learning_rate": 1.876722777561151e-05, "epoch": 0.7147605692323673, "percentage": 71.48, "elapsed_time": "2 days, 4:58:59", "remaining_time": "21:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6882, "total_steps": 9627, "loss": 1.5871, "learning_rate": 1.8754487820270778e-05, "epoch": 0.7148644437519477, "percentage": 71.49, "elapsed_time": "2 days, 4:59:29", "remaining_time": "21:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6883, "total_steps": 9627, "loss": 1.7346, "learning_rate": 1.87417511923334e-05, "epoch": 0.714968318271528, "percentage": 71.5, "elapsed_time": "2 days, 5:00:01", "remaining_time": "21:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6884, "total_steps": 9627, "loss": 1.7387, "learning_rate": 1.872901789315566e-05, "epoch": 0.7150721927911083, "percentage": 71.51, "elapsed_time": "2 days, 5:00:33", "remaining_time": "21:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6885, "total_steps": 9627, "loss": 1.6588, "learning_rate": 1.8716287924093613e-05, "epoch": 0.7151760673106887, "percentage": 71.52, "elapsed_time": "2 days, 5:01:03", "remaining_time": "21:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6886, "total_steps": 9627, "loss": 1.5263, "learning_rate": 1.8703561286502896e-05, "epoch": 0.715279941830269, "percentage": 71.53, "elapsed_time": "2 days, 5:01:35", "remaining_time": "21:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6887, "total_steps": 9627, "loss": 1.6721, "learning_rate": 1.8690837981738747e-05, "epoch": 0.7153838163498494, "percentage": 71.54, "elapsed_time": "2 days, 5:02:07", "remaining_time": "21:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6888, "total_steps": 9627, "loss": 1.6021, "learning_rate": 1.867811801115614e-05, "epoch": 0.7154876908694298, "percentage": 71.55, "elapsed_time": "2 days, 5:02:38", "remaining_time": "21:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6889, "total_steps": 9627, "loss": 1.7418, "learning_rate": 1.8665401376109654e-05, "epoch": 0.71559156538901, "percentage": 71.56, "elapsed_time": "2 days, 5:03:09", "remaining_time": "21:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6890, "total_steps": 9627, "loss": 1.9432, "learning_rate": 1.86526880779535e-05, "epoch": 0.7156954399085904, "percentage": 71.57, "elapsed_time": "2 days, 5:03:40", "remaining_time": "21:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6891, "total_steps": 9627, "loss": 1.4421, "learning_rate": 1.863997811804155e-05, "epoch": 0.7157993144281708, "percentage": 71.58, "elapsed_time": "2 days, 5:04:11", "remaining_time": "21:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6892, "total_steps": 9627, "loss": 1.6838, "learning_rate": 1.862727149772731e-05, "epoch": 0.7159031889477511, "percentage": 71.59, "elapsed_time": "2 days, 5:04:43", "remaining_time": "21:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6893, "total_steps": 9627, "loss": 1.6661, "learning_rate": 1.8614568218363937e-05, "epoch": 0.7160070634673315, "percentage": 71.6, "elapsed_time": "2 days, 5:05:14", "remaining_time": "21:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6894, "total_steps": 9627, "loss": 1.7035, "learning_rate": 1.860186828130422e-05, "epoch": 0.7161109379869118, "percentage": 71.61, "elapsed_time": "2 days, 5:05:45", "remaining_time": "21:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6895, "total_steps": 9627, "loss": 1.5622, "learning_rate": 1.8589171687900646e-05, "epoch": 0.7162148125064921, "percentage": 71.62, "elapsed_time": "2 days, 5:06:17", "remaining_time": "21:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6896, "total_steps": 9627, "loss": 1.6196, "learning_rate": 1.8576478439505248e-05, "epoch": 0.7163186870260725, "percentage": 71.63, "elapsed_time": "2 days, 5:06:47", "remaining_time": "21:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6897, "total_steps": 9627, "loss": 1.7369, "learning_rate": 1.856378853746979e-05, "epoch": 0.7164225615456529, "percentage": 71.64, "elapsed_time": "2 days, 5:07:19", "remaining_time": "21:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6898, "total_steps": 9627, "loss": 1.7267, "learning_rate": 1.855110198314565e-05, "epoch": 0.7165264360652333, "percentage": 71.65, "elapsed_time": "2 days, 5:07:50", "remaining_time": "21:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6899, "total_steps": 9627, "loss": 1.7538, "learning_rate": 1.8538418777883825e-05, "epoch": 0.7166303105848135, "percentage": 71.66, "elapsed_time": "2 days, 5:08:23", "remaining_time": "21:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6900, "total_steps": 9627, "loss": 1.5747, "learning_rate": 1.8525738923035003e-05, "epoch": 0.7167341851043939, "percentage": 71.67, "elapsed_time": "2 days, 5:08:53", "remaining_time": "21:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6901, "total_steps": 9627, "loss": 1.8062, "learning_rate": 1.8513062419949452e-05, "epoch": 0.7168380596239743, "percentage": 71.68, "elapsed_time": "2 days, 5:09:25", "remaining_time": "20:59:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6902, "total_steps": 9627, "loss": 1.668, "learning_rate": 1.8500389269977186e-05, "epoch": 0.7169419341435546, "percentage": 71.69, "elapsed_time": "2 days, 5:09:56", "remaining_time": "20:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6903, "total_steps": 9627, "loss": 1.6166, "learning_rate": 1.848771947446772e-05, "epoch": 0.7170458086631349, "percentage": 71.7, "elapsed_time": "2 days, 5:10:29", "remaining_time": "20:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6904, "total_steps": 9627, "loss": 1.5487, "learning_rate": 1.847505303477034e-05, "epoch": 0.7171496831827153, "percentage": 71.71, "elapsed_time": "2 days, 5:11:00", "remaining_time": "20:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6905, "total_steps": 9627, "loss": 1.5665, "learning_rate": 1.8462389952233905e-05, "epoch": 0.7172535577022956, "percentage": 71.73, "elapsed_time": "2 days, 5:11:32", "remaining_time": "20:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6906, "total_steps": 9627, "loss": 1.4904, "learning_rate": 1.8449730228206945e-05, "epoch": 0.717357432221876, "percentage": 71.74, "elapsed_time": "2 days, 5:12:02", "remaining_time": "20:57:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6907, "total_steps": 9627, "loss": 1.6915, "learning_rate": 1.8437073864037608e-05, "epoch": 0.7174613067414564, "percentage": 71.75, "elapsed_time": "2 days, 5:12:34", "remaining_time": "20:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6908, "total_steps": 9627, "loss": 1.6279, "learning_rate": 1.842442086107371e-05, "epoch": 0.7175651812610366, "percentage": 71.76, "elapsed_time": "2 days, 5:13:05", "remaining_time": "20:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6909, "total_steps": 9627, "loss": 1.6648, "learning_rate": 1.8411771220662684e-05, "epoch": 0.717669055780617, "percentage": 71.77, "elapsed_time": "2 days, 5:13:37", "remaining_time": "20:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6910, "total_steps": 9627, "loss": 1.755, "learning_rate": 1.8399124944151614e-05, "epoch": 0.7177729303001974, "percentage": 71.78, "elapsed_time": "2 days, 5:14:10", "remaining_time": "20:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6911, "total_steps": 9627, "loss": 1.7247, "learning_rate": 1.838648203288727e-05, "epoch": 0.7178768048197777, "percentage": 71.79, "elapsed_time": "2 days, 5:14:41", "remaining_time": "20:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6912, "total_steps": 9627, "loss": 1.5317, "learning_rate": 1.8373842488215966e-05, "epoch": 0.717980679339358, "percentage": 71.8, "elapsed_time": "2 days, 5:15:12", "remaining_time": "20:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6913, "total_steps": 9627, "loss": 1.7154, "learning_rate": 1.836120631148376e-05, "epoch": 0.7180845538589384, "percentage": 71.81, "elapsed_time": "2 days, 5:15:44", "remaining_time": "20:54:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6914, "total_steps": 9627, "loss": 1.7214, "learning_rate": 1.8348573504036305e-05, "epoch": 0.7181884283785187, "percentage": 71.82, "elapsed_time": "2 days, 5:16:17", "remaining_time": "20:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6915, "total_steps": 9627, "loss": 1.652, "learning_rate": 1.8335944067218846e-05, "epoch": 0.7182923028980991, "percentage": 71.83, "elapsed_time": "2 days, 5:16:47", "remaining_time": "20:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6916, "total_steps": 9627, "loss": 1.6764, "learning_rate": 1.8323318002376372e-05, "epoch": 0.7183961774176795, "percentage": 71.84, "elapsed_time": "2 days, 5:17:19", "remaining_time": "20:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6917, "total_steps": 9627, "loss": 1.7295, "learning_rate": 1.831069531085344e-05, "epoch": 0.7185000519372597, "percentage": 71.85, "elapsed_time": "2 days, 5:17:50", "remaining_time": "20:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6918, "total_steps": 9627, "loss": 1.5781, "learning_rate": 1.829807599399428e-05, "epoch": 0.7186039264568401, "percentage": 71.86, "elapsed_time": "2 days, 5:18:21", "remaining_time": "20:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6919, "total_steps": 9627, "loss": 1.6024, "learning_rate": 1.828546005314274e-05, "epoch": 0.7187078009764205, "percentage": 71.87, "elapsed_time": "2 days, 5:18:53", "remaining_time": "20:51:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6920, "total_steps": 9627, "loss": 1.7269, "learning_rate": 1.8272847489642314e-05, "epoch": 0.7188116754960008, "percentage": 71.88, "elapsed_time": "2 days, 5:19:24", "remaining_time": "20:51:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6921, "total_steps": 9627, "loss": 1.6872, "learning_rate": 1.826023830483616e-05, "epoch": 0.7189155500155812, "percentage": 71.89, "elapsed_time": "2 days, 5:19:56", "remaining_time": "20:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6922, "total_steps": 9627, "loss": 1.3766, "learning_rate": 1.8247632500067017e-05, "epoch": 0.7190194245351615, "percentage": 71.9, "elapsed_time": "2 days, 5:20:29", "remaining_time": "20:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6923, "total_steps": 9627, "loss": 1.7151, "learning_rate": 1.8235030076677362e-05, "epoch": 0.7191232990547419, "percentage": 71.91, "elapsed_time": "2 days, 5:20:59", "remaining_time": "20:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6924, "total_steps": 9627, "loss": 1.6841, "learning_rate": 1.8222431036009226e-05, "epoch": 0.7192271735743222, "percentage": 71.92, "elapsed_time": "2 days, 5:21:31", "remaining_time": "20:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6925, "total_steps": 9627, "loss": 1.5951, "learning_rate": 1.8209835379404304e-05, "epoch": 0.7193310480939026, "percentage": 71.93, "elapsed_time": "2 days, 5:22:02", "remaining_time": "20:49:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6926, "total_steps": 9627, "loss": 1.6513, "learning_rate": 1.819724310820395e-05, "epoch": 0.719434922613483, "percentage": 71.94, "elapsed_time": "2 days, 5:22:33", "remaining_time": "20:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6927, "total_steps": 9627, "loss": 1.63, "learning_rate": 1.8184654223749126e-05, "epoch": 0.7195387971330632, "percentage": 71.95, "elapsed_time": "2 days, 5:23:06", "remaining_time": "20:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6928, "total_steps": 9627, "loss": 1.7954, "learning_rate": 1.8172068727380464e-05, "epoch": 0.7196426716526436, "percentage": 71.96, "elapsed_time": "2 days, 5:23:36", "remaining_time": "20:48:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6929, "total_steps": 9627, "loss": 1.7982, "learning_rate": 1.8159486620438193e-05, "epoch": 0.719746546172224, "percentage": 71.97, "elapsed_time": "2 days, 5:24:09", "remaining_time": "20:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6930, "total_steps": 9627, "loss": 1.8414, "learning_rate": 1.8146907904262267e-05, "epoch": 0.7198504206918043, "percentage": 71.99, "elapsed_time": "2 days, 5:24:40", "remaining_time": "20:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6931, "total_steps": 9627, "loss": 1.8044, "learning_rate": 1.8134332580192152e-05, "epoch": 0.7199542952113847, "percentage": 72.0, "elapsed_time": "2 days, 5:25:11", "remaining_time": "20:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6932, "total_steps": 9627, "loss": 1.6786, "learning_rate": 1.8121760649567077e-05, "epoch": 0.720058169730965, "percentage": 72.01, "elapsed_time": "2 days, 5:25:44", "remaining_time": "20:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6933, "total_steps": 9627, "loss": 1.51, "learning_rate": 1.8109192113725826e-05, "epoch": 0.7201620442505453, "percentage": 72.02, "elapsed_time": "2 days, 5:26:16", "remaining_time": "20:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6934, "total_steps": 9627, "loss": 1.5216, "learning_rate": 1.809662697400686e-05, "epoch": 0.7202659187701257, "percentage": 72.03, "elapsed_time": "2 days, 5:26:47", "remaining_time": "20:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6935, "total_steps": 9627, "loss": 1.7657, "learning_rate": 1.8084065231748265e-05, "epoch": 0.7203697932897061, "percentage": 72.04, "elapsed_time": "2 days, 5:27:18", "remaining_time": "20:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6936, "total_steps": 9627, "loss": 1.7116, "learning_rate": 1.807150688828777e-05, "epoch": 0.7204736678092863, "percentage": 72.05, "elapsed_time": "2 days, 5:27:50", "remaining_time": "20:44:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6937, "total_steps": 9627, "loss": 1.503, "learning_rate": 1.8058951944962736e-05, "epoch": 0.7205775423288667, "percentage": 72.06, "elapsed_time": "2 days, 5:28:22", "remaining_time": "20:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6938, "total_steps": 9627, "loss": 1.6463, "learning_rate": 1.804640040311016e-05, "epoch": 0.7206814168484471, "percentage": 72.07, "elapsed_time": "2 days, 5:28:55", "remaining_time": "20:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6939, "total_steps": 9627, "loss": 1.4503, "learning_rate": 1.8033852264066718e-05, "epoch": 0.7207852913680274, "percentage": 72.08, "elapsed_time": "2 days, 5:29:25", "remaining_time": "20:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6940, "total_steps": 9627, "loss": 1.6289, "learning_rate": 1.802130752916864e-05, "epoch": 0.7208891658876078, "percentage": 72.09, "elapsed_time": "2 days, 5:29:58", "remaining_time": "20:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6941, "total_steps": 9627, "loss": 1.6664, "learning_rate": 1.800876619975188e-05, "epoch": 0.7209930404071881, "percentage": 72.1, "elapsed_time": "2 days, 5:30:29", "remaining_time": "20:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6942, "total_steps": 9627, "loss": 1.5518, "learning_rate": 1.7996228277151995e-05, "epoch": 0.7210969149267684, "percentage": 72.11, "elapsed_time": "2 days, 5:31:00", "remaining_time": "20:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6943, "total_steps": 9627, "loss": 1.5822, "learning_rate": 1.7983693762704122e-05, "epoch": 0.7212007894463488, "percentage": 72.12, "elapsed_time": "2 days, 5:31:33", "remaining_time": "20:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6944, "total_steps": 9627, "loss": 1.6165, "learning_rate": 1.797116265774315e-05, "epoch": 0.7213046639659292, "percentage": 72.13, "elapsed_time": "2 days, 5:32:04", "remaining_time": "20:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6945, "total_steps": 9627, "loss": 1.5928, "learning_rate": 1.7958634963603516e-05, "epoch": 0.7214085384855095, "percentage": 72.14, "elapsed_time": "2 days, 5:32:37", "remaining_time": "20:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6946, "total_steps": 9627, "loss": 1.8438, "learning_rate": 1.7946110681619327e-05, "epoch": 0.7215124130050898, "percentage": 72.15, "elapsed_time": "2 days, 5:33:08", "remaining_time": "20:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6947, "total_steps": 9627, "loss": 1.6103, "learning_rate": 1.7933589813124325e-05, "epoch": 0.7216162875246702, "percentage": 72.16, "elapsed_time": "2 days, 5:33:40", "remaining_time": "20:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6948, "total_steps": 9627, "loss": 1.6833, "learning_rate": 1.7921072359451872e-05, "epoch": 0.7217201620442505, "percentage": 72.17, "elapsed_time": "2 days, 5:34:11", "remaining_time": "20:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6949, "total_steps": 9627, "loss": 1.5623, "learning_rate": 1.7908558321934992e-05, "epoch": 0.7218240365638309, "percentage": 72.18, "elapsed_time": "2 days, 5:34:42", "remaining_time": "20:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6950, "total_steps": 9627, "loss": 1.5559, "learning_rate": 1.789604770190631e-05, "epoch": 0.7219279110834113, "percentage": 72.19, "elapsed_time": "2 days, 5:35:15", "remaining_time": "20:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6951, "total_steps": 9627, "loss": 1.6942, "learning_rate": 1.7883540500698148e-05, "epoch": 0.7220317856029916, "percentage": 72.2, "elapsed_time": "2 days, 5:35:47", "remaining_time": "20:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6952, "total_steps": 9627, "loss": 1.4997, "learning_rate": 1.7871036719642398e-05, "epoch": 0.7221356601225719, "percentage": 72.21, "elapsed_time": "2 days, 5:36:18", "remaining_time": "20:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6953, "total_steps": 9627, "loss": 1.8249, "learning_rate": 1.7858536360070626e-05, "epoch": 0.7222395346421523, "percentage": 72.22, "elapsed_time": "2 days, 5:36:50", "remaining_time": "20:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6954, "total_steps": 9627, "loss": 1.6494, "learning_rate": 1.784603942331402e-05, "epoch": 0.7223434091617327, "percentage": 72.23, "elapsed_time": "2 days, 5:37:23", "remaining_time": "20:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6955, "total_steps": 9627, "loss": 1.5129, "learning_rate": 1.7833545910703402e-05, "epoch": 0.722447283681313, "percentage": 72.24, "elapsed_time": "2 days, 5:37:53", "remaining_time": "20:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6956, "total_steps": 9627, "loss": 1.4516, "learning_rate": 1.7821055823569238e-05, "epoch": 0.7225511582008933, "percentage": 72.26, "elapsed_time": "2 days, 5:38:26", "remaining_time": "20:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6957, "total_steps": 9627, "loss": 1.7454, "learning_rate": 1.7808569163241605e-05, "epoch": 0.7226550327204737, "percentage": 72.27, "elapsed_time": "2 days, 5:38:56", "remaining_time": "20:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6958, "total_steps": 9627, "loss": 1.6144, "learning_rate": 1.7796085931050287e-05, "epoch": 0.722758907240054, "percentage": 72.28, "elapsed_time": "2 days, 5:39:29", "remaining_time": "20:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6959, "total_steps": 9627, "loss": 1.6667, "learning_rate": 1.778360612832458e-05, "epoch": 0.7228627817596344, "percentage": 72.29, "elapsed_time": "2 days, 5:40:01", "remaining_time": "20:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6960, "total_steps": 9627, "loss": 1.7617, "learning_rate": 1.7771129756393547e-05, "epoch": 0.7229666562792147, "percentage": 72.3, "elapsed_time": "2 days, 5:40:31", "remaining_time": "20:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6961, "total_steps": 9627, "loss": 1.6515, "learning_rate": 1.77586568165858e-05, "epoch": 0.723070530798795, "percentage": 72.31, "elapsed_time": "2 days, 5:41:04", "remaining_time": "20:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6962, "total_steps": 9627, "loss": 1.7102, "learning_rate": 1.7746187310229606e-05, "epoch": 0.7231744053183754, "percentage": 72.32, "elapsed_time": "2 days, 5:41:36", "remaining_time": "20:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6963, "total_steps": 9627, "loss": 1.8452, "learning_rate": 1.773372123865287e-05, "epoch": 0.7232782798379558, "percentage": 72.33, "elapsed_time": "2 days, 5:42:08", "remaining_time": "20:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6964, "total_steps": 9627, "loss": 1.6948, "learning_rate": 1.7721258603183144e-05, "epoch": 0.7233821543575361, "percentage": 72.34, "elapsed_time": "2 days, 5:42:39", "remaining_time": "20:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6965, "total_steps": 9627, "loss": 1.9625, "learning_rate": 1.770879940514759e-05, "epoch": 0.7234860288771164, "percentage": 72.35, "elapsed_time": "2 days, 5:43:10", "remaining_time": "20:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6966, "total_steps": 9627, "loss": 1.6516, "learning_rate": 1.7696343645873e-05, "epoch": 0.7235899033966968, "percentage": 72.36, "elapsed_time": "2 days, 5:43:41", "remaining_time": "20:31:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6967, "total_steps": 9627, "loss": 1.7148, "learning_rate": 1.768389132668587e-05, "epoch": 0.7236937779162771, "percentage": 72.37, "elapsed_time": "2 days, 5:44:14", "remaining_time": "20:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6968, "total_steps": 9627, "loss": 1.457, "learning_rate": 1.7671442448912202e-05, "epoch": 0.7237976524358575, "percentage": 72.38, "elapsed_time": "2 days, 5:44:45", "remaining_time": "20:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6969, "total_steps": 9627, "loss": 1.5079, "learning_rate": 1.7658997013877754e-05, "epoch": 0.7239015269554379, "percentage": 72.39, "elapsed_time": "2 days, 5:45:16", "remaining_time": "20:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6970, "total_steps": 9627, "loss": 1.7927, "learning_rate": 1.764655502290788e-05, "epoch": 0.7240054014750181, "percentage": 72.4, "elapsed_time": "2 days, 5:45:48", "remaining_time": "20:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6971, "total_steps": 9627, "loss": 1.6194, "learning_rate": 1.763411647732749e-05, "epoch": 0.7241092759945985, "percentage": 72.41, "elapsed_time": "2 days, 5:46:19", "remaining_time": "20:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6972, "total_steps": 9627, "loss": 1.5284, "learning_rate": 1.7621681378461245e-05, "epoch": 0.7242131505141789, "percentage": 72.42, "elapsed_time": "2 days, 5:46:51", "remaining_time": "20:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6973, "total_steps": 9627, "loss": 1.3562, "learning_rate": 1.7609249727633382e-05, "epoch": 0.7243170250337592, "percentage": 72.43, "elapsed_time": "2 days, 5:47:23", "remaining_time": "20:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6974, "total_steps": 9627, "loss": 1.6075, "learning_rate": 1.759682152616776e-05, "epoch": 0.7244208995533395, "percentage": 72.44, "elapsed_time": "2 days, 5:47:54", "remaining_time": "20:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6975, "total_steps": 9627, "loss": 1.5422, "learning_rate": 1.758439677538789e-05, "epoch": 0.7245247740729199, "percentage": 72.45, "elapsed_time": "2 days, 5:48:25", "remaining_time": "20:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6976, "total_steps": 9627, "loss": 1.6262, "learning_rate": 1.7571975476616897e-05, "epoch": 0.7246286485925003, "percentage": 72.46, "elapsed_time": "2 days, 5:48:58", "remaining_time": "20:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6977, "total_steps": 9627, "loss": 1.6682, "learning_rate": 1.7559557631177605e-05, "epoch": 0.7247325231120806, "percentage": 72.47, "elapsed_time": "2 days, 5:49:28", "remaining_time": "20:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6978, "total_steps": 9627, "loss": 1.836, "learning_rate": 1.754714324039234e-05, "epoch": 0.724836397631661, "percentage": 72.48, "elapsed_time": "2 days, 5:49:59", "remaining_time": "20:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6979, "total_steps": 9627, "loss": 1.7584, "learning_rate": 1.7534732305583196e-05, "epoch": 0.7249402721512413, "percentage": 72.49, "elapsed_time": "2 days, 5:50:30", "remaining_time": "20:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6980, "total_steps": 9627, "loss": 1.6672, "learning_rate": 1.7522324828071822e-05, "epoch": 0.7250441466708216, "percentage": 72.5, "elapsed_time": "2 days, 5:51:03", "remaining_time": "20:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6981, "total_steps": 9627, "loss": 1.5338, "learning_rate": 1.750992080917952e-05, "epoch": 0.725148021190402, "percentage": 72.51, "elapsed_time": "2 days, 5:51:32", "remaining_time": "20:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6982, "total_steps": 9627, "loss": 1.6543, "learning_rate": 1.7497520250227222e-05, "epoch": 0.7252518957099824, "percentage": 72.53, "elapsed_time": "2 days, 5:52:05", "remaining_time": "20:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6983, "total_steps": 9627, "loss": 1.6052, "learning_rate": 1.7485123152535488e-05, "epoch": 0.7253557702295627, "percentage": 72.54, "elapsed_time": "2 days, 5:52:35", "remaining_time": "20:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6984, "total_steps": 9627, "loss": 1.7914, "learning_rate": 1.7472729517424508e-05, "epoch": 0.725459644749143, "percentage": 72.55, "elapsed_time": "2 days, 5:53:07", "remaining_time": "20:23:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6985, "total_steps": 9627, "loss": 1.6915, "learning_rate": 1.7460339346214095e-05, "epoch": 0.7255635192687234, "percentage": 72.56, "elapsed_time": "2 days, 5:53:37", "remaining_time": "20:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6986, "total_steps": 9627, "loss": 1.7437, "learning_rate": 1.744795264022376e-05, "epoch": 0.7256673937883037, "percentage": 72.57, "elapsed_time": "2 days, 5:54:09", "remaining_time": "20:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6987, "total_steps": 9627, "loss": 1.8705, "learning_rate": 1.7435569400772516e-05, "epoch": 0.7257712683078841, "percentage": 72.58, "elapsed_time": "2 days, 5:54:40", "remaining_time": "20:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6988, "total_steps": 9627, "loss": 1.7026, "learning_rate": 1.742318962917914e-05, "epoch": 0.7258751428274645, "percentage": 72.59, "elapsed_time": "2 days, 5:55:10", "remaining_time": "20:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6989, "total_steps": 9627, "loss": 1.7673, "learning_rate": 1.7410813326761955e-05, "epoch": 0.7259790173470447, "percentage": 72.6, "elapsed_time": "2 days, 5:55:42", "remaining_time": "20:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6990, "total_steps": 9627, "loss": 1.5597, "learning_rate": 1.7398440494838947e-05, "epoch": 0.7260828918666251, "percentage": 72.61, "elapsed_time": "2 days, 5:56:14", "remaining_time": "20:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6991, "total_steps": 9627, "loss": 1.8227, "learning_rate": 1.7386071134727726e-05, "epoch": 0.7261867663862055, "percentage": 72.62, "elapsed_time": "2 days, 5:56:45", "remaining_time": "20:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6992, "total_steps": 9627, "loss": 1.5315, "learning_rate": 1.7373705247745532e-05, "epoch": 0.7262906409057858, "percentage": 72.63, "elapsed_time": "2 days, 5:57:16", "remaining_time": "20:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6993, "total_steps": 9627, "loss": 1.598, "learning_rate": 1.7361342835209225e-05, "epoch": 0.7263945154253661, "percentage": 72.64, "elapsed_time": "2 days, 5:57:46", "remaining_time": "20:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6994, "total_steps": 9627, "loss": 1.7899, "learning_rate": 1.7348983898435307e-05, "epoch": 0.7264983899449465, "percentage": 72.65, "elapsed_time": "2 days, 5:58:18", "remaining_time": "20:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6995, "total_steps": 9627, "loss": 1.7511, "learning_rate": 1.733662843873995e-05, "epoch": 0.7266022644645268, "percentage": 72.66, "elapsed_time": "2 days, 5:58:50", "remaining_time": "20:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6996, "total_steps": 9627, "loss": 1.741, "learning_rate": 1.7324276457438843e-05, "epoch": 0.7267061389841072, "percentage": 72.67, "elapsed_time": "2 days, 5:59:21", "remaining_time": "20:18:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6997, "total_steps": 9627, "loss": 1.8191, "learning_rate": 1.7311927955847428e-05, "epoch": 0.7268100135036876, "percentage": 72.68, "elapsed_time": "2 days, 5:59:53", "remaining_time": "20:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6998, "total_steps": 9627, "loss": 1.5197, "learning_rate": 1.729958293528073e-05, "epoch": 0.7269138880232678, "percentage": 72.69, "elapsed_time": "2 days, 6:00:23", "remaining_time": "20:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6999, "total_steps": 9627, "loss": 1.6748, "learning_rate": 1.728724139705334e-05, "epoch": 0.7270177625428482, "percentage": 72.7, "elapsed_time": "2 days, 6:00:55", "remaining_time": "20:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7000, "total_steps": 9627, "loss": 1.6716, "learning_rate": 1.7274903342479586e-05, "epoch": 0.7271216370624286, "percentage": 72.71, "elapsed_time": "2 days, 6:01:26", "remaining_time": "20:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7001, "total_steps": 9627, "loss": 1.6378, "learning_rate": 1.726256877287335e-05, "epoch": 0.727225511582009, "percentage": 72.72, "elapsed_time": "2 days, 6:01:58", "remaining_time": "20:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7002, "total_steps": 9627, "loss": 1.5495, "learning_rate": 1.725023768954821e-05, "epoch": 0.7273293861015893, "percentage": 72.73, "elapsed_time": "2 days, 6:02:29", "remaining_time": "20:15:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7003, "total_steps": 9627, "loss": 1.5418, "learning_rate": 1.7237910093817278e-05, "epoch": 0.7274332606211696, "percentage": 72.74, "elapsed_time": "2 days, 6:03:01", "remaining_time": "20:15:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7004, "total_steps": 9627, "loss": 1.5632, "learning_rate": 1.7225585986993353e-05, "epoch": 0.72753713514075, "percentage": 72.75, "elapsed_time": "2 days, 6:03:32", "remaining_time": "20:14:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7005, "total_steps": 9627, "loss": 1.7221, "learning_rate": 1.7213265370388898e-05, "epoch": 0.7276410096603303, "percentage": 72.76, "elapsed_time": "2 days, 6:04:03", "remaining_time": "20:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7006, "total_steps": 9627, "loss": 1.7604, "learning_rate": 1.7200948245315908e-05, "epoch": 0.7277448841799107, "percentage": 72.77, "elapsed_time": "2 days, 6:04:35", "remaining_time": "20:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7007, "total_steps": 9627, "loss": 1.6143, "learning_rate": 1.7188634613086103e-05, "epoch": 0.7278487586994911, "percentage": 72.78, "elapsed_time": "2 days, 6:05:05", "remaining_time": "20:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7008, "total_steps": 9627, "loss": 1.5589, "learning_rate": 1.717632447501077e-05, "epoch": 0.7279526332190713, "percentage": 72.8, "elapsed_time": "2 days, 6:05:38", "remaining_time": "20:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7009, "total_steps": 9627, "loss": 1.5601, "learning_rate": 1.7164017832400846e-05, "epoch": 0.7280565077386517, "percentage": 72.81, "elapsed_time": "2 days, 6:06:10", "remaining_time": "20:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7010, "total_steps": 9627, "loss": 1.6215, "learning_rate": 1.71517146865669e-05, "epoch": 0.7281603822582321, "percentage": 72.82, "elapsed_time": "2 days, 6:06:40", "remaining_time": "20:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7011, "total_steps": 9627, "loss": 1.8012, "learning_rate": 1.7139415038819108e-05, "epoch": 0.7282642567778124, "percentage": 72.83, "elapsed_time": "2 days, 6:07:11", "remaining_time": "20:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7012, "total_steps": 9627, "loss": 1.6024, "learning_rate": 1.7127118890467292e-05, "epoch": 0.7283681312973928, "percentage": 72.84, "elapsed_time": "2 days, 6:07:44", "remaining_time": "20:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7013, "total_steps": 9627, "loss": 1.6076, "learning_rate": 1.7114826242820875e-05, "epoch": 0.7284720058169731, "percentage": 72.85, "elapsed_time": "2 days, 6:08:14", "remaining_time": "20:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7014, "total_steps": 9627, "loss": 1.5847, "learning_rate": 1.7102537097188986e-05, "epoch": 0.7285758803365534, "percentage": 72.86, "elapsed_time": "2 days, 6:08:47", "remaining_time": "20:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7015, "total_steps": 9627, "loss": 1.8128, "learning_rate": 1.7090251454880258e-05, "epoch": 0.7286797548561338, "percentage": 72.87, "elapsed_time": "2 days, 6:09:19", "remaining_time": "20:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7016, "total_steps": 9627, "loss": 1.5522, "learning_rate": 1.707796931720305e-05, "epoch": 0.7287836293757142, "percentage": 72.88, "elapsed_time": "2 days, 6:09:50", "remaining_time": "20:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7017, "total_steps": 9627, "loss": 1.8937, "learning_rate": 1.706569068546532e-05, "epoch": 0.7288875038952944, "percentage": 72.89, "elapsed_time": "2 days, 6:10:22", "remaining_time": "20:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7018, "total_steps": 9627, "loss": 1.6175, "learning_rate": 1.7053415560974623e-05, "epoch": 0.7289913784148748, "percentage": 72.9, "elapsed_time": "2 days, 6:10:53", "remaining_time": "20:08:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7019, "total_steps": 9627, "loss": 1.7127, "learning_rate": 1.7041143945038186e-05, "epoch": 0.7290952529344552, "percentage": 72.91, "elapsed_time": "2 days, 6:11:24", "remaining_time": "20:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7020, "total_steps": 9627, "loss": 1.822, "learning_rate": 1.702887583896282e-05, "epoch": 0.7291991274540355, "percentage": 72.92, "elapsed_time": "2 days, 6:11:57", "remaining_time": "20:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7021, "total_steps": 9627, "loss": 1.7217, "learning_rate": 1.7016611244055e-05, "epoch": 0.7293030019736159, "percentage": 72.93, "elapsed_time": "2 days, 6:12:29", "remaining_time": "20:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7022, "total_steps": 9627, "loss": 1.7666, "learning_rate": 1.700435016162078e-05, "epoch": 0.7294068764931962, "percentage": 72.94, "elapsed_time": "2 days, 6:13:00", "remaining_time": "20:06:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7023, "total_steps": 9627, "loss": 1.6506, "learning_rate": 1.699209259296593e-05, "epoch": 0.7295107510127765, "percentage": 72.95, "elapsed_time": "2 days, 6:13:32", "remaining_time": "20:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7024, "total_steps": 9627, "loss": 1.6463, "learning_rate": 1.697983853939571e-05, "epoch": 0.7296146255323569, "percentage": 72.96, "elapsed_time": "2 days, 6:14:04", "remaining_time": "20:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7025, "total_steps": 9627, "loss": 1.6875, "learning_rate": 1.6967588002215134e-05, "epoch": 0.7297185000519373, "percentage": 72.97, "elapsed_time": "2 days, 6:14:35", "remaining_time": "20:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7026, "total_steps": 9627, "loss": 1.6181, "learning_rate": 1.6955340982728797e-05, "epoch": 0.7298223745715176, "percentage": 72.98, "elapsed_time": "2 days, 6:15:08", "remaining_time": "20:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7027, "total_steps": 9627, "loss": 1.7707, "learning_rate": 1.694309748224085e-05, "epoch": 0.7299262490910979, "percentage": 72.99, "elapsed_time": "2 days, 6:15:40", "remaining_time": "20:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7028, "total_steps": 9627, "loss": 1.6969, "learning_rate": 1.693085750205518e-05, "epoch": 0.7300301236106783, "percentage": 73.0, "elapsed_time": "2 days, 6:16:12", "remaining_time": "20:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7029, "total_steps": 9627, "loss": 1.5153, "learning_rate": 1.6918621043475225e-05, "epoch": 0.7301339981302587, "percentage": 73.01, "elapsed_time": "2 days, 6:16:44", "remaining_time": "20:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7030, "total_steps": 9627, "loss": 1.5392, "learning_rate": 1.6906388107804118e-05, "epoch": 0.730237872649839, "percentage": 73.02, "elapsed_time": "2 days, 6:17:14", "remaining_time": "20:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7031, "total_steps": 9627, "loss": 1.7474, "learning_rate": 1.6894158696344515e-05, "epoch": 0.7303417471694194, "percentage": 73.03, "elapsed_time": "2 days, 6:17:47", "remaining_time": "20:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7032, "total_steps": 9627, "loss": 1.5063, "learning_rate": 1.6881932810398765e-05, "epoch": 0.7304456216889997, "percentage": 73.04, "elapsed_time": "2 days, 6:18:19", "remaining_time": "20:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7033, "total_steps": 9627, "loss": 1.5769, "learning_rate": 1.686971045126887e-05, "epoch": 0.73054949620858, "percentage": 73.05, "elapsed_time": "2 days, 6:18:52", "remaining_time": "20:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7034, "total_steps": 9627, "loss": 1.628, "learning_rate": 1.6857491620256353e-05, "epoch": 0.7306533707281604, "percentage": 73.07, "elapsed_time": "2 days, 6:19:23", "remaining_time": "20:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7035, "total_steps": 9627, "loss": 1.8296, "learning_rate": 1.6845276318662472e-05, "epoch": 0.7307572452477408, "percentage": 73.08, "elapsed_time": "2 days, 6:19:56", "remaining_time": "20:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7036, "total_steps": 9627, "loss": 1.5515, "learning_rate": 1.6833064547788053e-05, "epoch": 0.730861119767321, "percentage": 73.09, "elapsed_time": "2 days, 6:20:27", "remaining_time": "20:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7037, "total_steps": 9627, "loss": 1.7212, "learning_rate": 1.6820856308933543e-05, "epoch": 0.7309649942869014, "percentage": 73.1, "elapsed_time": "2 days, 6:20:59", "remaining_time": "20:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7038, "total_steps": 9627, "loss": 1.5695, "learning_rate": 1.6808651603399024e-05, "epoch": 0.7310688688064818, "percentage": 73.11, "elapsed_time": "2 days, 6:21:32", "remaining_time": "19:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7039, "total_steps": 9627, "loss": 1.6526, "learning_rate": 1.6796450432484212e-05, "epoch": 0.7311727433260621, "percentage": 73.12, "elapsed_time": "2 days, 6:22:04", "remaining_time": "19:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7040, "total_steps": 9627, "loss": 1.5189, "learning_rate": 1.678425279748843e-05, "epoch": 0.7312766178456425, "percentage": 73.13, "elapsed_time": "2 days, 6:22:36", "remaining_time": "19:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7041, "total_steps": 9627, "loss": 1.6336, "learning_rate": 1.6772058699710618e-05, "epoch": 0.7313804923652228, "percentage": 73.14, "elapsed_time": "2 days, 6:23:08", "remaining_time": "19:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7042, "total_steps": 9627, "loss": 1.5303, "learning_rate": 1.6759868140449397e-05, "epoch": 0.7314843668848031, "percentage": 73.15, "elapsed_time": "2 days, 6:23:40", "remaining_time": "19:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7043, "total_steps": 9627, "loss": 1.6328, "learning_rate": 1.6747681121002902e-05, "epoch": 0.7315882414043835, "percentage": 73.16, "elapsed_time": "2 days, 6:24:12", "remaining_time": "19:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7044, "total_steps": 9627, "loss": 1.7547, "learning_rate": 1.6735497642669008e-05, "epoch": 0.7316921159239639, "percentage": 73.17, "elapsed_time": "2 days, 6:24:45", "remaining_time": "19:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7045, "total_steps": 9627, "loss": 1.6887, "learning_rate": 1.6723317706745144e-05, "epoch": 0.7317959904435442, "percentage": 73.18, "elapsed_time": "2 days, 6:25:17", "remaining_time": "19:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7046, "total_steps": 9627, "loss": 1.4962, "learning_rate": 1.6711141314528374e-05, "epoch": 0.7318998649631245, "percentage": 73.19, "elapsed_time": "2 days, 6:25:49", "remaining_time": "19:56:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7047, "total_steps": 9627, "loss": 1.6409, "learning_rate": 1.669896846731539e-05, "epoch": 0.7320037394827049, "percentage": 73.2, "elapsed_time": "2 days, 6:26:21", "remaining_time": "19:55:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7048, "total_steps": 9627, "loss": 1.5295, "learning_rate": 1.6686799166402507e-05, "epoch": 0.7321076140022852, "percentage": 73.21, "elapsed_time": "2 days, 6:26:53", "remaining_time": "19:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7049, "total_steps": 9627, "loss": 1.5359, "learning_rate": 1.667463341308566e-05, "epoch": 0.7322114885218656, "percentage": 73.22, "elapsed_time": "2 days, 6:27:26", "remaining_time": "19:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7050, "total_steps": 9627, "loss": 1.5948, "learning_rate": 1.666247120866039e-05, "epoch": 0.732315363041446, "percentage": 73.23, "elapsed_time": "2 days, 6:27:57", "remaining_time": "19:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7051, "total_steps": 9627, "loss": 1.4639, "learning_rate": 1.6650312554421928e-05, "epoch": 0.7324192375610262, "percentage": 73.24, "elapsed_time": "2 days, 6:28:29", "remaining_time": "19:54:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7052, "total_steps": 9627, "loss": 1.8214, "learning_rate": 1.663815745166502e-05, "epoch": 0.7325231120806066, "percentage": 73.25, "elapsed_time": "2 days, 6:29:01", "remaining_time": "19:53:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7053, "total_steps": 9627, "loss": 1.5394, "learning_rate": 1.66260059016841e-05, "epoch": 0.732626986600187, "percentage": 73.26, "elapsed_time": "2 days, 6:29:34", "remaining_time": "19:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7054, "total_steps": 9627, "loss": 1.5732, "learning_rate": 1.6613857905773238e-05, "epoch": 0.7327308611197674, "percentage": 73.27, "elapsed_time": "2 days, 6:30:06", "remaining_time": "19:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7055, "total_steps": 9627, "loss": 1.6296, "learning_rate": 1.6601713465226086e-05, "epoch": 0.7328347356393476, "percentage": 73.28, "elapsed_time": "2 days, 6:30:39", "remaining_time": "19:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7056, "total_steps": 9627, "loss": 1.6349, "learning_rate": 1.6589572581335938e-05, "epoch": 0.732938610158928, "percentage": 73.29, "elapsed_time": "2 days, 6:31:11", "remaining_time": "19:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7057, "total_steps": 9627, "loss": 1.6986, "learning_rate": 1.6577435255395677e-05, "epoch": 0.7330424846785084, "percentage": 73.3, "elapsed_time": "2 days, 6:31:43", "remaining_time": "19:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7058, "total_steps": 9627, "loss": 1.7157, "learning_rate": 1.6565301488697893e-05, "epoch": 0.7331463591980887, "percentage": 73.31, "elapsed_time": "2 days, 6:32:15", "remaining_time": "19:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7059, "total_steps": 9627, "loss": 1.587, "learning_rate": 1.655317128253468e-05, "epoch": 0.7332502337176691, "percentage": 73.33, "elapsed_time": "2 days, 6:32:48", "remaining_time": "19:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7060, "total_steps": 9627, "loss": 1.7887, "learning_rate": 1.6541044638197818e-05, "epoch": 0.7333541082372494, "percentage": 73.34, "elapsed_time": "2 days, 6:33:20", "remaining_time": "19:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7061, "total_steps": 9627, "loss": 1.7428, "learning_rate": 1.6528921556978737e-05, "epoch": 0.7334579827568297, "percentage": 73.35, "elapsed_time": "2 days, 6:33:52", "remaining_time": "19:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7062, "total_steps": 9627, "loss": 1.79, "learning_rate": 1.65168020401684e-05, "epoch": 0.7335618572764101, "percentage": 73.36, "elapsed_time": "2 days, 6:34:24", "remaining_time": "19:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7063, "total_steps": 9627, "loss": 1.8929, "learning_rate": 1.650468608905748e-05, "epoch": 0.7336657317959905, "percentage": 73.37, "elapsed_time": "2 days, 6:34:56", "remaining_time": "19:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7064, "total_steps": 9627, "loss": 1.7476, "learning_rate": 1.649257370493622e-05, "epoch": 0.7337696063155708, "percentage": 73.38, "elapsed_time": "2 days, 6:35:28", "remaining_time": "19:48:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7065, "total_steps": 9627, "loss": 1.762, "learning_rate": 1.6480464889094493e-05, "epoch": 0.7338734808351511, "percentage": 73.39, "elapsed_time": "2 days, 6:36:01", "remaining_time": "19:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7066, "total_steps": 9627, "loss": 1.5714, "learning_rate": 1.646835964282179e-05, "epoch": 0.7339773553547315, "percentage": 73.4, "elapsed_time": "2 days, 6:36:33", "remaining_time": "19:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7067, "total_steps": 9627, "loss": 1.6522, "learning_rate": 1.6456257967407228e-05, "epoch": 0.7340812298743118, "percentage": 73.41, "elapsed_time": "2 days, 6:37:05", "remaining_time": "19:47:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7068, "total_steps": 9627, "loss": 1.7425, "learning_rate": 1.6444159864139542e-05, "epoch": 0.7341851043938922, "percentage": 73.42, "elapsed_time": "2 days, 6:37:38", "remaining_time": "19:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7069, "total_steps": 9627, "loss": 1.6434, "learning_rate": 1.6432065334307074e-05, "epoch": 0.7342889789134726, "percentage": 73.43, "elapsed_time": "2 days, 6:38:10", "remaining_time": "19:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7070, "total_steps": 9627, "loss": 1.7726, "learning_rate": 1.6419974379197834e-05, "epoch": 0.7343928534330528, "percentage": 73.44, "elapsed_time": "2 days, 6:38:42", "remaining_time": "19:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7071, "total_steps": 9627, "loss": 1.5734, "learning_rate": 1.6407887000099354e-05, "epoch": 0.7344967279526332, "percentage": 73.45, "elapsed_time": "2 days, 6:39:14", "remaining_time": "19:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7072, "total_steps": 9627, "loss": 1.7336, "learning_rate": 1.6395803198298905e-05, "epoch": 0.7346006024722136, "percentage": 73.46, "elapsed_time": "2 days, 6:39:46", "remaining_time": "19:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7073, "total_steps": 9627, "loss": 1.6019, "learning_rate": 1.6383722975083282e-05, "epoch": 0.7347044769917939, "percentage": 73.47, "elapsed_time": "2 days, 6:40:18", "remaining_time": "19:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7074, "total_steps": 9627, "loss": 1.7766, "learning_rate": 1.6371646331738953e-05, "epoch": 0.7348083515113742, "percentage": 73.48, "elapsed_time": "2 days, 6:40:50", "remaining_time": "19:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7075, "total_steps": 9627, "loss": 1.6961, "learning_rate": 1.6359573269551977e-05, "epoch": 0.7349122260309546, "percentage": 73.49, "elapsed_time": "2 days, 6:41:23", "remaining_time": "19:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7076, "total_steps": 9627, "loss": 1.6388, "learning_rate": 1.634750378980804e-05, "epoch": 0.7350161005505349, "percentage": 73.5, "elapsed_time": "2 days, 6:41:55", "remaining_time": "19:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7077, "total_steps": 9627, "loss": 1.6002, "learning_rate": 1.633543789379245e-05, "epoch": 0.7351199750701153, "percentage": 73.51, "elapsed_time": "2 days, 6:42:28", "remaining_time": "19:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7078, "total_steps": 9627, "loss": 1.7919, "learning_rate": 1.632337558279011e-05, "epoch": 0.7352238495896957, "percentage": 73.52, "elapsed_time": "2 days, 6:43:00", "remaining_time": "19:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7079, "total_steps": 9627, "loss": 1.5934, "learning_rate": 1.6311316858085607e-05, "epoch": 0.735327724109276, "percentage": 73.53, "elapsed_time": "2 days, 6:43:32", "remaining_time": "19:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7080, "total_steps": 9627, "loss": 1.6255, "learning_rate": 1.6299261720963093e-05, "epoch": 0.7354315986288563, "percentage": 73.54, "elapsed_time": "2 days, 6:44:04", "remaining_time": "19:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7081, "total_steps": 9627, "loss": 1.7223, "learning_rate": 1.6287210172706297e-05, "epoch": 0.7355354731484367, "percentage": 73.55, "elapsed_time": "2 days, 6:44:37", "remaining_time": "19:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7082, "total_steps": 9627, "loss": 1.6397, "learning_rate": 1.627516221459866e-05, "epoch": 0.7356393476680171, "percentage": 73.56, "elapsed_time": "2 days, 6:45:09", "remaining_time": "19:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7083, "total_steps": 9627, "loss": 1.7121, "learning_rate": 1.6263117847923182e-05, "epoch": 0.7357432221875974, "percentage": 73.57, "elapsed_time": "2 days, 6:45:41", "remaining_time": "19:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7084, "total_steps": 9627, "loss": 1.5572, "learning_rate": 1.62510770739625e-05, "epoch": 0.7358470967071777, "percentage": 73.58, "elapsed_time": "2 days, 6:46:13", "remaining_time": "19:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7085, "total_steps": 9627, "loss": 1.6877, "learning_rate": 1.6239039893998842e-05, "epoch": 0.7359509712267581, "percentage": 73.6, "elapsed_time": "2 days, 6:46:46", "remaining_time": "19:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7086, "total_steps": 9627, "loss": 1.4045, "learning_rate": 1.622700630931412e-05, "epoch": 0.7360548457463384, "percentage": 73.61, "elapsed_time": "2 days, 6:47:17", "remaining_time": "19:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7087, "total_steps": 9627, "loss": 1.6824, "learning_rate": 1.6214976321189768e-05, "epoch": 0.7361587202659188, "percentage": 73.62, "elapsed_time": "2 days, 6:47:49", "remaining_time": "19:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7088, "total_steps": 9627, "loss": 1.6501, "learning_rate": 1.6202949930906893e-05, "epoch": 0.7362625947854992, "percentage": 73.63, "elapsed_time": "2 days, 6:48:21", "remaining_time": "19:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7089, "total_steps": 9627, "loss": 1.7141, "learning_rate": 1.6190927139746255e-05, "epoch": 0.7363664693050794, "percentage": 73.64, "elapsed_time": "2 days, 6:48:54", "remaining_time": "19:37:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7090, "total_steps": 9627, "loss": 1.8566, "learning_rate": 1.617890794898812e-05, "epoch": 0.7364703438246598, "percentage": 73.65, "elapsed_time": "2 days, 6:49:27", "remaining_time": "19:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7091, "total_steps": 9627, "loss": 1.6646, "learning_rate": 1.616689235991249e-05, "epoch": 0.7365742183442402, "percentage": 73.66, "elapsed_time": "2 days, 6:49:59", "remaining_time": "19:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7092, "total_steps": 9627, "loss": 1.6597, "learning_rate": 1.6154880373798918e-05, "epoch": 0.7366780928638205, "percentage": 73.67, "elapsed_time": "2 days, 6:50:31", "remaining_time": "19:36:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7093, "total_steps": 9627, "loss": 1.8035, "learning_rate": 1.6142871991926584e-05, "epoch": 0.7367819673834008, "percentage": 73.68, "elapsed_time": "2 days, 6:51:04", "remaining_time": "19:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7094, "total_steps": 9627, "loss": 1.446, "learning_rate": 1.6130867215574284e-05, "epoch": 0.7368858419029812, "percentage": 73.69, "elapsed_time": "2 days, 6:51:36", "remaining_time": "19:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7095, "total_steps": 9627, "loss": 1.5551, "learning_rate": 1.6118866046020438e-05, "epoch": 0.7369897164225615, "percentage": 73.7, "elapsed_time": "2 days, 6:52:08", "remaining_time": "19:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7096, "total_steps": 9627, "loss": 1.8941, "learning_rate": 1.6106868484543076e-05, "epoch": 0.7370935909421419, "percentage": 73.71, "elapsed_time": "2 days, 6:52:41", "remaining_time": "19:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7097, "total_steps": 9627, "loss": 1.6175, "learning_rate": 1.6094874532419828e-05, "epoch": 0.7371974654617223, "percentage": 73.72, "elapsed_time": "2 days, 6:53:12", "remaining_time": "19:33:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7098, "total_steps": 9627, "loss": 1.7482, "learning_rate": 1.6082884190928004e-05, "epoch": 0.7373013399813025, "percentage": 73.73, "elapsed_time": "2 days, 6:53:45", "remaining_time": "19:33:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7099, "total_steps": 9627, "loss": 1.7566, "learning_rate": 1.6070897461344413e-05, "epoch": 0.7374052145008829, "percentage": 73.74, "elapsed_time": "2 days, 6:54:17", "remaining_time": "19:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7100, "total_steps": 9627, "loss": 1.576, "learning_rate": 1.6058914344945607e-05, "epoch": 0.7375090890204633, "percentage": 73.75, "elapsed_time": "2 days, 6:54:49", "remaining_time": "19:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7101, "total_steps": 9627, "loss": 1.6982, "learning_rate": 1.604693484300767e-05, "epoch": 0.7376129635400436, "percentage": 73.76, "elapsed_time": "2 days, 6:55:22", "remaining_time": "19:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7102, "total_steps": 9627, "loss": 1.8107, "learning_rate": 1.6034958956806333e-05, "epoch": 0.737716838059624, "percentage": 73.77, "elapsed_time": "2 days, 6:55:54", "remaining_time": "19:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7103, "total_steps": 9627, "loss": 1.5234, "learning_rate": 1.6022986687616926e-05, "epoch": 0.7378207125792043, "percentage": 73.78, "elapsed_time": "2 days, 6:56:26", "remaining_time": "19:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7104, "total_steps": 9627, "loss": 1.7615, "learning_rate": 1.6011018036714388e-05, "epoch": 0.7379245870987847, "percentage": 73.79, "elapsed_time": "2 days, 6:56:58", "remaining_time": "19:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7105, "total_steps": 9627, "loss": 1.7623, "learning_rate": 1.599905300537334e-05, "epoch": 0.738028461618365, "percentage": 73.8, "elapsed_time": "2 days, 6:57:30", "remaining_time": "19:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7106, "total_steps": 9627, "loss": 1.7175, "learning_rate": 1.598709159486789e-05, "epoch": 0.7381323361379454, "percentage": 73.81, "elapsed_time": "2 days, 6:58:03", "remaining_time": "19:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7107, "total_steps": 9627, "loss": 1.8187, "learning_rate": 1.5975133806471903e-05, "epoch": 0.7382362106575258, "percentage": 73.82, "elapsed_time": "2 days, 6:58:35", "remaining_time": "19:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7108, "total_steps": 9627, "loss": 1.6612, "learning_rate": 1.596317964145877e-05, "epoch": 0.738340085177106, "percentage": 73.83, "elapsed_time": "2 days, 6:59:07", "remaining_time": "19:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7109, "total_steps": 9627, "loss": 1.6154, "learning_rate": 1.5951229101101473e-05, "epoch": 0.7384439596966864, "percentage": 73.84, "elapsed_time": "2 days, 6:59:39", "remaining_time": "19:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7110, "total_steps": 9627, "loss": 1.706, "learning_rate": 1.5939282186672705e-05, "epoch": 0.7385478342162668, "percentage": 73.85, "elapsed_time": "2 days, 7:00:12", "remaining_time": "19:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7111, "total_steps": 9627, "loss": 1.6324, "learning_rate": 1.5927338899444706e-05, "epoch": 0.7386517087358471, "percentage": 73.87, "elapsed_time": "2 days, 7:00:44", "remaining_time": "19:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7112, "total_steps": 9627, "loss": 1.6332, "learning_rate": 1.5915399240689325e-05, "epoch": 0.7387555832554275, "percentage": 73.88, "elapsed_time": "2 days, 7:01:16", "remaining_time": "19:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7113, "total_steps": 9627, "loss": 1.6949, "learning_rate": 1.5903463211678067e-05, "epoch": 0.7388594577750078, "percentage": 73.89, "elapsed_time": "2 days, 7:01:48", "remaining_time": "19:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7114, "total_steps": 9627, "loss": 1.6298, "learning_rate": 1.5891530813682008e-05, "epoch": 0.7389633322945881, "percentage": 73.9, "elapsed_time": "2 days, 7:02:20", "remaining_time": "19:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7115, "total_steps": 9627, "loss": 1.4948, "learning_rate": 1.5879602047971865e-05, "epoch": 0.7390672068141685, "percentage": 73.91, "elapsed_time": "2 days, 7:02:52", "remaining_time": "19:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7116, "total_steps": 9627, "loss": 1.607, "learning_rate": 1.586767691581793e-05, "epoch": 0.7391710813337489, "percentage": 73.92, "elapsed_time": "2 days, 7:03:25", "remaining_time": "19:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7117, "total_steps": 9627, "loss": 1.5812, "learning_rate": 1.58557554184902e-05, "epoch": 0.7392749558533291, "percentage": 73.93, "elapsed_time": "2 days, 7:03:57", "remaining_time": "19:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7118, "total_steps": 9627, "loss": 1.6636, "learning_rate": 1.584383755725815e-05, "epoch": 0.7393788303729095, "percentage": 73.94, "elapsed_time": "2 days, 7:04:29", "remaining_time": "19:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7119, "total_steps": 9627, "loss": 1.4104, "learning_rate": 1.5831923333390985e-05, "epoch": 0.7394827048924899, "percentage": 73.95, "elapsed_time": "2 days, 7:05:02", "remaining_time": "19:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7120, "total_steps": 9627, "loss": 1.4713, "learning_rate": 1.5820012748157464e-05, "epoch": 0.7395865794120702, "percentage": 73.96, "elapsed_time": "2 days, 7:05:34", "remaining_time": "19:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7121, "total_steps": 9627, "loss": 1.3777, "learning_rate": 1.5808105802825975e-05, "epoch": 0.7396904539316506, "percentage": 73.97, "elapsed_time": "2 days, 7:06:06", "remaining_time": "19:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7122, "total_steps": 9627, "loss": 1.6707, "learning_rate": 1.579620249866451e-05, "epoch": 0.7397943284512309, "percentage": 73.98, "elapsed_time": "2 days, 7:06:38", "remaining_time": "19:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7123, "total_steps": 9627, "loss": 1.4956, "learning_rate": 1.5784302836940678e-05, "epoch": 0.7398982029708112, "percentage": 73.99, "elapsed_time": "2 days, 7:07:11", "remaining_time": "19:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7124, "total_steps": 9627, "loss": 1.7082, "learning_rate": 1.5772406818921697e-05, "epoch": 0.7400020774903916, "percentage": 74.0, "elapsed_time": "2 days, 7:07:43", "remaining_time": "19:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7125, "total_steps": 9627, "loss": 1.7969, "learning_rate": 1.576051444587439e-05, "epoch": 0.740105952009972, "percentage": 74.01, "elapsed_time": "2 days, 7:08:15", "remaining_time": "19:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7126, "total_steps": 9627, "loss": 1.7028, "learning_rate": 1.574862571906525e-05, "epoch": 0.7402098265295523, "percentage": 74.02, "elapsed_time": "2 days, 7:08:47", "remaining_time": "19:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7127, "total_steps": 9627, "loss": 1.6769, "learning_rate": 1.5736740639760272e-05, "epoch": 0.7403137010491326, "percentage": 74.03, "elapsed_time": "2 days, 7:09:20", "remaining_time": "19:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7128, "total_steps": 9627, "loss": 1.5418, "learning_rate": 1.5724859209225168e-05, "epoch": 0.740417575568713, "percentage": 74.04, "elapsed_time": "2 days, 7:09:52", "remaining_time": "19:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7129, "total_steps": 9627, "loss": 1.5925, "learning_rate": 1.5712981428725192e-05, "epoch": 0.7405214500882933, "percentage": 74.05, "elapsed_time": "2 days, 7:10:24", "remaining_time": "19:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7130, "total_steps": 9627, "loss": 1.5975, "learning_rate": 1.5701107299525253e-05, "epoch": 0.7406253246078737, "percentage": 74.06, "elapsed_time": "2 days, 7:10:57", "remaining_time": "19:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7131, "total_steps": 9627, "loss": 1.8195, "learning_rate": 1.5689236822889846e-05, "epoch": 0.740729199127454, "percentage": 74.07, "elapsed_time": "2 days, 7:11:29", "remaining_time": "19:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7132, "total_steps": 9627, "loss": 1.4801, "learning_rate": 1.5677370000083065e-05, "epoch": 0.7408330736470344, "percentage": 74.08, "elapsed_time": "2 days, 7:12:01", "remaining_time": "19:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7133, "total_steps": 9627, "loss": 1.4249, "learning_rate": 1.566550683236868e-05, "epoch": 0.7409369481666147, "percentage": 74.09, "elapsed_time": "2 days, 7:12:33", "remaining_time": "19:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7134, "total_steps": 9627, "loss": 1.8544, "learning_rate": 1.5653647321009973e-05, "epoch": 0.7410408226861951, "percentage": 74.1, "elapsed_time": "2 days, 7:13:06", "remaining_time": "19:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7135, "total_steps": 9627, "loss": 1.5443, "learning_rate": 1.5641791467269922e-05, "epoch": 0.7411446972057755, "percentage": 74.11, "elapsed_time": "2 days, 7:13:38", "remaining_time": "19:17:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7136, "total_steps": 9627, "loss": 1.6799, "learning_rate": 1.56299392724111e-05, "epoch": 0.7412485717253557, "percentage": 74.12, "elapsed_time": "2 days, 7:14:10", "remaining_time": "19:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7137, "total_steps": 9627, "loss": 1.5797, "learning_rate": 1.561809073769561e-05, "epoch": 0.7413524462449361, "percentage": 74.14, "elapsed_time": "2 days, 7:14:42", "remaining_time": "19:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7138, "total_steps": 9627, "loss": 1.6916, "learning_rate": 1.5606245864385287e-05, "epoch": 0.7414563207645165, "percentage": 74.15, "elapsed_time": "2 days, 7:15:14", "remaining_time": "19:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7139, "total_steps": 9627, "loss": 1.4902, "learning_rate": 1.5594404653741494e-05, "epoch": 0.7415601952840968, "percentage": 74.16, "elapsed_time": "2 days, 7:15:46", "remaining_time": "19:15:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7140, "total_steps": 9627, "loss": 1.6821, "learning_rate": 1.5582567107025237e-05, "epoch": 0.7416640698036772, "percentage": 74.17, "elapsed_time": "2 days, 7:16:19", "remaining_time": "19:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7141, "total_steps": 9627, "loss": 1.6489, "learning_rate": 1.5570733225497115e-05, "epoch": 0.7417679443232575, "percentage": 74.18, "elapsed_time": "2 days, 7:16:51", "remaining_time": "19:14:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7142, "total_steps": 9627, "loss": 1.766, "learning_rate": 1.5558903010417346e-05, "epoch": 0.7418718188428378, "percentage": 74.19, "elapsed_time": "2 days, 7:17:23", "remaining_time": "19:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7143, "total_steps": 9627, "loss": 1.6973, "learning_rate": 1.5547076463045756e-05, "epoch": 0.7419756933624182, "percentage": 74.2, "elapsed_time": "2 days, 7:17:56", "remaining_time": "19:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7144, "total_steps": 9627, "loss": 1.7257, "learning_rate": 1.5535253584641762e-05, "epoch": 0.7420795678819986, "percentage": 74.21, "elapsed_time": "2 days, 7:18:28", "remaining_time": "19:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7145, "total_steps": 9627, "loss": 1.7526, "learning_rate": 1.552343437646446e-05, "epoch": 0.7421834424015789, "percentage": 74.22, "elapsed_time": "2 days, 7:19:00", "remaining_time": "19:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7146, "total_steps": 9627, "loss": 1.6038, "learning_rate": 1.5511618839772437e-05, "epoch": 0.7422873169211592, "percentage": 74.23, "elapsed_time": "2 days, 7:19:32", "remaining_time": "19:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7147, "total_steps": 9627, "loss": 1.6295, "learning_rate": 1.5499806975824e-05, "epoch": 0.7423911914407396, "percentage": 74.24, "elapsed_time": "2 days, 7:20:05", "remaining_time": "19:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7148, "total_steps": 9627, "loss": 1.6083, "learning_rate": 1.5487998785877005e-05, "epoch": 0.7424950659603199, "percentage": 74.25, "elapsed_time": "2 days, 7:20:37", "remaining_time": "19:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7149, "total_steps": 9627, "loss": 1.6872, "learning_rate": 1.5476194271188944e-05, "epoch": 0.7425989404799003, "percentage": 74.26, "elapsed_time": "2 days, 7:21:09", "remaining_time": "19:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7150, "total_steps": 9627, "loss": 1.6835, "learning_rate": 1.5464393433016895e-05, "epoch": 0.7427028149994807, "percentage": 74.27, "elapsed_time": "2 days, 7:21:41", "remaining_time": "19:10:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7151, "total_steps": 9627, "loss": 1.6991, "learning_rate": 1.5452596272617555e-05, "epoch": 0.7428066895190609, "percentage": 74.28, "elapsed_time": "2 days, 7:22:14", "remaining_time": "19:10:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7152, "total_steps": 9627, "loss": 1.5401, "learning_rate": 1.5440802791247234e-05, "epoch": 0.7429105640386413, "percentage": 74.29, "elapsed_time": "2 days, 7:22:46", "remaining_time": "19:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7153, "total_steps": 9627, "loss": 1.604, "learning_rate": 1.5429012990161827e-05, "epoch": 0.7430144385582217, "percentage": 74.3, "elapsed_time": "2 days, 7:23:18", "remaining_time": "19:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7154, "total_steps": 9627, "loss": 1.6432, "learning_rate": 1.5417226870616902e-05, "epoch": 0.743118313077802, "percentage": 74.31, "elapsed_time": "2 days, 7:23:50", "remaining_time": "19:08:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7155, "total_steps": 9627, "loss": 1.5474, "learning_rate": 1.540544443386753e-05, "epoch": 0.7432221875973823, "percentage": 74.32, "elapsed_time": "2 days, 7:24:23", "remaining_time": "19:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7156, "total_steps": 9627, "loss": 1.8406, "learning_rate": 1.5393665681168496e-05, "epoch": 0.7433260621169627, "percentage": 74.33, "elapsed_time": "2 days, 7:24:55", "remaining_time": "19:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7157, "total_steps": 9627, "loss": 1.589, "learning_rate": 1.5381890613774126e-05, "epoch": 0.7434299366365431, "percentage": 74.34, "elapsed_time": "2 days, 7:25:27", "remaining_time": "19:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7158, "total_steps": 9627, "loss": 1.4567, "learning_rate": 1.537011923293837e-05, "epoch": 0.7435338111561234, "percentage": 74.35, "elapsed_time": "2 days, 7:25:59", "remaining_time": "19:07:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7159, "total_steps": 9627, "loss": 1.5574, "learning_rate": 1.5358351539914794e-05, "epoch": 0.7436376856757038, "percentage": 74.36, "elapsed_time": "2 days, 7:26:32", "remaining_time": "19:06:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7160, "total_steps": 9627, "loss": 1.7159, "learning_rate": 1.5346587535956547e-05, "epoch": 0.7437415601952841, "percentage": 74.37, "elapsed_time": "2 days, 7:27:04", "remaining_time": "19:06:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7161, "total_steps": 9627, "loss": 1.6007, "learning_rate": 1.5334827222316457e-05, "epoch": 0.7438454347148644, "percentage": 74.38, "elapsed_time": "2 days, 7:27:36", "remaining_time": "19:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7162, "total_steps": 9627, "loss": 1.7471, "learning_rate": 1.5323070600246832e-05, "epoch": 0.7439493092344448, "percentage": 74.39, "elapsed_time": "2 days, 7:28:09", "remaining_time": "19:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7163, "total_steps": 9627, "loss": 1.6716, "learning_rate": 1.5311317670999714e-05, "epoch": 0.7440531837540252, "percentage": 74.41, "elapsed_time": "2 days, 7:28:41", "remaining_time": "19:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7164, "total_steps": 9627, "loss": 1.7037, "learning_rate": 1.52995684358267e-05, "epoch": 0.7441570582736055, "percentage": 74.42, "elapsed_time": "2 days, 7:29:13", "remaining_time": "19:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7165, "total_steps": 9627, "loss": 1.6881, "learning_rate": 1.5287822895978942e-05, "epoch": 0.7442609327931858, "percentage": 74.43, "elapsed_time": "2 days, 7:29:45", "remaining_time": "19:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7166, "total_steps": 9627, "loss": 1.7643, "learning_rate": 1.52760810527073e-05, "epoch": 0.7443648073127662, "percentage": 74.44, "elapsed_time": "2 days, 7:30:18", "remaining_time": "19:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7167, "total_steps": 9627, "loss": 1.6576, "learning_rate": 1.5264342907262164e-05, "epoch": 0.7444686818323465, "percentage": 74.45, "elapsed_time": "2 days, 7:30:50", "remaining_time": "19:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7168, "total_steps": 9627, "loss": 1.7985, "learning_rate": 1.5252608460893558e-05, "epoch": 0.7445725563519269, "percentage": 74.46, "elapsed_time": "2 days, 7:31:22", "remaining_time": "19:02:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7169, "total_steps": 9627, "loss": 1.6071, "learning_rate": 1.5240877714851115e-05, "epoch": 0.7446764308715073, "percentage": 74.47, "elapsed_time": "2 days, 7:31:55", "remaining_time": "19:02:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7170, "total_steps": 9627, "loss": 1.6072, "learning_rate": 1.5229150670384056e-05, "epoch": 0.7447803053910875, "percentage": 74.48, "elapsed_time": "2 days, 7:32:27", "remaining_time": "19:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7171, "total_steps": 9627, "loss": 1.642, "learning_rate": 1.5217427328741235e-05, "epoch": 0.7448841799106679, "percentage": 74.49, "elapsed_time": "2 days, 7:32:59", "remaining_time": "19:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7172, "total_steps": 9627, "loss": 1.7441, "learning_rate": 1.5205707691171074e-05, "epoch": 0.7449880544302483, "percentage": 74.5, "elapsed_time": "2 days, 7:33:32", "remaining_time": "19:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7173, "total_steps": 9627, "loss": 1.7042, "learning_rate": 1.5193991758921666e-05, "epoch": 0.7450919289498286, "percentage": 74.51, "elapsed_time": "2 days, 7:34:04", "remaining_time": "19:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7174, "total_steps": 9627, "loss": 1.4862, "learning_rate": 1.5182279533240606e-05, "epoch": 0.745195803469409, "percentage": 74.52, "elapsed_time": "2 days, 7:34:37", "remaining_time": "19:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7175, "total_steps": 9627, "loss": 1.8971, "learning_rate": 1.5170571015375207e-05, "epoch": 0.7452996779889893, "percentage": 74.53, "elapsed_time": "2 days, 7:35:09", "remaining_time": "18:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7176, "total_steps": 9627, "loss": 1.5441, "learning_rate": 1.5158866206572313e-05, "epoch": 0.7454035525085696, "percentage": 74.54, "elapsed_time": "2 days, 7:35:42", "remaining_time": "18:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7177, "total_steps": 9627, "loss": 1.7365, "learning_rate": 1.5147165108078398e-05, "epoch": 0.74550742702815, "percentage": 74.55, "elapsed_time": "2 days, 7:36:14", "remaining_time": "18:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7178, "total_steps": 9627, "loss": 1.5903, "learning_rate": 1.5135467721139535e-05, "epoch": 0.7456113015477304, "percentage": 74.56, "elapsed_time": "2 days, 7:36:46", "remaining_time": "18:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7179, "total_steps": 9627, "loss": 1.6461, "learning_rate": 1.5123774047001404e-05, "epoch": 0.7457151760673106, "percentage": 74.57, "elapsed_time": "2 days, 7:37:19", "remaining_time": "18:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7180, "total_steps": 9627, "loss": 1.5398, "learning_rate": 1.5112084086909296e-05, "epoch": 0.745819050586891, "percentage": 74.58, "elapsed_time": "2 days, 7:37:51", "remaining_time": "18:57:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7181, "total_steps": 9627, "loss": 1.612, "learning_rate": 1.5100397842108078e-05, "epoch": 0.7459229251064714, "percentage": 74.59, "elapsed_time": "2 days, 7:38:23", "remaining_time": "18:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7182, "total_steps": 9627, "loss": 1.5695, "learning_rate": 1.5088715313842278e-05, "epoch": 0.7460267996260518, "percentage": 74.6, "elapsed_time": "2 days, 7:38:56", "remaining_time": "18:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7183, "total_steps": 9627, "loss": 1.6183, "learning_rate": 1.507703650335598e-05, "epoch": 0.7461306741456321, "percentage": 74.61, "elapsed_time": "2 days, 7:39:28", "remaining_time": "18:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7184, "total_steps": 9627, "loss": 1.6235, "learning_rate": 1.506536141189288e-05, "epoch": 0.7462345486652124, "percentage": 74.62, "elapsed_time": "2 days, 7:40:00", "remaining_time": "18:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7185, "total_steps": 9627, "loss": 1.6717, "learning_rate": 1.5053690040696295e-05, "epoch": 0.7463384231847928, "percentage": 74.63, "elapsed_time": "2 days, 7:40:32", "remaining_time": "18:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7186, "total_steps": 9627, "loss": 1.5891, "learning_rate": 1.504202239100913e-05, "epoch": 0.7464422977043731, "percentage": 74.64, "elapsed_time": "2 days, 7:41:05", "remaining_time": "18:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7187, "total_steps": 9627, "loss": 1.6755, "learning_rate": 1.5030358464073891e-05, "epoch": 0.7465461722239535, "percentage": 74.65, "elapsed_time": "2 days, 7:41:37", "remaining_time": "18:54:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7188, "total_steps": 9627, "loss": 1.6644, "learning_rate": 1.501869826113269e-05, "epoch": 0.7466500467435339, "percentage": 74.67, "elapsed_time": "2 days, 7:42:09", "remaining_time": "18:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7189, "total_steps": 9627, "loss": 1.6723, "learning_rate": 1.5007041783427294e-05, "epoch": 0.7467539212631141, "percentage": 74.68, "elapsed_time": "2 days, 7:42:41", "remaining_time": "18:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7190, "total_steps": 9627, "loss": 1.7799, "learning_rate": 1.4995389032198958e-05, "epoch": 0.7468577957826945, "percentage": 74.69, "elapsed_time": "2 days, 7:43:14", "remaining_time": "18:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7191, "total_steps": 9627, "loss": 1.6653, "learning_rate": 1.4983740008688657e-05, "epoch": 0.7469616703022749, "percentage": 74.7, "elapsed_time": "2 days, 7:43:46", "remaining_time": "18:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7192, "total_steps": 9627, "loss": 1.5746, "learning_rate": 1.4972094714136926e-05, "epoch": 0.7470655448218552, "percentage": 74.71, "elapsed_time": "2 days, 7:44:18", "remaining_time": "18:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7193, "total_steps": 9627, "loss": 1.5334, "learning_rate": 1.4960453149783848e-05, "epoch": 0.7471694193414355, "percentage": 74.72, "elapsed_time": "2 days, 7:44:50", "remaining_time": "18:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7194, "total_steps": 9627, "loss": 1.7637, "learning_rate": 1.4948815316869207e-05, "epoch": 0.7472732938610159, "percentage": 74.73, "elapsed_time": "2 days, 7:45:23", "remaining_time": "18:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7195, "total_steps": 9627, "loss": 1.7789, "learning_rate": 1.4937181216632323e-05, "epoch": 0.7473771683805962, "percentage": 74.74, "elapsed_time": "2 days, 7:45:55", "remaining_time": "18:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7196, "total_steps": 9627, "loss": 1.7327, "learning_rate": 1.4925550850312142e-05, "epoch": 0.7474810429001766, "percentage": 74.75, "elapsed_time": "2 days, 7:46:27", "remaining_time": "18:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7197, "total_steps": 9627, "loss": 1.6193, "learning_rate": 1.4913924219147202e-05, "epoch": 0.747584917419757, "percentage": 74.76, "elapsed_time": "2 days, 7:46:59", "remaining_time": "18:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7198, "total_steps": 9627, "loss": 1.75, "learning_rate": 1.490230132437565e-05, "epoch": 0.7476887919393372, "percentage": 74.77, "elapsed_time": "2 days, 7:47:32", "remaining_time": "18:49:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7199, "total_steps": 9627, "loss": 1.5587, "learning_rate": 1.4890682167235238e-05, "epoch": 0.7477926664589176, "percentage": 74.78, "elapsed_time": "2 days, 7:48:04", "remaining_time": "18:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7200, "total_steps": 9627, "loss": 1.7437, "learning_rate": 1.4879066748963295e-05, "epoch": 0.747896540978498, "percentage": 74.79, "elapsed_time": "2 days, 7:48:36", "remaining_time": "18:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7201, "total_steps": 9627, "loss": 1.6074, "learning_rate": 1.4867455070796816e-05, "epoch": 0.7480004154980783, "percentage": 74.8, "elapsed_time": "2 days, 7:49:09", "remaining_time": "18:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7202, "total_steps": 9627, "loss": 1.5822, "learning_rate": 1.48558471339723e-05, "epoch": 0.7481042900176587, "percentage": 74.81, "elapsed_time": "2 days, 7:49:41", "remaining_time": "18:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7203, "total_steps": 9627, "loss": 1.6097, "learning_rate": 1.4844242939725944e-05, "epoch": 0.748208164537239, "percentage": 74.82, "elapsed_time": "2 days, 7:50:13", "remaining_time": "18:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7204, "total_steps": 9627, "loss": 1.7464, "learning_rate": 1.483264248929349e-05, "epoch": 0.7483120390568193, "percentage": 74.83, "elapsed_time": "2 days, 7:50:45", "remaining_time": "18:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7205, "total_steps": 9627, "loss": 1.6601, "learning_rate": 1.4821045783910298e-05, "epoch": 0.7484159135763997, "percentage": 74.84, "elapsed_time": "2 days, 7:51:18", "remaining_time": "18:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7206, "total_steps": 9627, "loss": 1.9072, "learning_rate": 1.480945282481132e-05, "epoch": 0.7485197880959801, "percentage": 74.85, "elapsed_time": "2 days, 7:51:50", "remaining_time": "18:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7207, "total_steps": 9627, "loss": 1.7274, "learning_rate": 1.4797863613231122e-05, "epoch": 0.7486236626155603, "percentage": 74.86, "elapsed_time": "2 days, 7:52:23", "remaining_time": "18:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7208, "total_steps": 9627, "loss": 1.5798, "learning_rate": 1.478627815040386e-05, "epoch": 0.7487275371351407, "percentage": 74.87, "elapsed_time": "2 days, 7:52:55", "remaining_time": "18:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7209, "total_steps": 9627, "loss": 1.5999, "learning_rate": 1.4774696437563278e-05, "epoch": 0.7488314116547211, "percentage": 74.88, "elapsed_time": "2 days, 7:53:27", "remaining_time": "18:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7210, "total_steps": 9627, "loss": 1.7148, "learning_rate": 1.4763118475942784e-05, "epoch": 0.7489352861743015, "percentage": 74.89, "elapsed_time": "2 days, 7:54:00", "remaining_time": "18:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7211, "total_steps": 9627, "loss": 1.7499, "learning_rate": 1.4751544266775302e-05, "epoch": 0.7490391606938818, "percentage": 74.9, "elapsed_time": "2 days, 7:54:32", "remaining_time": "18:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7212, "total_steps": 9627, "loss": 1.6405, "learning_rate": 1.473997381129341e-05, "epoch": 0.7491430352134621, "percentage": 74.91, "elapsed_time": "2 days, 7:55:05", "remaining_time": "18:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7213, "total_steps": 9627, "loss": 1.7749, "learning_rate": 1.4728407110729275e-05, "epoch": 0.7492469097330425, "percentage": 74.92, "elapsed_time": "2 days, 7:55:37", "remaining_time": "18:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7214, "total_steps": 9627, "loss": 1.6553, "learning_rate": 1.4716844166314648e-05, "epoch": 0.7493507842526228, "percentage": 74.94, "elapsed_time": "2 days, 7:56:09", "remaining_time": "18:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7215, "total_steps": 9627, "loss": 1.8334, "learning_rate": 1.4705284979280898e-05, "epoch": 0.7494546587722032, "percentage": 74.95, "elapsed_time": "2 days, 7:56:42", "remaining_time": "18:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7216, "total_steps": 9627, "loss": 1.6999, "learning_rate": 1.4693729550858976e-05, "epoch": 0.7495585332917836, "percentage": 74.96, "elapsed_time": "2 days, 7:57:14", "remaining_time": "18:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7217, "total_steps": 9627, "loss": 1.7192, "learning_rate": 1.4682177882279486e-05, "epoch": 0.7496624078113638, "percentage": 74.97, "elapsed_time": "2 days, 7:57:47", "remaining_time": "18:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7218, "total_steps": 9627, "loss": 1.725, "learning_rate": 1.4670629974772532e-05, "epoch": 0.7497662823309442, "percentage": 74.98, "elapsed_time": "2 days, 7:58:19", "remaining_time": "18:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7219, "total_steps": 9627, "loss": 1.5319, "learning_rate": 1.465908582956792e-05, "epoch": 0.7498701568505246, "percentage": 74.99, "elapsed_time": "2 days, 7:58:51", "remaining_time": "18:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7220, "total_steps": 9627, "loss": 1.6354, "learning_rate": 1.4647545447895017e-05, "epoch": 0.7499740313701049, "percentage": 75.0, "elapsed_time": "2 days, 7:59:23", "remaining_time": "18:39:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7221, "total_steps": 9627, "loss": 1.8322, "learning_rate": 1.4636008830982729e-05, "epoch": 0.7500779058896853, "percentage": 75.01, "elapsed_time": "2 days, 7:59:56", "remaining_time": "18:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7222, "total_steps": 9627, "loss": 1.5982, "learning_rate": 1.4624475980059665e-05, "epoch": 0.7501817804092656, "percentage": 75.02, "elapsed_time": "2 days, 8:00:28", "remaining_time": "18:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7223, "total_steps": 9627, "loss": 1.5379, "learning_rate": 1.4612946896353974e-05, "epoch": 0.7502856549288459, "percentage": 75.03, "elapsed_time": "2 days, 8:01:00", "remaining_time": "18:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7224, "total_steps": 9627, "loss": 1.6689, "learning_rate": 1.4601421581093406e-05, "epoch": 0.7503895294484263, "percentage": 75.04, "elapsed_time": "2 days, 8:01:33", "remaining_time": "18:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7225, "total_steps": 9627, "loss": 1.6664, "learning_rate": 1.4589900035505321e-05, "epoch": 0.7504934039680067, "percentage": 75.05, "elapsed_time": "2 days, 8:02:05", "remaining_time": "18:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7226, "total_steps": 9627, "loss": 1.81, "learning_rate": 1.4578382260816669e-05, "epoch": 0.750597278487587, "percentage": 75.06, "elapsed_time": "2 days, 8:02:38", "remaining_time": "18:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7227, "total_steps": 9627, "loss": 1.5913, "learning_rate": 1.4566868258254013e-05, "epoch": 0.7507011530071673, "percentage": 75.07, "elapsed_time": "2 days, 8:03:10", "remaining_time": "18:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7228, "total_steps": 9627, "loss": 1.6758, "learning_rate": 1.455535802904348e-05, "epoch": 0.7508050275267477, "percentage": 75.08, "elapsed_time": "2 days, 8:03:42", "remaining_time": "18:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7229, "total_steps": 9627, "loss": 1.6397, "learning_rate": 1.4543851574410872e-05, "epoch": 0.750908902046328, "percentage": 75.09, "elapsed_time": "2 days, 8:04:14", "remaining_time": "18:35:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7230, "total_steps": 9627, "loss": 1.6516, "learning_rate": 1.4532348895581465e-05, "epoch": 0.7510127765659084, "percentage": 75.1, "elapsed_time": "2 days, 8:04:47", "remaining_time": "18:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7231, "total_steps": 9627, "loss": 1.6518, "learning_rate": 1.4520849993780266e-05, "epoch": 0.7511166510854888, "percentage": 75.11, "elapsed_time": "2 days, 8:05:19", "remaining_time": "18:35:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7232, "total_steps": 9627, "loss": 1.5553, "learning_rate": 1.450935487023179e-05, "epoch": 0.751220525605069, "percentage": 75.12, "elapsed_time": "2 days, 8:05:52", "remaining_time": "18:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7233, "total_steps": 9627, "loss": 1.6917, "learning_rate": 1.4497863526160183e-05, "epoch": 0.7513244001246494, "percentage": 75.13, "elapsed_time": "2 days, 8:06:24", "remaining_time": "18:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7234, "total_steps": 9627, "loss": 1.4978, "learning_rate": 1.4486375962789184e-05, "epoch": 0.7514282746442298, "percentage": 75.14, "elapsed_time": "2 days, 8:06:57", "remaining_time": "18:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7235, "total_steps": 9627, "loss": 1.7395, "learning_rate": 1.447489218134211e-05, "epoch": 0.7515321491638102, "percentage": 75.15, "elapsed_time": "2 days, 8:07:29", "remaining_time": "18:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7236, "total_steps": 9627, "loss": 1.771, "learning_rate": 1.4463412183041947e-05, "epoch": 0.7516360236833904, "percentage": 75.16, "elapsed_time": "2 days, 8:08:01", "remaining_time": "18:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7237, "total_steps": 9627, "loss": 1.621, "learning_rate": 1.4451935969111158e-05, "epoch": 0.7517398982029708, "percentage": 75.17, "elapsed_time": "2 days, 8:08:34", "remaining_time": "18:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7238, "total_steps": 9627, "loss": 1.8537, "learning_rate": 1.4440463540771914e-05, "epoch": 0.7518437727225512, "percentage": 75.18, "elapsed_time": "2 days, 8:09:06", "remaining_time": "18:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7239, "total_steps": 9627, "loss": 1.6614, "learning_rate": 1.4428994899245934e-05, "epoch": 0.7519476472421315, "percentage": 75.19, "elapsed_time": "2 days, 8:09:39", "remaining_time": "18:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7240, "total_steps": 9627, "loss": 1.6751, "learning_rate": 1.4417530045754529e-05, "epoch": 0.7520515217617119, "percentage": 75.21, "elapsed_time": "2 days, 8:10:11", "remaining_time": "18:31:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7241, "total_steps": 9627, "loss": 1.8038, "learning_rate": 1.4406068981518623e-05, "epoch": 0.7521553962812922, "percentage": 75.22, "elapsed_time": "2 days, 8:10:44", "remaining_time": "18:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7242, "total_steps": 9627, "loss": 1.6524, "learning_rate": 1.4394611707758726e-05, "epoch": 0.7522592708008725, "percentage": 75.23, "elapsed_time": "2 days, 8:11:15", "remaining_time": "18:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7243, "total_steps": 9627, "loss": 1.7706, "learning_rate": 1.4383158225694948e-05, "epoch": 0.7523631453204529, "percentage": 75.24, "elapsed_time": "2 days, 8:11:48", "remaining_time": "18:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7244, "total_steps": 9627, "loss": 1.5644, "learning_rate": 1.4371708536546985e-05, "epoch": 0.7524670198400333, "percentage": 75.25, "elapsed_time": "2 days, 8:12:20", "remaining_time": "18:29:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7245, "total_steps": 9627, "loss": 1.6406, "learning_rate": 1.4360262641534179e-05, "epoch": 0.7525708943596136, "percentage": 75.26, "elapsed_time": "2 days, 8:12:53", "remaining_time": "18:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7246, "total_steps": 9627, "loss": 1.6899, "learning_rate": 1.4348820541875374e-05, "epoch": 0.7526747688791939, "percentage": 75.27, "elapsed_time": "2 days, 8:13:25", "remaining_time": "18:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7247, "total_steps": 9627, "loss": 1.4451, "learning_rate": 1.4337382238789105e-05, "epoch": 0.7527786433987743, "percentage": 75.28, "elapsed_time": "2 days, 8:13:57", "remaining_time": "18:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7248, "total_steps": 9627, "loss": 1.7071, "learning_rate": 1.432594773349346e-05, "epoch": 0.7528825179183546, "percentage": 75.29, "elapsed_time": "2 days, 8:14:29", "remaining_time": "18:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7249, "total_steps": 9627, "loss": 1.6278, "learning_rate": 1.4314517027206086e-05, "epoch": 0.752986392437935, "percentage": 75.3, "elapsed_time": "2 days, 8:15:02", "remaining_time": "18:27:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7250, "total_steps": 9627, "loss": 1.6032, "learning_rate": 1.4303090121144302e-05, "epoch": 0.7530902669575154, "percentage": 75.31, "elapsed_time": "2 days, 8:15:34", "remaining_time": "18:26:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7251, "total_steps": 9627, "loss": 1.5404, "learning_rate": 1.429166701652498e-05, "epoch": 0.7531941414770956, "percentage": 75.32, "elapsed_time": "2 days, 8:16:06", "remaining_time": "18:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7252, "total_steps": 9627, "loss": 1.73, "learning_rate": 1.4280247714564582e-05, "epoch": 0.753298015996676, "percentage": 75.33, "elapsed_time": "2 days, 8:16:39", "remaining_time": "18:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7253, "total_steps": 9627, "loss": 1.7523, "learning_rate": 1.4268832216479177e-05, "epoch": 0.7534018905162564, "percentage": 75.34, "elapsed_time": "2 days, 8:17:11", "remaining_time": "18:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7254, "total_steps": 9627, "loss": 1.605, "learning_rate": 1.4257420523484427e-05, "epoch": 0.7535057650358367, "percentage": 75.35, "elapsed_time": "2 days, 8:17:44", "remaining_time": "18:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7255, "total_steps": 9627, "loss": 1.5916, "learning_rate": 1.4246012636795592e-05, "epoch": 0.753609639555417, "percentage": 75.36, "elapsed_time": "2 days, 8:18:16", "remaining_time": "18:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7256, "total_steps": 9627, "loss": 1.7938, "learning_rate": 1.42346085576275e-05, "epoch": 0.7537135140749974, "percentage": 75.37, "elapsed_time": "2 days, 8:18:48", "remaining_time": "18:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7257, "total_steps": 9627, "loss": 1.5843, "learning_rate": 1.422320828719465e-05, "epoch": 0.7538173885945777, "percentage": 75.38, "elapsed_time": "2 days, 8:19:21", "remaining_time": "18:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7258, "total_steps": 9627, "loss": 1.5989, "learning_rate": 1.4211811826711014e-05, "epoch": 0.7539212631141581, "percentage": 75.39, "elapsed_time": "2 days, 8:19:53", "remaining_time": "18:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7259, "total_steps": 9627, "loss": 1.6587, "learning_rate": 1.4200419177390279e-05, "epoch": 0.7540251376337385, "percentage": 75.4, "elapsed_time": "2 days, 8:20:25", "remaining_time": "18:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7260, "total_steps": 9627, "loss": 1.5246, "learning_rate": 1.4189030340445646e-05, "epoch": 0.7541290121533188, "percentage": 75.41, "elapsed_time": "2 days, 8:20:58", "remaining_time": "18:22:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7261, "total_steps": 9627, "loss": 1.6807, "learning_rate": 1.4177645317089954e-05, "epoch": 0.7542328866728991, "percentage": 75.42, "elapsed_time": "2 days, 8:21:30", "remaining_time": "18:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7262, "total_steps": 9627, "loss": 1.6379, "learning_rate": 1.416626410853561e-05, "epoch": 0.7543367611924795, "percentage": 75.43, "elapsed_time": "2 days, 8:22:02", "remaining_time": "18:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7263, "total_steps": 9627, "loss": 1.6603, "learning_rate": 1.4154886715994603e-05, "epoch": 0.7544406357120599, "percentage": 75.44, "elapsed_time": "2 days, 8:22:35", "remaining_time": "18:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7264, "total_steps": 9627, "loss": 1.8564, "learning_rate": 1.4143513140678595e-05, "epoch": 0.7545445102316402, "percentage": 75.45, "elapsed_time": "2 days, 8:23:07", "remaining_time": "18:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7265, "total_steps": 9627, "loss": 1.7624, "learning_rate": 1.4132143383798713e-05, "epoch": 0.7546483847512205, "percentage": 75.46, "elapsed_time": "2 days, 8:23:39", "remaining_time": "18:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7266, "total_steps": 9627, "loss": 1.6411, "learning_rate": 1.4120777446565791e-05, "epoch": 0.7547522592708009, "percentage": 75.48, "elapsed_time": "2 days, 8:24:11", "remaining_time": "18:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7267, "total_steps": 9627, "loss": 1.6907, "learning_rate": 1.4109415330190213e-05, "epoch": 0.7548561337903812, "percentage": 75.49, "elapsed_time": "2 days, 8:24:43", "remaining_time": "18:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7268, "total_steps": 9627, "loss": 1.6414, "learning_rate": 1.4098057035881934e-05, "epoch": 0.7549600083099616, "percentage": 75.5, "elapsed_time": "2 days, 8:25:15", "remaining_time": "18:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7269, "total_steps": 9627, "loss": 1.5862, "learning_rate": 1.408670256485054e-05, "epoch": 0.755063882829542, "percentage": 75.51, "elapsed_time": "2 days, 8:25:47", "remaining_time": "18:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7270, "total_steps": 9627, "loss": 1.7012, "learning_rate": 1.4075351918305191e-05, "epoch": 0.7551677573491222, "percentage": 75.52, "elapsed_time": "2 days, 8:26:20", "remaining_time": "18:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7271, "total_steps": 9627, "loss": 1.7653, "learning_rate": 1.4064005097454635e-05, "epoch": 0.7552716318687026, "percentage": 75.53, "elapsed_time": "2 days, 8:26:52", "remaining_time": "18:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7272, "total_steps": 9627, "loss": 1.6584, "learning_rate": 1.4052662103507214e-05, "epoch": 0.755375506388283, "percentage": 75.54, "elapsed_time": "2 days, 8:27:25", "remaining_time": "18:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7273, "total_steps": 9627, "loss": 1.7567, "learning_rate": 1.4041322937670903e-05, "epoch": 0.7554793809078633, "percentage": 75.55, "elapsed_time": "2 days, 8:27:57", "remaining_time": "18:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7274, "total_steps": 9627, "loss": 1.6985, "learning_rate": 1.4029987601153188e-05, "epoch": 0.7555832554274436, "percentage": 75.56, "elapsed_time": "2 days, 8:28:29", "remaining_time": "18:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7275, "total_steps": 9627, "loss": 1.6191, "learning_rate": 1.4018656095161226e-05, "epoch": 0.755687129947024, "percentage": 75.57, "elapsed_time": "2 days, 8:29:01", "remaining_time": "18:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7276, "total_steps": 9627, "loss": 1.6991, "learning_rate": 1.400732842090174e-05, "epoch": 0.7557910044666043, "percentage": 75.58, "elapsed_time": "2 days, 8:29:33", "remaining_time": "18:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7277, "total_steps": 9627, "loss": 1.8434, "learning_rate": 1.3996004579580995e-05, "epoch": 0.7558948789861847, "percentage": 75.59, "elapsed_time": "2 days, 8:30:05", "remaining_time": "18:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7278, "total_steps": 9627, "loss": 1.7706, "learning_rate": 1.3984684572404938e-05, "epoch": 0.7559987535057651, "percentage": 75.6, "elapsed_time": "2 days, 8:30:38", "remaining_time": "18:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7279, "total_steps": 9627, "loss": 1.6742, "learning_rate": 1.397336840057904e-05, "epoch": 0.7561026280253453, "percentage": 75.61, "elapsed_time": "2 days, 8:31:10", "remaining_time": "18:13:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7280, "total_steps": 9627, "loss": 1.6319, "learning_rate": 1.3962056065308388e-05, "epoch": 0.7562065025449257, "percentage": 75.62, "elapsed_time": "2 days, 8:31:42", "remaining_time": "18:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7281, "total_steps": 9627, "loss": 1.6619, "learning_rate": 1.3950747567797662e-05, "epoch": 0.7563103770645061, "percentage": 75.63, "elapsed_time": "2 days, 8:32:15", "remaining_time": "18:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7282, "total_steps": 9627, "loss": 1.4829, "learning_rate": 1.3939442909251121e-05, "epoch": 0.7564142515840864, "percentage": 75.64, "elapsed_time": "2 days, 8:32:47", "remaining_time": "18:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7283, "total_steps": 9627, "loss": 1.6641, "learning_rate": 1.3928142090872632e-05, "epoch": 0.7565181261036668, "percentage": 75.65, "elapsed_time": "2 days, 8:33:19", "remaining_time": "18:12:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7284, "total_steps": 9627, "loss": 2.0066, "learning_rate": 1.3916845113865618e-05, "epoch": 0.7566220006232471, "percentage": 75.66, "elapsed_time": "2 days, 8:33:52", "remaining_time": "18:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7285, "total_steps": 9627, "loss": 1.6202, "learning_rate": 1.3905551979433157e-05, "epoch": 0.7567258751428275, "percentage": 75.67, "elapsed_time": "2 days, 8:34:24", "remaining_time": "18:11:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7286, "total_steps": 9627, "loss": 1.595, "learning_rate": 1.3894262688777865e-05, "epoch": 0.7568297496624078, "percentage": 75.68, "elapsed_time": "2 days, 8:34:56", "remaining_time": "18:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7287, "total_steps": 9627, "loss": 1.6401, "learning_rate": 1.3882977243101957e-05, "epoch": 0.7569336241819882, "percentage": 75.69, "elapsed_time": "2 days, 8:35:29", "remaining_time": "18:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7288, "total_steps": 9627, "loss": 1.415, "learning_rate": 1.3871695643607252e-05, "epoch": 0.7570374987015686, "percentage": 75.7, "elapsed_time": "2 days, 8:36:01", "remaining_time": "18:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7289, "total_steps": 9627, "loss": 1.7223, "learning_rate": 1.3860417891495154e-05, "epoch": 0.7571413732211488, "percentage": 75.71, "elapsed_time": "2 days, 8:36:33", "remaining_time": "18:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7290, "total_steps": 9627, "loss": 1.558, "learning_rate": 1.3849143987966645e-05, "epoch": 0.7572452477407292, "percentage": 75.72, "elapsed_time": "2 days, 8:37:05", "remaining_time": "18:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7291, "total_steps": 9627, "loss": 1.5861, "learning_rate": 1.38378739342223e-05, "epoch": 0.7573491222603096, "percentage": 75.73, "elapsed_time": "2 days, 8:37:38", "remaining_time": "18:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7292, "total_steps": 9627, "loss": 1.5489, "learning_rate": 1.3826607731462332e-05, "epoch": 0.7574529967798899, "percentage": 75.75, "elapsed_time": "2 days, 8:38:10", "remaining_time": "18:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7293, "total_steps": 9627, "loss": 1.5094, "learning_rate": 1.3815345380886452e-05, "epoch": 0.7575568712994702, "percentage": 75.76, "elapsed_time": "2 days, 8:38:42", "remaining_time": "18:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7294, "total_steps": 9627, "loss": 1.5909, "learning_rate": 1.380408688369405e-05, "epoch": 0.7576607458190506, "percentage": 75.77, "elapsed_time": "2 days, 8:39:14", "remaining_time": "18:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7295, "total_steps": 9627, "loss": 1.6435, "learning_rate": 1.3792832241084058e-05, "epoch": 0.7577646203386309, "percentage": 75.78, "elapsed_time": "2 days, 8:39:47", "remaining_time": "18:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7296, "total_steps": 9627, "loss": 1.6698, "learning_rate": 1.3781581454255005e-05, "epoch": 0.7578684948582113, "percentage": 75.79, "elapsed_time": "2 days, 8:40:19", "remaining_time": "18:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7297, "total_steps": 9627, "loss": 1.6468, "learning_rate": 1.3770334524405015e-05, "epoch": 0.7579723693777917, "percentage": 75.8, "elapsed_time": "2 days, 8:40:51", "remaining_time": "18:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7298, "total_steps": 9627, "loss": 1.7338, "learning_rate": 1.3759091452731792e-05, "epoch": 0.7580762438973719, "percentage": 75.81, "elapsed_time": "2 days, 8:41:23", "remaining_time": "18:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7299, "total_steps": 9627, "loss": 1.6291, "learning_rate": 1.3747852240432641e-05, "epoch": 0.7581801184169523, "percentage": 75.82, "elapsed_time": "2 days, 8:41:54", "remaining_time": "18:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7300, "total_steps": 9627, "loss": 1.8468, "learning_rate": 1.3736616888704434e-05, "epoch": 0.7582839929365327, "percentage": 75.83, "elapsed_time": "2 days, 8:42:26", "remaining_time": "18:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7301, "total_steps": 9627, "loss": 1.6639, "learning_rate": 1.372538539874369e-05, "epoch": 0.758387867456113, "percentage": 75.84, "elapsed_time": "2 days, 8:42:59", "remaining_time": "18:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7302, "total_steps": 9627, "loss": 1.5665, "learning_rate": 1.3714157771746422e-05, "epoch": 0.7584917419756934, "percentage": 75.85, "elapsed_time": "2 days, 8:43:31", "remaining_time": "18:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7303, "total_steps": 9627, "loss": 1.8113, "learning_rate": 1.3702934008908325e-05, "epoch": 0.7585956164952737, "percentage": 75.86, "elapsed_time": "2 days, 8:44:03", "remaining_time": "18:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7304, "total_steps": 9627, "loss": 1.7394, "learning_rate": 1.3691714111424641e-05, "epoch": 0.758699491014854, "percentage": 75.87, "elapsed_time": "2 days, 8:44:35", "remaining_time": "18:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7305, "total_steps": 9627, "loss": 1.6745, "learning_rate": 1.3680498080490161e-05, "epoch": 0.7588033655344344, "percentage": 75.88, "elapsed_time": "2 days, 8:45:07", "remaining_time": "18:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7306, "total_steps": 9627, "loss": 1.6433, "learning_rate": 1.3669285917299347e-05, "epoch": 0.7589072400540148, "percentage": 75.89, "elapsed_time": "2 days, 8:45:39", "remaining_time": "18:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7307, "total_steps": 9627, "loss": 1.5712, "learning_rate": 1.3658077623046195e-05, "epoch": 0.759011114573595, "percentage": 75.9, "elapsed_time": "2 days, 8:46:12", "remaining_time": "18:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7308, "total_steps": 9627, "loss": 1.6891, "learning_rate": 1.3646873198924293e-05, "epoch": 0.7591149890931754, "percentage": 75.91, "elapsed_time": "2 days, 8:46:44", "remaining_time": "18:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7309, "total_steps": 9627, "loss": 1.7747, "learning_rate": 1.3635672646126835e-05, "epoch": 0.7592188636127558, "percentage": 75.92, "elapsed_time": "2 days, 8:47:16", "remaining_time": "18:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7310, "total_steps": 9627, "loss": 1.5922, "learning_rate": 1.3624475965846584e-05, "epoch": 0.7593227381323361, "percentage": 75.93, "elapsed_time": "2 days, 8:47:48", "remaining_time": "18:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7311, "total_steps": 9627, "loss": 1.8192, "learning_rate": 1.3613283159275902e-05, "epoch": 0.7594266126519165, "percentage": 75.94, "elapsed_time": "2 days, 8:48:20", "remaining_time": "17:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7312, "total_steps": 9627, "loss": 1.5317, "learning_rate": 1.3602094227606721e-05, "epoch": 0.7595304871714968, "percentage": 75.95, "elapsed_time": "2 days, 8:48:53", "remaining_time": "17:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7313, "total_steps": 9627, "loss": 1.7496, "learning_rate": 1.3590909172030608e-05, "epoch": 0.7596343616910772, "percentage": 75.96, "elapsed_time": "2 days, 8:49:25", "remaining_time": "17:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7314, "total_steps": 9627, "loss": 1.7095, "learning_rate": 1.3579727993738666e-05, "epoch": 0.7597382362106575, "percentage": 75.97, "elapsed_time": "2 days, 8:49:57", "remaining_time": "17:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7315, "total_steps": 9627, "loss": 1.8207, "learning_rate": 1.3568550693921605e-05, "epoch": 0.7598421107302379, "percentage": 75.98, "elapsed_time": "2 days, 8:50:29", "remaining_time": "17:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7316, "total_steps": 9627, "loss": 1.7672, "learning_rate": 1.3557377273769718e-05, "epoch": 0.7599459852498183, "percentage": 75.99, "elapsed_time": "2 days, 8:51:01", "remaining_time": "17:57:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7317, "total_steps": 9627, "loss": 1.565, "learning_rate": 1.3546207734472882e-05, "epoch": 0.7600498597693985, "percentage": 76.0, "elapsed_time": "2 days, 8:51:34", "remaining_time": "17:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7318, "total_steps": 9627, "loss": 1.7241, "learning_rate": 1.3535042077220578e-05, "epoch": 0.7601537342889789, "percentage": 76.02, "elapsed_time": "2 days, 8:52:05", "remaining_time": "17:56:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7319, "total_steps": 9627, "loss": 1.6718, "learning_rate": 1.3523880303201842e-05, "epoch": 0.7602576088085593, "percentage": 76.03, "elapsed_time": "2 days, 8:52:38", "remaining_time": "17:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7320, "total_steps": 9627, "loss": 1.7467, "learning_rate": 1.3512722413605355e-05, "epoch": 0.7603614833281396, "percentage": 76.04, "elapsed_time": "2 days, 8:53:10", "remaining_time": "17:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7321, "total_steps": 9627, "loss": 1.6112, "learning_rate": 1.3501568409619286e-05, "epoch": 0.76046535784772, "percentage": 76.05, "elapsed_time": "2 days, 8:53:42", "remaining_time": "17:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7322, "total_steps": 9627, "loss": 1.7561, "learning_rate": 1.3490418292431506e-05, "epoch": 0.7605692323673003, "percentage": 76.06, "elapsed_time": "2 days, 8:54:14", "remaining_time": "17:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7323, "total_steps": 9627, "loss": 1.7218, "learning_rate": 1.3479272063229387e-05, "epoch": 0.7606731068868806, "percentage": 76.07, "elapsed_time": "2 days, 8:54:46", "remaining_time": "17:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7324, "total_steps": 9627, "loss": 1.777, "learning_rate": 1.3468129723199919e-05, "epoch": 0.760776981406461, "percentage": 76.08, "elapsed_time": "2 days, 8:55:19", "remaining_time": "17:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7325, "total_steps": 9627, "loss": 1.7544, "learning_rate": 1.3456991273529679e-05, "epoch": 0.7608808559260414, "percentage": 76.09, "elapsed_time": "2 days, 8:55:51", "remaining_time": "17:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7326, "total_steps": 9627, "loss": 1.6227, "learning_rate": 1.344585671540482e-05, "epoch": 0.7609847304456216, "percentage": 76.1, "elapsed_time": "2 days, 8:56:23", "remaining_time": "17:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7327, "total_steps": 9627, "loss": 1.6841, "learning_rate": 1.3434726050011093e-05, "epoch": 0.761088604965202, "percentage": 76.11, "elapsed_time": "2 days, 8:56:56", "remaining_time": "17:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7328, "total_steps": 9627, "loss": 1.6404, "learning_rate": 1.34235992785338e-05, "epoch": 0.7611924794847824, "percentage": 76.12, "elapsed_time": "2 days, 8:57:28", "remaining_time": "17:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7329, "total_steps": 9627, "loss": 1.7414, "learning_rate": 1.3412476402157908e-05, "epoch": 0.7612963540043627, "percentage": 76.13, "elapsed_time": "2 days, 8:58:00", "remaining_time": "17:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7330, "total_steps": 9627, "loss": 1.7274, "learning_rate": 1.3401357422067857e-05, "epoch": 0.7614002285239431, "percentage": 76.14, "elapsed_time": "2 days, 8:58:32", "remaining_time": "17:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7331, "total_steps": 9627, "loss": 1.7611, "learning_rate": 1.3390242339447779e-05, "epoch": 0.7615041030435235, "percentage": 76.15, "elapsed_time": "2 days, 8:59:04", "remaining_time": "17:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7332, "total_steps": 9627, "loss": 1.7494, "learning_rate": 1.3379131155481334e-05, "epoch": 0.7616079775631037, "percentage": 76.16, "elapsed_time": "2 days, 8:59:36", "remaining_time": "17:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7333, "total_steps": 9627, "loss": 1.6216, "learning_rate": 1.3368023871351737e-05, "epoch": 0.7617118520826841, "percentage": 76.17, "elapsed_time": "2 days, 9:00:09", "remaining_time": "17:49:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7334, "total_steps": 9627, "loss": 1.5723, "learning_rate": 1.3356920488241875e-05, "epoch": 0.7618157266022645, "percentage": 76.18, "elapsed_time": "2 days, 9:00:41", "remaining_time": "17:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7335, "total_steps": 9627, "loss": 1.6863, "learning_rate": 1.3345821007334153e-05, "epoch": 0.7619196011218448, "percentage": 76.19, "elapsed_time": "2 days, 9:01:13", "remaining_time": "17:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7336, "total_steps": 9627, "loss": 1.7284, "learning_rate": 1.333472542981058e-05, "epoch": 0.7620234756414251, "percentage": 76.2, "elapsed_time": "2 days, 9:01:46", "remaining_time": "17:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7337, "total_steps": 9627, "loss": 1.5037, "learning_rate": 1.3323633756852749e-05, "epoch": 0.7621273501610055, "percentage": 76.21, "elapsed_time": "2 days, 9:02:17", "remaining_time": "17:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7338, "total_steps": 9627, "loss": 1.5679, "learning_rate": 1.3312545989641823e-05, "epoch": 0.7622312246805859, "percentage": 76.22, "elapsed_time": "2 days, 9:02:50", "remaining_time": "17:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7339, "total_steps": 9627, "loss": 1.6756, "learning_rate": 1.3301462129358605e-05, "epoch": 0.7623350992001662, "percentage": 76.23, "elapsed_time": "2 days, 9:03:22", "remaining_time": "17:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7340, "total_steps": 9627, "loss": 1.8475, "learning_rate": 1.329038217718338e-05, "epoch": 0.7624389737197466, "percentage": 76.24, "elapsed_time": "2 days, 9:03:54", "remaining_time": "17:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7341, "total_steps": 9627, "loss": 1.6682, "learning_rate": 1.3279306134296122e-05, "epoch": 0.7625428482393269, "percentage": 76.25, "elapsed_time": "2 days, 9:04:26", "remaining_time": "17:46:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7342, "total_steps": 9627, "loss": 1.6528, "learning_rate": 1.3268234001876328e-05, "epoch": 0.7626467227589072, "percentage": 76.26, "elapsed_time": "2 days, 9:04:59", "remaining_time": "17:45:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7343, "total_steps": 9627, "loss": 1.5253, "learning_rate": 1.3257165781103093e-05, "epoch": 0.7627505972784876, "percentage": 76.28, "elapsed_time": "2 days, 9:05:31", "remaining_time": "17:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7344, "total_steps": 9627, "loss": 1.4581, "learning_rate": 1.3246101473155098e-05, "epoch": 0.762854471798068, "percentage": 76.29, "elapsed_time": "2 days, 9:06:03", "remaining_time": "17:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7345, "total_steps": 9627, "loss": 1.5694, "learning_rate": 1.3235041079210603e-05, "epoch": 0.7629583463176483, "percentage": 76.3, "elapsed_time": "2 days, 9:06:35", "remaining_time": "17:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7346, "total_steps": 9627, "loss": 1.6775, "learning_rate": 1.3223984600447459e-05, "epoch": 0.7630622208372286, "percentage": 76.31, "elapsed_time": "2 days, 9:07:07", "remaining_time": "17:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7347, "total_steps": 9627, "loss": 1.4226, "learning_rate": 1.3212932038043075e-05, "epoch": 0.763166095356809, "percentage": 76.32, "elapsed_time": "2 days, 9:07:40", "remaining_time": "17:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7348, "total_steps": 9627, "loss": 1.6444, "learning_rate": 1.3201883393174508e-05, "epoch": 0.7632699698763893, "percentage": 76.33, "elapsed_time": "2 days, 9:08:12", "remaining_time": "17:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7349, "total_steps": 9627, "loss": 1.4875, "learning_rate": 1.3190838667018297e-05, "epoch": 0.7633738443959697, "percentage": 76.34, "elapsed_time": "2 days, 9:08:44", "remaining_time": "17:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7350, "total_steps": 9627, "loss": 1.7218, "learning_rate": 1.3179797860750653e-05, "epoch": 0.76347771891555, "percentage": 76.35, "elapsed_time": "2 days, 9:09:17", "remaining_time": "17:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7351, "total_steps": 9627, "loss": 1.7828, "learning_rate": 1.3168760975547335e-05, "epoch": 0.7635815934351303, "percentage": 76.36, "elapsed_time": "2 days, 9:09:49", "remaining_time": "17:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7352, "total_steps": 9627, "loss": 1.7086, "learning_rate": 1.3157728012583675e-05, "epoch": 0.7636854679547107, "percentage": 76.37, "elapsed_time": "2 days, 9:10:21", "remaining_time": "17:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7353, "total_steps": 9627, "loss": 1.72, "learning_rate": 1.3146698973034599e-05, "epoch": 0.7637893424742911, "percentage": 76.38, "elapsed_time": "2 days, 9:10:53", "remaining_time": "17:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7354, "total_steps": 9627, "loss": 1.7184, "learning_rate": 1.3135673858074621e-05, "epoch": 0.7638932169938714, "percentage": 76.39, "elapsed_time": "2 days, 9:11:25", "remaining_time": "17:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7355, "total_steps": 9627, "loss": 1.6402, "learning_rate": 1.3124652668877819e-05, "epoch": 0.7639970915134517, "percentage": 76.4, "elapsed_time": "2 days, 9:11:57", "remaining_time": "17:40:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7356, "total_steps": 9627, "loss": 1.7906, "learning_rate": 1.3113635406617858e-05, "epoch": 0.7641009660330321, "percentage": 76.41, "elapsed_time": "2 days, 9:12:29", "remaining_time": "17:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7357, "total_steps": 9627, "loss": 1.6315, "learning_rate": 1.310262207246803e-05, "epoch": 0.7642048405526124, "percentage": 76.42, "elapsed_time": "2 days, 9:13:02", "remaining_time": "17:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7358, "total_steps": 9627, "loss": 1.7554, "learning_rate": 1.3091612667601111e-05, "epoch": 0.7643087150721928, "percentage": 76.43, "elapsed_time": "2 days, 9:13:34", "remaining_time": "17:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7359, "total_steps": 9627, "loss": 1.5465, "learning_rate": 1.3080607193189559e-05, "epoch": 0.7644125895917732, "percentage": 76.44, "elapsed_time": "2 days, 9:14:07", "remaining_time": "17:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7360, "total_steps": 9627, "loss": 1.6579, "learning_rate": 1.3069605650405375e-05, "epoch": 0.7645164641113534, "percentage": 76.45, "elapsed_time": "2 days, 9:14:38", "remaining_time": "17:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7361, "total_steps": 9627, "loss": 1.5157, "learning_rate": 1.3058608040420095e-05, "epoch": 0.7646203386309338, "percentage": 76.46, "elapsed_time": "2 days, 9:15:10", "remaining_time": "17:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7362, "total_steps": 9627, "loss": 1.6494, "learning_rate": 1.3047614364404914e-05, "epoch": 0.7647242131505142, "percentage": 76.47, "elapsed_time": "2 days, 9:15:43", "remaining_time": "17:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7363, "total_steps": 9627, "loss": 1.6405, "learning_rate": 1.3036624623530552e-05, "epoch": 0.7648280876700946, "percentage": 76.48, "elapsed_time": "2 days, 9:16:15", "remaining_time": "17:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7364, "total_steps": 9627, "loss": 1.5746, "learning_rate": 1.3025638818967373e-05, "epoch": 0.7649319621896749, "percentage": 76.49, "elapsed_time": "2 days, 9:16:47", "remaining_time": "17:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7365, "total_steps": 9627, "loss": 1.7997, "learning_rate": 1.3014656951885229e-05, "epoch": 0.7650358367092552, "percentage": 76.5, "elapsed_time": "2 days, 9:17:19", "remaining_time": "17:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7366, "total_steps": 9627, "loss": 1.52, "learning_rate": 1.3003679023453614e-05, "epoch": 0.7651397112288356, "percentage": 76.51, "elapsed_time": "2 days, 9:17:51", "remaining_time": "17:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7367, "total_steps": 9627, "loss": 1.707, "learning_rate": 1.2992705034841623e-05, "epoch": 0.7652435857484159, "percentage": 76.52, "elapsed_time": "2 days, 9:18:24", "remaining_time": "17:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7368, "total_steps": 9627, "loss": 1.788, "learning_rate": 1.2981734987217853e-05, "epoch": 0.7653474602679963, "percentage": 76.53, "elapsed_time": "2 days, 9:18:56", "remaining_time": "17:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7369, "total_steps": 9627, "loss": 1.6524, "learning_rate": 1.2970768881750567e-05, "epoch": 0.7654513347875767, "percentage": 76.55, "elapsed_time": "2 days, 9:19:28", "remaining_time": "17:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7370, "total_steps": 9627, "loss": 1.6253, "learning_rate": 1.295980671960756e-05, "epoch": 0.7655552093071569, "percentage": 76.56, "elapsed_time": "2 days, 9:20:00", "remaining_time": "17:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7371, "total_steps": 9627, "loss": 1.6816, "learning_rate": 1.2948848501956207e-05, "epoch": 0.7656590838267373, "percentage": 76.57, "elapsed_time": "2 days, 9:20:32", "remaining_time": "17:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7372, "total_steps": 9627, "loss": 1.5858, "learning_rate": 1.2937894229963483e-05, "epoch": 0.7657629583463177, "percentage": 76.58, "elapsed_time": "2 days, 9:21:04", "remaining_time": "17:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7373, "total_steps": 9627, "loss": 1.7703, "learning_rate": 1.2926943904795925e-05, "epoch": 0.765866832865898, "percentage": 76.59, "elapsed_time": "2 days, 9:21:36", "remaining_time": "17:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7374, "total_steps": 9627, "loss": 1.6223, "learning_rate": 1.291599752761966e-05, "epoch": 0.7659707073854783, "percentage": 76.6, "elapsed_time": "2 days, 9:22:08", "remaining_time": "17:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7375, "total_steps": 9627, "loss": 1.6564, "learning_rate": 1.2905055099600378e-05, "epoch": 0.7660745819050587, "percentage": 76.61, "elapsed_time": "2 days, 9:22:40", "remaining_time": "17:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7376, "total_steps": 9627, "loss": 1.5993, "learning_rate": 1.2894116621903402e-05, "epoch": 0.766178456424639, "percentage": 76.62, "elapsed_time": "2 days, 9:23:12", "remaining_time": "17:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7377, "total_steps": 9627, "loss": 1.5434, "learning_rate": 1.2883182095693547e-05, "epoch": 0.7662823309442194, "percentage": 76.63, "elapsed_time": "2 days, 9:23:44", "remaining_time": "17:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7378, "total_steps": 9627, "loss": 1.5887, "learning_rate": 1.2872251522135286e-05, "epoch": 0.7663862054637998, "percentage": 76.64, "elapsed_time": "2 days, 9:24:16", "remaining_time": "17:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7379, "total_steps": 9627, "loss": 1.7188, "learning_rate": 1.286132490239263e-05, "epoch": 0.76649007998338, "percentage": 76.65, "elapsed_time": "2 days, 9:24:48", "remaining_time": "17:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7380, "total_steps": 9627, "loss": 1.869, "learning_rate": 1.2850402237629183e-05, "epoch": 0.7665939545029604, "percentage": 76.66, "elapsed_time": "2 days, 9:25:20", "remaining_time": "17:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7381, "total_steps": 9627, "loss": 1.7155, "learning_rate": 1.2839483529008117e-05, "epoch": 0.7666978290225408, "percentage": 76.67, "elapsed_time": "2 days, 9:25:53", "remaining_time": "17:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7382, "total_steps": 9627, "loss": 1.6919, "learning_rate": 1.2828568777692191e-05, "epoch": 0.7668017035421211, "percentage": 76.68, "elapsed_time": "2 days, 9:26:25", "remaining_time": "17:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7383, "total_steps": 9627, "loss": 1.7123, "learning_rate": 1.2817657984843746e-05, "epoch": 0.7669055780617015, "percentage": 76.69, "elapsed_time": "2 days, 9:26:57", "remaining_time": "17:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7384, "total_steps": 9627, "loss": 1.7498, "learning_rate": 1.280675115162467e-05, "epoch": 0.7670094525812818, "percentage": 76.7, "elapsed_time": "2 days, 9:27:29", "remaining_time": "17:27:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7385, "total_steps": 9627, "loss": 1.6622, "learning_rate": 1.2795848279196515e-05, "epoch": 0.7671133271008621, "percentage": 76.71, "elapsed_time": "2 days, 9:28:01", "remaining_time": "17:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7386, "total_steps": 9627, "loss": 1.7493, "learning_rate": 1.2784949368720295e-05, "epoch": 0.7672172016204425, "percentage": 76.72, "elapsed_time": "2 days, 9:28:34", "remaining_time": "17:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7387, "total_steps": 9627, "loss": 1.767, "learning_rate": 1.2774054421356668e-05, "epoch": 0.7673210761400229, "percentage": 76.73, "elapsed_time": "2 days, 9:29:06", "remaining_time": "17:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7388, "total_steps": 9627, "loss": 1.7475, "learning_rate": 1.2763163438265896e-05, "epoch": 0.7674249506596031, "percentage": 76.74, "elapsed_time": "2 days, 9:29:38", "remaining_time": "17:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7389, "total_steps": 9627, "loss": 1.756, "learning_rate": 1.2752276420607735e-05, "epoch": 0.7675288251791835, "percentage": 76.75, "elapsed_time": "2 days, 9:30:11", "remaining_time": "17:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7390, "total_steps": 9627, "loss": 1.8209, "learning_rate": 1.2741393369541604e-05, "epoch": 0.7676326996987639, "percentage": 76.76, "elapsed_time": "2 days, 9:30:43", "remaining_time": "17:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7391, "total_steps": 9627, "loss": 1.5466, "learning_rate": 1.2730514286226435e-05, "epoch": 0.7677365742183443, "percentage": 76.77, "elapsed_time": "2 days, 9:31:15", "remaining_time": "17:24:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7392, "total_steps": 9627, "loss": 1.6497, "learning_rate": 1.2719639171820812e-05, "epoch": 0.7678404487379246, "percentage": 76.78, "elapsed_time": "2 days, 9:31:47", "remaining_time": "17:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7393, "total_steps": 9627, "loss": 1.3777, "learning_rate": 1.2708768027482804e-05, "epoch": 0.767944323257505, "percentage": 76.79, "elapsed_time": "2 days, 9:32:19", "remaining_time": "17:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7394, "total_steps": 9627, "loss": 1.6038, "learning_rate": 1.2697900854370103e-05, "epoch": 0.7680481977770853, "percentage": 76.8, "elapsed_time": "2 days, 9:32:51", "remaining_time": "17:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7395, "total_steps": 9627, "loss": 1.6013, "learning_rate": 1.2687037653640026e-05, "epoch": 0.7681520722966656, "percentage": 76.82, "elapsed_time": "2 days, 9:33:24", "remaining_time": "17:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7396, "total_steps": 9627, "loss": 1.6607, "learning_rate": 1.2676178426449353e-05, "epoch": 0.768255946816246, "percentage": 76.83, "elapsed_time": "2 days, 9:33:56", "remaining_time": "17:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7397, "total_steps": 9627, "loss": 1.659, "learning_rate": 1.2665323173954557e-05, "epoch": 0.7683598213358264, "percentage": 76.84, "elapsed_time": "2 days, 9:34:28", "remaining_time": "17:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7398, "total_steps": 9627, "loss": 1.6306, "learning_rate": 1.2654471897311627e-05, "epoch": 0.7684636958554066, "percentage": 76.85, "elapsed_time": "2 days, 9:35:00", "remaining_time": "17:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7399, "total_steps": 9627, "loss": 1.5395, "learning_rate": 1.2643624597676123e-05, "epoch": 0.768567570374987, "percentage": 76.86, "elapsed_time": "2 days, 9:35:32", "remaining_time": "17:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7400, "total_steps": 9627, "loss": 1.6195, "learning_rate": 1.2632781276203216e-05, "epoch": 0.7686714448945674, "percentage": 76.87, "elapsed_time": "2 days, 9:36:05", "remaining_time": "17:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7401, "total_steps": 9627, "loss": 1.5897, "learning_rate": 1.2621941934047626e-05, "epoch": 0.7687753194141477, "percentage": 76.88, "elapsed_time": "2 days, 9:36:37", "remaining_time": "17:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7402, "total_steps": 9627, "loss": 1.4635, "learning_rate": 1.2611106572363663e-05, "epoch": 0.7688791939337281, "percentage": 76.89, "elapsed_time": "2 days, 9:37:08", "remaining_time": "17:19:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7403, "total_steps": 9627, "loss": 1.6104, "learning_rate": 1.2600275192305184e-05, "epoch": 0.7689830684533084, "percentage": 76.9, "elapsed_time": "2 days, 9:37:41", "remaining_time": "17:18:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7404, "total_steps": 9627, "loss": 1.7406, "learning_rate": 1.2589447795025699e-05, "epoch": 0.7690869429728887, "percentage": 76.91, "elapsed_time": "2 days, 9:38:13", "remaining_time": "17:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7405, "total_steps": 9627, "loss": 1.7893, "learning_rate": 1.2578624381678183e-05, "epoch": 0.7691908174924691, "percentage": 76.92, "elapsed_time": "2 days, 9:38:45", "remaining_time": "17:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7406, "total_steps": 9627, "loss": 1.5755, "learning_rate": 1.2567804953415286e-05, "epoch": 0.7692946920120495, "percentage": 76.93, "elapsed_time": "2 days, 9:39:17", "remaining_time": "17:17:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7407, "total_steps": 9627, "loss": 1.6138, "learning_rate": 1.2556989511389183e-05, "epoch": 0.7693985665316297, "percentage": 76.94, "elapsed_time": "2 days, 9:39:50", "remaining_time": "17:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7408, "total_steps": 9627, "loss": 1.5875, "learning_rate": 1.2546178056751623e-05, "epoch": 0.7695024410512101, "percentage": 76.95, "elapsed_time": "2 days, 9:40:22", "remaining_time": "17:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7409, "total_steps": 9627, "loss": 1.5919, "learning_rate": 1.2535370590653955e-05, "epoch": 0.7696063155707905, "percentage": 76.96, "elapsed_time": "2 days, 9:40:54", "remaining_time": "17:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7410, "total_steps": 9627, "loss": 1.6622, "learning_rate": 1.2524567114247082e-05, "epoch": 0.7697101900903708, "percentage": 76.97, "elapsed_time": "2 days, 9:41:26", "remaining_time": "17:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7411, "total_steps": 9627, "loss": 1.5001, "learning_rate": 1.2513767628681489e-05, "epoch": 0.7698140646099512, "percentage": 76.98, "elapsed_time": "2 days, 9:41:58", "remaining_time": "17:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7412, "total_steps": 9627, "loss": 1.6887, "learning_rate": 1.2502972135107227e-05, "epoch": 0.7699179391295315, "percentage": 76.99, "elapsed_time": "2 days, 9:42:30", "remaining_time": "17:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7413, "total_steps": 9627, "loss": 1.6159, "learning_rate": 1.2492180634673978e-05, "epoch": 0.7700218136491118, "percentage": 77.0, "elapsed_time": "2 days, 9:43:02", "remaining_time": "17:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7414, "total_steps": 9627, "loss": 1.6015, "learning_rate": 1.24813931285309e-05, "epoch": 0.7701256881686922, "percentage": 77.01, "elapsed_time": "2 days, 9:43:35", "remaining_time": "17:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7415, "total_steps": 9627, "loss": 1.3466, "learning_rate": 1.2470609617826784e-05, "epoch": 0.7702295626882726, "percentage": 77.02, "elapsed_time": "2 days, 9:44:07", "remaining_time": "17:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7416, "total_steps": 9627, "loss": 1.7882, "learning_rate": 1.2459830103710019e-05, "epoch": 0.770333437207853, "percentage": 77.03, "elapsed_time": "2 days, 9:44:38", "remaining_time": "17:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7417, "total_steps": 9627, "loss": 1.6455, "learning_rate": 1.2449054587328519e-05, "epoch": 0.7704373117274332, "percentage": 77.04, "elapsed_time": "2 days, 9:45:11", "remaining_time": "17:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7418, "total_steps": 9627, "loss": 1.7585, "learning_rate": 1.2438283069829799e-05, "epoch": 0.7705411862470136, "percentage": 77.05, "elapsed_time": "2 days, 9:45:43", "remaining_time": "17:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7419, "total_steps": 9627, "loss": 1.502, "learning_rate": 1.2427515552360924e-05, "epoch": 0.770645060766594, "percentage": 77.06, "elapsed_time": "2 days, 9:46:15", "remaining_time": "17:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7420, "total_steps": 9627, "loss": 1.7382, "learning_rate": 1.2416752036068596e-05, "epoch": 0.7707489352861743, "percentage": 77.07, "elapsed_time": "2 days, 9:46:48", "remaining_time": "17:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7421, "total_steps": 9627, "loss": 1.5567, "learning_rate": 1.2405992522099002e-05, "epoch": 0.7708528098057547, "percentage": 77.09, "elapsed_time": "2 days, 9:47:20", "remaining_time": "17:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7422, "total_steps": 9627, "loss": 1.8138, "learning_rate": 1.2395237011597949e-05, "epoch": 0.770956684325335, "percentage": 77.1, "elapsed_time": "2 days, 9:47:52", "remaining_time": "17:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7423, "total_steps": 9627, "loss": 1.6393, "learning_rate": 1.2384485505710847e-05, "epoch": 0.7710605588449153, "percentage": 77.11, "elapsed_time": "2 days, 9:48:24", "remaining_time": "17:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7424, "total_steps": 9627, "loss": 1.5276, "learning_rate": 1.2373738005582603e-05, "epoch": 0.7711644333644957, "percentage": 77.12, "elapsed_time": "2 days, 9:48:56", "remaining_time": "17:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7425, "total_steps": 9627, "loss": 1.7476, "learning_rate": 1.2362994512357779e-05, "epoch": 0.7712683078840761, "percentage": 77.13, "elapsed_time": "2 days, 9:49:28", "remaining_time": "17:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7426, "total_steps": 9627, "loss": 1.8217, "learning_rate": 1.235225502718046e-05, "epoch": 0.7713721824036563, "percentage": 77.14, "elapsed_time": "2 days, 9:50:01", "remaining_time": "17:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7427, "total_steps": 9627, "loss": 1.5592, "learning_rate": 1.2341519551194314e-05, "epoch": 0.7714760569232367, "percentage": 77.15, "elapsed_time": "2 days, 9:50:33", "remaining_time": "17:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7428, "total_steps": 9627, "loss": 1.7773, "learning_rate": 1.2330788085542589e-05, "epoch": 0.7715799314428171, "percentage": 77.16, "elapsed_time": "2 days, 9:51:04", "remaining_time": "17:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7429, "total_steps": 9627, "loss": 1.6483, "learning_rate": 1.2320060631368103e-05, "epoch": 0.7716838059623974, "percentage": 77.17, "elapsed_time": "2 days, 9:51:36", "remaining_time": "17:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7430, "total_steps": 9627, "loss": 1.5655, "learning_rate": 1.2309337189813242e-05, "epoch": 0.7717876804819778, "percentage": 77.18, "elapsed_time": "2 days, 9:52:09", "remaining_time": "17:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7431, "total_steps": 9627, "loss": 1.5819, "learning_rate": 1.229861776201996e-05, "epoch": 0.7718915550015581, "percentage": 77.19, "elapsed_time": "2 days, 9:52:41", "remaining_time": "17:06:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7432, "total_steps": 9627, "loss": 1.5958, "learning_rate": 1.2287902349129832e-05, "epoch": 0.7719954295211384, "percentage": 77.2, "elapsed_time": "2 days, 9:53:13", "remaining_time": "17:05:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7433, "total_steps": 9627, "loss": 1.6924, "learning_rate": 1.2277190952283912e-05, "epoch": 0.7720993040407188, "percentage": 77.21, "elapsed_time": "2 days, 9:53:45", "remaining_time": "17:05:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7434, "total_steps": 9627, "loss": 1.6906, "learning_rate": 1.2266483572622916e-05, "epoch": 0.7722031785602992, "percentage": 77.22, "elapsed_time": "2 days, 9:54:17", "remaining_time": "17:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7435, "total_steps": 9627, "loss": 1.718, "learning_rate": 1.2255780211287094e-05, "epoch": 0.7723070530798795, "percentage": 77.23, "elapsed_time": "2 days, 9:54:48", "remaining_time": "17:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7436, "total_steps": 9627, "loss": 1.636, "learning_rate": 1.2245080869416258e-05, "epoch": 0.7724109275994598, "percentage": 77.24, "elapsed_time": "2 days, 9:55:20", "remaining_time": "17:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7437, "total_steps": 9627, "loss": 1.7592, "learning_rate": 1.2234385548149813e-05, "epoch": 0.7725148021190402, "percentage": 77.25, "elapsed_time": "2 days, 9:55:53", "remaining_time": "17:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7438, "total_steps": 9627, "loss": 1.7048, "learning_rate": 1.2223694248626721e-05, "epoch": 0.7726186766386205, "percentage": 77.26, "elapsed_time": "2 days, 9:56:25", "remaining_time": "17:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7439, "total_steps": 9627, "loss": 1.808, "learning_rate": 1.2213006971985524e-05, "epoch": 0.7727225511582009, "percentage": 77.27, "elapsed_time": "2 days, 9:56:56", "remaining_time": "17:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7440, "total_steps": 9627, "loss": 1.6744, "learning_rate": 1.2202323719364323e-05, "epoch": 0.7728264256777813, "percentage": 77.28, "elapsed_time": "2 days, 9:57:28", "remaining_time": "17:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7441, "total_steps": 9627, "loss": 1.5021, "learning_rate": 1.2191644491900822e-05, "epoch": 0.7729303001973616, "percentage": 77.29, "elapsed_time": "2 days, 9:58:00", "remaining_time": "17:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7442, "total_steps": 9627, "loss": 1.7047, "learning_rate": 1.2180969290732286e-05, "epoch": 0.7730341747169419, "percentage": 77.3, "elapsed_time": "2 days, 9:58:32", "remaining_time": "17:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7443, "total_steps": 9627, "loss": 1.5239, "learning_rate": 1.2170298116995493e-05, "epoch": 0.7731380492365223, "percentage": 77.31, "elapsed_time": "2 days, 9:59:05", "remaining_time": "17:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7444, "total_steps": 9627, "loss": 1.4872, "learning_rate": 1.2159630971826879e-05, "epoch": 0.7732419237561027, "percentage": 77.32, "elapsed_time": "2 days, 9:59:36", "remaining_time": "17:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7445, "total_steps": 9627, "loss": 1.813, "learning_rate": 1.2148967856362398e-05, "epoch": 0.773345798275683, "percentage": 77.33, "elapsed_time": "2 days, 10:00:09", "remaining_time": "16:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7446, "total_steps": 9627, "loss": 1.5849, "learning_rate": 1.2138308771737594e-05, "epoch": 0.7734496727952633, "percentage": 77.34, "elapsed_time": "2 days, 10:00:41", "remaining_time": "16:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7447, "total_steps": 9627, "loss": 1.7053, "learning_rate": 1.2127653719087572e-05, "epoch": 0.7735535473148437, "percentage": 77.36, "elapsed_time": "2 days, 10:01:12", "remaining_time": "16:59:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7448, "total_steps": 9627, "loss": 1.7733, "learning_rate": 1.2117002699547015e-05, "epoch": 0.773657421834424, "percentage": 77.37, "elapsed_time": "2 days, 10:01:44", "remaining_time": "16:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7449, "total_steps": 9627, "loss": 1.7352, "learning_rate": 1.2106355714250172e-05, "epoch": 0.7737612963540044, "percentage": 77.38, "elapsed_time": "2 days, 10:02:16", "remaining_time": "16:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7450, "total_steps": 9627, "loss": 1.9348, "learning_rate": 1.2095712764330847e-05, "epoch": 0.7738651708735848, "percentage": 77.39, "elapsed_time": "2 days, 10:02:48", "remaining_time": "16:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7451, "total_steps": 9627, "loss": 1.659, "learning_rate": 1.2085073850922479e-05, "epoch": 0.773969045393165, "percentage": 77.4, "elapsed_time": "2 days, 10:03:20", "remaining_time": "16:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7452, "total_steps": 9627, "loss": 1.8332, "learning_rate": 1.2074438975157964e-05, "epoch": 0.7740729199127454, "percentage": 77.41, "elapsed_time": "2 days, 10:03:53", "remaining_time": "16:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7453, "total_steps": 9627, "loss": 1.3752, "learning_rate": 1.2063808138169891e-05, "epoch": 0.7741767944323258, "percentage": 77.42, "elapsed_time": "2 days, 10:04:25", "remaining_time": "16:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7454, "total_steps": 9627, "loss": 1.632, "learning_rate": 1.205318134109033e-05, "epoch": 0.7742806689519061, "percentage": 77.43, "elapsed_time": "2 days, 10:04:56", "remaining_time": "16:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7455, "total_steps": 9627, "loss": 1.5544, "learning_rate": 1.2042558585050961e-05, "epoch": 0.7743845434714864, "percentage": 77.44, "elapsed_time": "2 days, 10:05:28", "remaining_time": "16:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7456, "total_steps": 9627, "loss": 1.8892, "learning_rate": 1.2031939871183023e-05, "epoch": 0.7744884179910668, "percentage": 77.45, "elapsed_time": "2 days, 10:06:00", "remaining_time": "16:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7457, "total_steps": 9627, "loss": 1.6822, "learning_rate": 1.2021325200617329e-05, "epoch": 0.7745922925106471, "percentage": 77.46, "elapsed_time": "2 days, 10:06:33", "remaining_time": "16:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7458, "total_steps": 9627, "loss": 1.6621, "learning_rate": 1.2010714574484255e-05, "epoch": 0.7746961670302275, "percentage": 77.47, "elapsed_time": "2 days, 10:07:05", "remaining_time": "16:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7459, "total_steps": 9627, "loss": 1.5825, "learning_rate": 1.2000107993913739e-05, "epoch": 0.7748000415498079, "percentage": 77.48, "elapsed_time": "2 days, 10:07:37", "remaining_time": "16:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7460, "total_steps": 9627, "loss": 1.573, "learning_rate": 1.1989505460035333e-05, "epoch": 0.7749039160693881, "percentage": 77.49, "elapsed_time": "2 days, 10:08:09", "remaining_time": "16:53:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7461, "total_steps": 9627, "loss": 1.68, "learning_rate": 1.1978906973978083e-05, "epoch": 0.7750077905889685, "percentage": 77.5, "elapsed_time": "2 days, 10:08:41", "remaining_time": "16:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7462, "total_steps": 9627, "loss": 1.5407, "learning_rate": 1.1968312536870668e-05, "epoch": 0.7751116651085489, "percentage": 77.51, "elapsed_time": "2 days, 10:09:13", "remaining_time": "16:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7463, "total_steps": 9627, "loss": 1.4685, "learning_rate": 1.1957722149841317e-05, "epoch": 0.7752155396281292, "percentage": 77.52, "elapsed_time": "2 days, 10:09:46", "remaining_time": "16:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7464, "total_steps": 9627, "loss": 1.4937, "learning_rate": 1.1947135814017812e-05, "epoch": 0.7753194141477096, "percentage": 77.53, "elapsed_time": "2 days, 10:10:18", "remaining_time": "16:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7465, "total_steps": 9627, "loss": 1.5106, "learning_rate": 1.1936553530527523e-05, "epoch": 0.7754232886672899, "percentage": 77.54, "elapsed_time": "2 days, 10:10:50", "remaining_time": "16:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7466, "total_steps": 9627, "loss": 1.4574, "learning_rate": 1.1925975300497371e-05, "epoch": 0.7755271631868702, "percentage": 77.55, "elapsed_time": "2 days, 10:11:21", "remaining_time": "16:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7467, "total_steps": 9627, "loss": 1.749, "learning_rate": 1.1915401125053866e-05, "epoch": 0.7756310377064506, "percentage": 77.56, "elapsed_time": "2 days, 10:11:53", "remaining_time": "16:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7468, "total_steps": 9627, "loss": 1.5465, "learning_rate": 1.1904831005323053e-05, "epoch": 0.775734912226031, "percentage": 77.57, "elapsed_time": "2 days, 10:12:25", "remaining_time": "16:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7469, "total_steps": 9627, "loss": 1.487, "learning_rate": 1.18942649424306e-05, "epoch": 0.7758387867456114, "percentage": 77.58, "elapsed_time": "2 days, 10:12:57", "remaining_time": "16:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7470, "total_steps": 9627, "loss": 1.6149, "learning_rate": 1.1883702937501705e-05, "epoch": 0.7759426612651916, "percentage": 77.59, "elapsed_time": "2 days, 10:13:29", "remaining_time": "16:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7471, "total_steps": 9627, "loss": 1.567, "learning_rate": 1.1873144991661106e-05, "epoch": 0.776046535784772, "percentage": 77.6, "elapsed_time": "2 days, 10:14:02", "remaining_time": "16:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7472, "total_steps": 9627, "loss": 1.7902, "learning_rate": 1.1862591106033178e-05, "epoch": 0.7761504103043524, "percentage": 77.62, "elapsed_time": "2 days, 10:14:34", "remaining_time": "16:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7473, "total_steps": 9627, "loss": 1.6518, "learning_rate": 1.185204128174181e-05, "epoch": 0.7762542848239327, "percentage": 77.63, "elapsed_time": "2 days, 10:15:05", "remaining_time": "16:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7474, "total_steps": 9627, "loss": 1.6971, "learning_rate": 1.1841495519910485e-05, "epoch": 0.776358159343513, "percentage": 77.64, "elapsed_time": "2 days, 10:15:38", "remaining_time": "16:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7475, "total_steps": 9627, "loss": 1.6166, "learning_rate": 1.1830953821662232e-05, "epoch": 0.7764620338630934, "percentage": 77.65, "elapsed_time": "2 days, 10:16:10", "remaining_time": "16:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7476, "total_steps": 9627, "loss": 1.611, "learning_rate": 1.182041618811967e-05, "epoch": 0.7765659083826737, "percentage": 77.66, "elapsed_time": "2 days, 10:16:41", "remaining_time": "16:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7477, "total_steps": 9627, "loss": 1.586, "learning_rate": 1.1809882620404972e-05, "epoch": 0.7766697829022541, "percentage": 77.67, "elapsed_time": "2 days, 10:17:13", "remaining_time": "16:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7478, "total_steps": 9627, "loss": 1.7642, "learning_rate": 1.1799353119639867e-05, "epoch": 0.7767736574218345, "percentage": 77.68, "elapsed_time": "2 days, 10:17:45", "remaining_time": "16:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7479, "total_steps": 9627, "loss": 1.6689, "learning_rate": 1.1788827686945708e-05, "epoch": 0.7768775319414147, "percentage": 77.69, "elapsed_time": "2 days, 10:18:18", "remaining_time": "16:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7480, "total_steps": 9627, "loss": 1.8645, "learning_rate": 1.177830632344331e-05, "epoch": 0.7769814064609951, "percentage": 77.7, "elapsed_time": "2 days, 10:18:50", "remaining_time": "16:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7481, "total_steps": 9627, "loss": 1.6404, "learning_rate": 1.1767789030253168e-05, "epoch": 0.7770852809805755, "percentage": 77.71, "elapsed_time": "2 days, 10:19:22", "remaining_time": "16:43:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7482, "total_steps": 9627, "loss": 1.7545, "learning_rate": 1.1757275808495266e-05, "epoch": 0.7771891555001558, "percentage": 77.72, "elapsed_time": "2 days, 10:19:55", "remaining_time": "16:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7483, "total_steps": 9627, "loss": 1.6952, "learning_rate": 1.1746766659289188e-05, "epoch": 0.7772930300197362, "percentage": 77.73, "elapsed_time": "2 days, 10:20:26", "remaining_time": "16:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7484, "total_steps": 9627, "loss": 1.5784, "learning_rate": 1.1736261583754072e-05, "epoch": 0.7773969045393165, "percentage": 77.74, "elapsed_time": "2 days, 10:20:58", "remaining_time": "16:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7485, "total_steps": 9627, "loss": 1.7849, "learning_rate": 1.1725760583008633e-05, "epoch": 0.7775007790588968, "percentage": 77.75, "elapsed_time": "2 days, 10:21:31", "remaining_time": "16:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7486, "total_steps": 9627, "loss": 1.6088, "learning_rate": 1.171526365817114e-05, "epoch": 0.7776046535784772, "percentage": 77.76, "elapsed_time": "2 days, 10:22:02", "remaining_time": "16:41:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7487, "total_steps": 9627, "loss": 1.5425, "learning_rate": 1.1704770810359417e-05, "epoch": 0.7777085280980576, "percentage": 77.77, "elapsed_time": "2 days, 10:22:35", "remaining_time": "16:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7488, "total_steps": 9627, "loss": 1.5142, "learning_rate": 1.1694282040690919e-05, "epoch": 0.7778124026176378, "percentage": 77.78, "elapsed_time": "2 days, 10:23:07", "remaining_time": "16:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7489, "total_steps": 9627, "loss": 1.4844, "learning_rate": 1.168379735028256e-05, "epoch": 0.7779162771372182, "percentage": 77.79, "elapsed_time": "2 days, 10:23:38", "remaining_time": "16:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7490, "total_steps": 9627, "loss": 1.647, "learning_rate": 1.1673316740250916e-05, "epoch": 0.7780201516567986, "percentage": 77.8, "elapsed_time": "2 days, 10:24:11", "remaining_time": "16:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7491, "total_steps": 9627, "loss": 1.6546, "learning_rate": 1.1662840211712084e-05, "epoch": 0.7781240261763789, "percentage": 77.81, "elapsed_time": "2 days, 10:24:42", "remaining_time": "16:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7492, "total_steps": 9627, "loss": 1.7317, "learning_rate": 1.1652367765781724e-05, "epoch": 0.7782279006959593, "percentage": 77.82, "elapsed_time": "2 days, 10:25:14", "remaining_time": "16:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7493, "total_steps": 9627, "loss": 1.6996, "learning_rate": 1.164189940357508e-05, "epoch": 0.7783317752155396, "percentage": 77.83, "elapsed_time": "2 days, 10:25:46", "remaining_time": "16:38:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7494, "total_steps": 9627, "loss": 1.5694, "learning_rate": 1.1631435126206924e-05, "epoch": 0.77843564973512, "percentage": 77.84, "elapsed_time": "2 days, 10:26:18", "remaining_time": "16:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7495, "total_steps": 9627, "loss": 1.5474, "learning_rate": 1.1620974934791673e-05, "epoch": 0.7785395242547003, "percentage": 77.85, "elapsed_time": "2 days, 10:26:50", "remaining_time": "16:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7496, "total_steps": 9627, "loss": 1.3948, "learning_rate": 1.1610518830443195e-05, "epoch": 0.7786433987742807, "percentage": 77.86, "elapsed_time": "2 days, 10:27:21", "remaining_time": "16:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7497, "total_steps": 9627, "loss": 1.7093, "learning_rate": 1.1600066814275028e-05, "epoch": 0.7787472732938611, "percentage": 77.87, "elapsed_time": "2 days, 10:27:54", "remaining_time": "16:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7498, "total_steps": 9627, "loss": 1.6267, "learning_rate": 1.1589618887400223e-05, "epoch": 0.7788511478134413, "percentage": 77.89, "elapsed_time": "2 days, 10:28:25", "remaining_time": "16:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7499, "total_steps": 9627, "loss": 1.4813, "learning_rate": 1.1579175050931369e-05, "epoch": 0.7789550223330217, "percentage": 77.9, "elapsed_time": "2 days, 10:28:58", "remaining_time": "16:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7500, "total_steps": 9627, "loss": 1.6934, "learning_rate": 1.1568735305980693e-05, "epoch": 0.7790588968526021, "percentage": 77.91, "elapsed_time": "2 days, 10:29:29", "remaining_time": "16:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7501, "total_steps": 9627, "loss": 1.7808, "learning_rate": 1.1558299653659931e-05, "epoch": 0.7791627713721824, "percentage": 77.92, "elapsed_time": "2 days, 10:30:02", "remaining_time": "16:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7502, "total_steps": 9627, "loss": 1.5262, "learning_rate": 1.15478680950804e-05, "epoch": 0.7792666458917628, "percentage": 77.93, "elapsed_time": "2 days, 10:30:34", "remaining_time": "16:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7503, "total_steps": 9627, "loss": 1.6568, "learning_rate": 1.1537440631352975e-05, "epoch": 0.7793705204113431, "percentage": 77.94, "elapsed_time": "2 days, 10:31:06", "remaining_time": "16:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7504, "total_steps": 9627, "loss": 1.5999, "learning_rate": 1.1527017263588108e-05, "epoch": 0.7794743949309234, "percentage": 77.95, "elapsed_time": "2 days, 10:31:39", "remaining_time": "16:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7505, "total_steps": 9627, "loss": 1.4227, "learning_rate": 1.15165979928958e-05, "epoch": 0.7795782694505038, "percentage": 77.96, "elapsed_time": "2 days, 10:32:11", "remaining_time": "16:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7506, "total_steps": 9627, "loss": 1.6902, "learning_rate": 1.1506182820385608e-05, "epoch": 0.7796821439700842, "percentage": 77.97, "elapsed_time": "2 days, 10:32:41", "remaining_time": "16:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7507, "total_steps": 9627, "loss": 1.543, "learning_rate": 1.149577174716671e-05, "epoch": 0.7797860184896644, "percentage": 77.98, "elapsed_time": "2 days, 10:33:14", "remaining_time": "16:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7508, "total_steps": 9627, "loss": 1.6154, "learning_rate": 1.148536477434775e-05, "epoch": 0.7798898930092448, "percentage": 77.99, "elapsed_time": "2 days, 10:33:45", "remaining_time": "16:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7509, "total_steps": 9627, "loss": 1.6337, "learning_rate": 1.1474961903037029e-05, "epoch": 0.7799937675288252, "percentage": 78.0, "elapsed_time": "2 days, 10:34:17", "remaining_time": "16:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7510, "total_steps": 9627, "loss": 1.6047, "learning_rate": 1.146456313434236e-05, "epoch": 0.7800976420484055, "percentage": 78.01, "elapsed_time": "2 days, 10:34:49", "remaining_time": "16:30:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7511, "total_steps": 9627, "loss": 1.5502, "learning_rate": 1.145416846937113e-05, "epoch": 0.7802015165679859, "percentage": 78.02, "elapsed_time": "2 days, 10:35:20", "remaining_time": "16:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7512, "total_steps": 9627, "loss": 1.8176, "learning_rate": 1.1443777909230286e-05, "epoch": 0.7803053910875662, "percentage": 78.03, "elapsed_time": "2 days, 10:35:52", "remaining_time": "16:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7513, "total_steps": 9627, "loss": 1.6699, "learning_rate": 1.1433391455026343e-05, "epoch": 0.7804092656071465, "percentage": 78.04, "elapsed_time": "2 days, 10:36:24", "remaining_time": "16:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7514, "total_steps": 9627, "loss": 1.9029, "learning_rate": 1.1423009107865384e-05, "epoch": 0.7805131401267269, "percentage": 78.05, "elapsed_time": "2 days, 10:36:56", "remaining_time": "16:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7515, "total_steps": 9627, "loss": 1.6599, "learning_rate": 1.1412630868853024e-05, "epoch": 0.7806170146463073, "percentage": 78.06, "elapsed_time": "2 days, 10:37:26", "remaining_time": "16:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7516, "total_steps": 9627, "loss": 1.9605, "learning_rate": 1.1402256739094513e-05, "epoch": 0.7807208891658876, "percentage": 78.07, "elapsed_time": "2 days, 10:37:58", "remaining_time": "16:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7517, "total_steps": 9627, "loss": 1.6042, "learning_rate": 1.1391886719694561e-05, "epoch": 0.7808247636854679, "percentage": 78.08, "elapsed_time": "2 days, 10:38:30", "remaining_time": "16:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7518, "total_steps": 9627, "loss": 1.6724, "learning_rate": 1.1381520811757529e-05, "epoch": 0.7809286382050483, "percentage": 78.09, "elapsed_time": "2 days, 10:39:02", "remaining_time": "16:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7519, "total_steps": 9627, "loss": 1.55, "learning_rate": 1.1371159016387296e-05, "epoch": 0.7810325127246287, "percentage": 78.1, "elapsed_time": "2 days, 10:39:34", "remaining_time": "16:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7520, "total_steps": 9627, "loss": 1.6557, "learning_rate": 1.136080133468731e-05, "epoch": 0.781136387244209, "percentage": 78.11, "elapsed_time": "2 days, 10:40:06", "remaining_time": "16:26:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7521, "total_steps": 9627, "loss": 1.642, "learning_rate": 1.1350447767760586e-05, "epoch": 0.7812402617637894, "percentage": 78.12, "elapsed_time": "2 days, 10:40:38", "remaining_time": "16:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7522, "total_steps": 9627, "loss": 1.6731, "learning_rate": 1.134009831670968e-05, "epoch": 0.7813441362833697, "percentage": 78.13, "elapsed_time": "2 days, 10:41:09", "remaining_time": "16:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7523, "total_steps": 9627, "loss": 1.6211, "learning_rate": 1.1329752982636776e-05, "epoch": 0.78144801080295, "percentage": 78.14, "elapsed_time": "2 days, 10:41:41", "remaining_time": "16:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7524, "total_steps": 9627, "loss": 1.5965, "learning_rate": 1.1319411766643512e-05, "epoch": 0.7815518853225304, "percentage": 78.16, "elapsed_time": "2 days, 10:42:13", "remaining_time": "16:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7525, "total_steps": 9627, "loss": 1.7404, "learning_rate": 1.1309074669831189e-05, "epoch": 0.7816557598421108, "percentage": 78.17, "elapsed_time": "2 days, 10:42:44", "remaining_time": "16:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7526, "total_steps": 9627, "loss": 1.6904, "learning_rate": 1.1298741693300624e-05, "epoch": 0.781759634361691, "percentage": 78.18, "elapsed_time": "2 days, 10:43:16", "remaining_time": "16:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7527, "total_steps": 9627, "loss": 1.8278, "learning_rate": 1.1288412838152157e-05, "epoch": 0.7818635088812714, "percentage": 78.19, "elapsed_time": "2 days, 10:43:47", "remaining_time": "16:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7528, "total_steps": 9627, "loss": 1.714, "learning_rate": 1.1278088105485778e-05, "epoch": 0.7819673834008518, "percentage": 78.2, "elapsed_time": "2 days, 10:44:19", "remaining_time": "16:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7529, "total_steps": 9627, "loss": 1.6401, "learning_rate": 1.1267767496400972e-05, "epoch": 0.7820712579204321, "percentage": 78.21, "elapsed_time": "2 days, 10:44:51", "remaining_time": "16:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7530, "total_steps": 9627, "loss": 1.6266, "learning_rate": 1.1257451011996805e-05, "epoch": 0.7821751324400125, "percentage": 78.22, "elapsed_time": "2 days, 10:45:23", "remaining_time": "16:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7531, "total_steps": 9627, "loss": 1.6743, "learning_rate": 1.1247138653371903e-05, "epoch": 0.7822790069595928, "percentage": 78.23, "elapsed_time": "2 days, 10:45:56", "remaining_time": "16:21:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7532, "total_steps": 9627, "loss": 1.6527, "learning_rate": 1.123683042162445e-05, "epoch": 0.7823828814791731, "percentage": 78.24, "elapsed_time": "2 days, 10:46:26", "remaining_time": "16:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7533, "total_steps": 9627, "loss": 1.8607, "learning_rate": 1.1226526317852193e-05, "epoch": 0.7824867559987535, "percentage": 78.25, "elapsed_time": "2 days, 10:46:58", "remaining_time": "16:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7534, "total_steps": 9627, "loss": 1.5447, "learning_rate": 1.1216226343152424e-05, "epoch": 0.7825906305183339, "percentage": 78.26, "elapsed_time": "2 days, 10:47:30", "remaining_time": "16:19:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7535, "total_steps": 9627, "loss": 1.6129, "learning_rate": 1.1205930498622053e-05, "epoch": 0.7826945050379142, "percentage": 78.27, "elapsed_time": "2 days, 10:48:01", "remaining_time": "16:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7536, "total_steps": 9627, "loss": 1.5621, "learning_rate": 1.1195638785357448e-05, "epoch": 0.7827983795574945, "percentage": 78.28, "elapsed_time": "2 days, 10:48:33", "remaining_time": "16:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7537, "total_steps": 9627, "loss": 1.7632, "learning_rate": 1.1185351204454647e-05, "epoch": 0.7829022540770749, "percentage": 78.29, "elapsed_time": "2 days, 10:49:06", "remaining_time": "16:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7538, "total_steps": 9627, "loss": 1.5052, "learning_rate": 1.1175067757009171e-05, "epoch": 0.7830061285966552, "percentage": 78.3, "elapsed_time": "2 days, 10:49:36", "remaining_time": "16:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7539, "total_steps": 9627, "loss": 1.7971, "learning_rate": 1.1164788444116131e-05, "epoch": 0.7831100031162356, "percentage": 78.31, "elapsed_time": "2 days, 10:50:09", "remaining_time": "16:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7540, "total_steps": 9627, "loss": 1.5101, "learning_rate": 1.1154513266870204e-05, "epoch": 0.783213877635816, "percentage": 78.32, "elapsed_time": "2 days, 10:50:41", "remaining_time": "16:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7541, "total_steps": 9627, "loss": 1.8468, "learning_rate": 1.1144242226365599e-05, "epoch": 0.7833177521553962, "percentage": 78.33, "elapsed_time": "2 days, 10:51:12", "remaining_time": "16:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7542, "total_steps": 9627, "loss": 1.6425, "learning_rate": 1.1133975323696111e-05, "epoch": 0.7834216266749766, "percentage": 78.34, "elapsed_time": "2 days, 10:51:44", "remaining_time": "16:16:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7543, "total_steps": 9627, "loss": 1.5772, "learning_rate": 1.1123712559955075e-05, "epoch": 0.783525501194557, "percentage": 78.35, "elapsed_time": "2 days, 10:52:14", "remaining_time": "16:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7544, "total_steps": 9627, "loss": 1.632, "learning_rate": 1.1113453936235418e-05, "epoch": 0.7836293757141374, "percentage": 78.36, "elapsed_time": "2 days, 10:52:47", "remaining_time": "16:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7545, "total_steps": 9627, "loss": 1.6937, "learning_rate": 1.1103199453629587e-05, "epoch": 0.7837332502337176, "percentage": 78.37, "elapsed_time": "2 days, 10:53:18", "remaining_time": "16:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7546, "total_steps": 9627, "loss": 1.7399, "learning_rate": 1.1092949113229612e-05, "epoch": 0.783837124753298, "percentage": 78.38, "elapsed_time": "2 days, 10:53:49", "remaining_time": "16:14:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7547, "total_steps": 9627, "loss": 1.6816, "learning_rate": 1.1082702916127063e-05, "epoch": 0.7839409992728784, "percentage": 78.39, "elapsed_time": "2 days, 10:54:21", "remaining_time": "16:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7548, "total_steps": 9627, "loss": 1.3392, "learning_rate": 1.1072460863413092e-05, "epoch": 0.7840448737924587, "percentage": 78.4, "elapsed_time": "2 days, 10:54:54", "remaining_time": "16:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7549, "total_steps": 9627, "loss": 1.6167, "learning_rate": 1.1062222956178391e-05, "epoch": 0.7841487483120391, "percentage": 78.41, "elapsed_time": "2 days, 10:55:26", "remaining_time": "16:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7550, "total_steps": 9627, "loss": 1.7752, "learning_rate": 1.1051989195513207e-05, "epoch": 0.7842526228316195, "percentage": 78.43, "elapsed_time": "2 days, 10:55:56", "remaining_time": "16:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7551, "total_steps": 9627, "loss": 1.6396, "learning_rate": 1.1041759582507393e-05, "epoch": 0.7843564973511997, "percentage": 78.44, "elapsed_time": "2 days, 10:56:28", "remaining_time": "16:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7552, "total_steps": 9627, "loss": 1.697, "learning_rate": 1.1031534118250269e-05, "epoch": 0.7844603718707801, "percentage": 78.45, "elapsed_time": "2 days, 10:56:59", "remaining_time": "16:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7553, "total_steps": 9627, "loss": 1.5987, "learning_rate": 1.1021312803830813e-05, "epoch": 0.7845642463903605, "percentage": 78.46, "elapsed_time": "2 days, 10:57:31", "remaining_time": "16:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7554, "total_steps": 9627, "loss": 1.5662, "learning_rate": 1.101109564033751e-05, "epoch": 0.7846681209099408, "percentage": 78.47, "elapsed_time": "2 days, 10:58:03", "remaining_time": "16:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7555, "total_steps": 9627, "loss": 1.4838, "learning_rate": 1.1000882628858367e-05, "epoch": 0.7847719954295211, "percentage": 78.48, "elapsed_time": "2 days, 10:58:34", "remaining_time": "16:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7556, "total_steps": 9627, "loss": 1.6211, "learning_rate": 1.0990673770481036e-05, "epoch": 0.7848758699491015, "percentage": 78.49, "elapsed_time": "2 days, 10:59:07", "remaining_time": "16:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7557, "total_steps": 9627, "loss": 1.5268, "learning_rate": 1.0980469066292659e-05, "epoch": 0.7849797444686818, "percentage": 78.5, "elapsed_time": "2 days, 10:59:38", "remaining_time": "16:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7558, "total_steps": 9627, "loss": 1.7556, "learning_rate": 1.0970268517379967e-05, "epoch": 0.7850836189882622, "percentage": 78.51, "elapsed_time": "2 days, 11:00:09", "remaining_time": "16:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7559, "total_steps": 9627, "loss": 1.5014, "learning_rate": 1.0960072124829235e-05, "epoch": 0.7851874935078426, "percentage": 78.52, "elapsed_time": "2 days, 11:00:42", "remaining_time": "16:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7560, "total_steps": 9627, "loss": 1.6162, "learning_rate": 1.0949879889726294e-05, "epoch": 0.7852913680274228, "percentage": 78.53, "elapsed_time": "2 days, 11:01:14", "remaining_time": "16:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7561, "total_steps": 9627, "loss": 1.7035, "learning_rate": 1.0939691813156544e-05, "epoch": 0.7853952425470032, "percentage": 78.54, "elapsed_time": "2 days, 11:01:45", "remaining_time": "16:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7562, "total_steps": 9627, "loss": 1.6337, "learning_rate": 1.0929507896204921e-05, "epoch": 0.7854991170665836, "percentage": 78.55, "elapsed_time": "2 days, 11:02:18", "remaining_time": "16:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7563, "total_steps": 9627, "loss": 1.6693, "learning_rate": 1.0919328139955976e-05, "epoch": 0.7856029915861639, "percentage": 78.56, "elapsed_time": "2 days, 11:02:50", "remaining_time": "16:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7564, "total_steps": 9627, "loss": 1.6461, "learning_rate": 1.0909152545493712e-05, "epoch": 0.7857068661057443, "percentage": 78.57, "elapsed_time": "2 days, 11:03:22", "remaining_time": "16:06:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7565, "total_steps": 9627, "loss": 1.6278, "learning_rate": 1.089898111390179e-05, "epoch": 0.7858107406253246, "percentage": 78.58, "elapsed_time": "2 days, 11:03:55", "remaining_time": "16:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7566, "total_steps": 9627, "loss": 1.5302, "learning_rate": 1.0888813846263391e-05, "epoch": 0.7859146151449049, "percentage": 78.59, "elapsed_time": "2 days, 11:04:25", "remaining_time": "16:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7567, "total_steps": 9627, "loss": 1.6846, "learning_rate": 1.0878650743661229e-05, "epoch": 0.7860184896644853, "percentage": 78.6, "elapsed_time": "2 days, 11:04:57", "remaining_time": "16:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7568, "total_steps": 9627, "loss": 1.6535, "learning_rate": 1.086849180717761e-05, "epoch": 0.7861223641840657, "percentage": 78.61, "elapsed_time": "2 days, 11:05:29", "remaining_time": "16:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7569, "total_steps": 9627, "loss": 1.6498, "learning_rate": 1.0858337037894372e-05, "epoch": 0.7862262387036459, "percentage": 78.62, "elapsed_time": "2 days, 11:06:02", "remaining_time": "16:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7570, "total_steps": 9627, "loss": 1.5972, "learning_rate": 1.0848186436892927e-05, "epoch": 0.7863301132232263, "percentage": 78.63, "elapsed_time": "2 days, 11:06:34", "remaining_time": "16:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7571, "total_steps": 9627, "loss": 1.618, "learning_rate": 1.0838040005254213e-05, "epoch": 0.7864339877428067, "percentage": 78.64, "elapsed_time": "2 days, 11:07:05", "remaining_time": "16:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7572, "total_steps": 9627, "loss": 1.5818, "learning_rate": 1.082789774405878e-05, "epoch": 0.7865378622623871, "percentage": 78.65, "elapsed_time": "2 days, 11:07:37", "remaining_time": "16:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7573, "total_steps": 9627, "loss": 1.512, "learning_rate": 1.0817759654386684e-05, "epoch": 0.7866417367819674, "percentage": 78.66, "elapsed_time": "2 days, 11:08:09", "remaining_time": "16:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7574, "total_steps": 9627, "loss": 1.6786, "learning_rate": 1.0807625737317545e-05, "epoch": 0.7867456113015477, "percentage": 78.67, "elapsed_time": "2 days, 11:08:40", "remaining_time": "16:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7575, "total_steps": 9627, "loss": 1.7152, "learning_rate": 1.0797495993930562e-05, "epoch": 0.7868494858211281, "percentage": 78.68, "elapsed_time": "2 days, 11:09:12", "remaining_time": "16:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7576, "total_steps": 9627, "loss": 1.7505, "learning_rate": 1.0787370425304454e-05, "epoch": 0.7869533603407084, "percentage": 78.7, "elapsed_time": "2 days, 11:09:44", "remaining_time": "16:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7577, "total_steps": 9627, "loss": 1.6145, "learning_rate": 1.0777249032517534e-05, "epoch": 0.7870572348602888, "percentage": 78.71, "elapsed_time": "2 days, 11:10:16", "remaining_time": "16:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7578, "total_steps": 9627, "loss": 1.4186, "learning_rate": 1.0767131816647624e-05, "epoch": 0.7871611093798692, "percentage": 78.72, "elapsed_time": "2 days, 11:10:48", "remaining_time": "16:00:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7579, "total_steps": 9627, "loss": 1.7788, "learning_rate": 1.0757018778772181e-05, "epoch": 0.7872649838994494, "percentage": 78.73, "elapsed_time": "2 days, 11:11:21", "remaining_time": "15:59:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7580, "total_steps": 9627, "loss": 1.7623, "learning_rate": 1.0746909919968102e-05, "epoch": 0.7873688584190298, "percentage": 78.74, "elapsed_time": "2 days, 11:11:53", "remaining_time": "15:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7581, "total_steps": 9627, "loss": 1.7721, "learning_rate": 1.0736805241311937e-05, "epoch": 0.7874727329386102, "percentage": 78.75, "elapsed_time": "2 days, 11:12:23", "remaining_time": "15:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7582, "total_steps": 9627, "loss": 1.6909, "learning_rate": 1.0726704743879767e-05, "epoch": 0.7875766074581905, "percentage": 78.76, "elapsed_time": "2 days, 11:12:55", "remaining_time": "15:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7583, "total_steps": 9627, "loss": 1.6288, "learning_rate": 1.0716608428747177e-05, "epoch": 0.7876804819777709, "percentage": 78.77, "elapsed_time": "2 days, 11:13:28", "remaining_time": "15:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7584, "total_steps": 9627, "loss": 1.7996, "learning_rate": 1.0706516296989372e-05, "epoch": 0.7877843564973512, "percentage": 78.78, "elapsed_time": "2 days, 11:14:00", "remaining_time": "15:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7585, "total_steps": 9627, "loss": 1.5053, "learning_rate": 1.0696428349681087e-05, "epoch": 0.7878882310169315, "percentage": 78.79, "elapsed_time": "2 days, 11:14:32", "remaining_time": "15:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7586, "total_steps": 9627, "loss": 1.6293, "learning_rate": 1.0686344587896597e-05, "epoch": 0.7879921055365119, "percentage": 78.8, "elapsed_time": "2 days, 11:15:04", "remaining_time": "15:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7587, "total_steps": 9627, "loss": 1.628, "learning_rate": 1.0676265012709752e-05, "epoch": 0.7880959800560923, "percentage": 78.81, "elapsed_time": "2 days, 11:15:36", "remaining_time": "15:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7588, "total_steps": 9627, "loss": 1.8276, "learning_rate": 1.066618962519395e-05, "epoch": 0.7881998545756725, "percentage": 78.82, "elapsed_time": "2 days, 11:16:09", "remaining_time": "15:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7589, "total_steps": 9627, "loss": 1.6578, "learning_rate": 1.0656118426422134e-05, "epoch": 0.7883037290952529, "percentage": 78.83, "elapsed_time": "2 days, 11:16:39", "remaining_time": "15:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7590, "total_steps": 9627, "loss": 1.74, "learning_rate": 1.06460514174668e-05, "epoch": 0.7884076036148333, "percentage": 78.84, "elapsed_time": "2 days, 11:17:11", "remaining_time": "15:54:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7591, "total_steps": 9627, "loss": 1.7842, "learning_rate": 1.0635988599400043e-05, "epoch": 0.7885114781344136, "percentage": 78.85, "elapsed_time": "2 days, 11:17:44", "remaining_time": "15:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7592, "total_steps": 9627, "loss": 1.5922, "learning_rate": 1.0625929973293419e-05, "epoch": 0.788615352653994, "percentage": 78.86, "elapsed_time": "2 days, 11:18:16", "remaining_time": "15:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7593, "total_steps": 9627, "loss": 1.7011, "learning_rate": 1.061587554021814e-05, "epoch": 0.7887192271735743, "percentage": 78.87, "elapsed_time": "2 days, 11:18:47", "remaining_time": "15:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7594, "total_steps": 9627, "loss": 1.683, "learning_rate": 1.0605825301244909e-05, "epoch": 0.7888231016931546, "percentage": 78.88, "elapsed_time": "2 days, 11:19:18", "remaining_time": "15:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7595, "total_steps": 9627, "loss": 1.4897, "learning_rate": 1.0595779257444e-05, "epoch": 0.788926976212735, "percentage": 78.89, "elapsed_time": "2 days, 11:19:51", "remaining_time": "15:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7596, "total_steps": 9627, "loss": 1.6298, "learning_rate": 1.0585737409885227e-05, "epoch": 0.7890308507323154, "percentage": 78.9, "elapsed_time": "2 days, 11:20:22", "remaining_time": "15:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7597, "total_steps": 9627, "loss": 1.6549, "learning_rate": 1.057569975963797e-05, "epoch": 0.7891347252518958, "percentage": 78.91, "elapsed_time": "2 days, 11:20:55", "remaining_time": "15:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7598, "total_steps": 9627, "loss": 1.7137, "learning_rate": 1.0565666307771193e-05, "epoch": 0.789238599771476, "percentage": 78.92, "elapsed_time": "2 days, 11:21:26", "remaining_time": "15:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7599, "total_steps": 9627, "loss": 1.5784, "learning_rate": 1.0555637055353324e-05, "epoch": 0.7893424742910564, "percentage": 78.93, "elapsed_time": "2 days, 11:21:57", "remaining_time": "15:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7600, "total_steps": 9627, "loss": 1.6315, "learning_rate": 1.054561200345245e-05, "epoch": 0.7894463488106368, "percentage": 78.94, "elapsed_time": "2 days, 11:22:29", "remaining_time": "15:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7601, "total_steps": 9627, "loss": 1.7496, "learning_rate": 1.0535591153136137e-05, "epoch": 0.7895502233302171, "percentage": 78.96, "elapsed_time": "2 days, 11:23:00", "remaining_time": "15:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7602, "total_steps": 9627, "loss": 1.6808, "learning_rate": 1.0525574505471531e-05, "epoch": 0.7896540978497975, "percentage": 78.97, "elapsed_time": "2 days, 11:23:32", "remaining_time": "15:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7603, "total_steps": 9627, "loss": 1.5215, "learning_rate": 1.051556206152533e-05, "epoch": 0.7897579723693778, "percentage": 78.98, "elapsed_time": "2 days, 11:24:04", "remaining_time": "15:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7604, "total_steps": 9627, "loss": 1.6401, "learning_rate": 1.0505553822363783e-05, "epoch": 0.7898618468889581, "percentage": 78.99, "elapsed_time": "2 days, 11:24:35", "remaining_time": "15:48:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7605, "total_steps": 9627, "loss": 1.613, "learning_rate": 1.0495549789052678e-05, "epoch": 0.7899657214085385, "percentage": 79.0, "elapsed_time": "2 days, 11:25:07", "remaining_time": "15:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7606, "total_steps": 9627, "loss": 1.6405, "learning_rate": 1.0485549962657365e-05, "epoch": 0.7900695959281189, "percentage": 79.01, "elapsed_time": "2 days, 11:25:38", "remaining_time": "15:47:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7607, "total_steps": 9627, "loss": 1.5479, "learning_rate": 1.0475554344242783e-05, "epoch": 0.7901734704476991, "percentage": 79.02, "elapsed_time": "2 days, 11:26:09", "remaining_time": "15:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7608, "total_steps": 9627, "loss": 1.8367, "learning_rate": 1.0465562934873335e-05, "epoch": 0.7902773449672795, "percentage": 79.03, "elapsed_time": "2 days, 11:26:40", "remaining_time": "15:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7609, "total_steps": 9627, "loss": 1.6501, "learning_rate": 1.0455575735613066e-05, "epoch": 0.7903812194868599, "percentage": 79.04, "elapsed_time": "2 days, 11:27:13", "remaining_time": "15:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7610, "total_steps": 9627, "loss": 1.5864, "learning_rate": 1.0445592747525534e-05, "epoch": 0.7904850940064402, "percentage": 79.05, "elapsed_time": "2 days, 11:27:45", "remaining_time": "15:45:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7611, "total_steps": 9627, "loss": 1.5591, "learning_rate": 1.0435613971673813e-05, "epoch": 0.7905889685260206, "percentage": 79.06, "elapsed_time": "2 days, 11:28:18", "remaining_time": "15:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7612, "total_steps": 9627, "loss": 1.6134, "learning_rate": 1.0425639409120602e-05, "epoch": 0.790692843045601, "percentage": 79.07, "elapsed_time": "2 days, 11:28:49", "remaining_time": "15:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7613, "total_steps": 9627, "loss": 1.7608, "learning_rate": 1.0415669060928108e-05, "epoch": 0.7907967175651812, "percentage": 79.08, "elapsed_time": "2 days, 11:29:20", "remaining_time": "15:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7614, "total_steps": 9627, "loss": 1.7024, "learning_rate": 1.0405702928158085e-05, "epoch": 0.7909005920847616, "percentage": 79.09, "elapsed_time": "2 days, 11:29:53", "remaining_time": "15:43:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7615, "total_steps": 9627, "loss": 1.6004, "learning_rate": 1.0395741011871851e-05, "epoch": 0.791004466604342, "percentage": 79.1, "elapsed_time": "2 days, 11:30:23", "remaining_time": "15:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7616, "total_steps": 9627, "loss": 1.6282, "learning_rate": 1.0385783313130276e-05, "epoch": 0.7911083411239223, "percentage": 79.11, "elapsed_time": "2 days, 11:30:55", "remaining_time": "15:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7617, "total_steps": 9627, "loss": 1.7222, "learning_rate": 1.0375829832993772e-05, "epoch": 0.7912122156435026, "percentage": 79.12, "elapsed_time": "2 days, 11:31:26", "remaining_time": "15:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7618, "total_steps": 9627, "loss": 1.7329, "learning_rate": 1.0365880572522302e-05, "epoch": 0.791316090163083, "percentage": 79.13, "elapsed_time": "2 days, 11:31:59", "remaining_time": "15:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7619, "total_steps": 9627, "loss": 1.5133, "learning_rate": 1.0355935532775419e-05, "epoch": 0.7914199646826633, "percentage": 79.14, "elapsed_time": "2 days, 11:32:31", "remaining_time": "15:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7620, "total_steps": 9627, "loss": 1.4862, "learning_rate": 1.0345994714812135e-05, "epoch": 0.7915238392022437, "percentage": 79.15, "elapsed_time": "2 days, 11:33:02", "remaining_time": "15:41:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7621, "total_steps": 9627, "loss": 1.5222, "learning_rate": 1.0336058119691122e-05, "epoch": 0.7916277137218241, "percentage": 79.16, "elapsed_time": "2 days, 11:33:35", "remaining_time": "15:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7622, "total_steps": 9627, "loss": 1.6171, "learning_rate": 1.0326125748470522e-05, "epoch": 0.7917315882414044, "percentage": 79.17, "elapsed_time": "2 days, 11:34:06", "remaining_time": "15:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7623, "total_steps": 9627, "loss": 1.7382, "learning_rate": 1.0316197602208067e-05, "epoch": 0.7918354627609847, "percentage": 79.18, "elapsed_time": "2 days, 11:34:38", "remaining_time": "15:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7624, "total_steps": 9627, "loss": 1.8618, "learning_rate": 1.0306273681961014e-05, "epoch": 0.7919393372805651, "percentage": 79.19, "elapsed_time": "2 days, 11:35:11", "remaining_time": "15:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7625, "total_steps": 9627, "loss": 1.7562, "learning_rate": 1.0296353988786184e-05, "epoch": 0.7920432118001455, "percentage": 79.2, "elapsed_time": "2 days, 11:35:42", "remaining_time": "15:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7626, "total_steps": 9627, "loss": 1.5518, "learning_rate": 1.0286438523739978e-05, "epoch": 0.7921470863197257, "percentage": 79.21, "elapsed_time": "2 days, 11:36:13", "remaining_time": "15:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7627, "total_steps": 9627, "loss": 1.831, "learning_rate": 1.0276527287878268e-05, "epoch": 0.7922509608393061, "percentage": 79.23, "elapsed_time": "2 days, 11:36:46", "remaining_time": "15:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7628, "total_steps": 9627, "loss": 1.69, "learning_rate": 1.0266620282256556e-05, "epoch": 0.7923548353588865, "percentage": 79.24, "elapsed_time": "2 days, 11:37:17", "remaining_time": "15:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7629, "total_steps": 9627, "loss": 1.4931, "learning_rate": 1.0256717507929852e-05, "epoch": 0.7924587098784668, "percentage": 79.25, "elapsed_time": "2 days, 11:37:48", "remaining_time": "15:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7630, "total_steps": 9627, "loss": 1.5392, "learning_rate": 1.0246818965952727e-05, "epoch": 0.7925625843980472, "percentage": 79.26, "elapsed_time": "2 days, 11:38:20", "remaining_time": "15:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7631, "total_steps": 9627, "loss": 1.5485, "learning_rate": 1.0236924657379293e-05, "epoch": 0.7926664589176275, "percentage": 79.27, "elapsed_time": "2 days, 11:38:51", "remaining_time": "15:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7632, "total_steps": 9627, "loss": 1.7733, "learning_rate": 1.0227034583263218e-05, "epoch": 0.7927703334372078, "percentage": 79.28, "elapsed_time": "2 days, 11:39:23", "remaining_time": "15:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7633, "total_steps": 9627, "loss": 1.7832, "learning_rate": 1.0217148744657723e-05, "epoch": 0.7928742079567882, "percentage": 79.29, "elapsed_time": "2 days, 11:39:54", "remaining_time": "15:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7634, "total_steps": 9627, "loss": 1.6996, "learning_rate": 1.0207267142615552e-05, "epoch": 0.7929780824763686, "percentage": 79.3, "elapsed_time": "2 days, 11:40:26", "remaining_time": "15:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7635, "total_steps": 9627, "loss": 1.6218, "learning_rate": 1.0197389778189065e-05, "epoch": 0.7930819569959489, "percentage": 79.31, "elapsed_time": "2 days, 11:40:58", "remaining_time": "15:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7636, "total_steps": 9627, "loss": 1.6509, "learning_rate": 1.0187516652430062e-05, "epoch": 0.7931858315155292, "percentage": 79.32, "elapsed_time": "2 days, 11:41:29", "remaining_time": "15:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7637, "total_steps": 9627, "loss": 1.7145, "learning_rate": 1.0177647766390002e-05, "epoch": 0.7932897060351096, "percentage": 79.33, "elapsed_time": "2 days, 11:42:00", "remaining_time": "15:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7638, "total_steps": 9627, "loss": 1.3435, "learning_rate": 1.0167783121119845e-05, "epoch": 0.7933935805546899, "percentage": 79.34, "elapsed_time": "2 days, 11:42:32", "remaining_time": "15:32:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7639, "total_steps": 9627, "loss": 1.5719, "learning_rate": 1.0157922717670054e-05, "epoch": 0.7934974550742703, "percentage": 79.35, "elapsed_time": "2 days, 11:43:03", "remaining_time": "15:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7640, "total_steps": 9627, "loss": 1.6977, "learning_rate": 1.0148066557090724e-05, "epoch": 0.7936013295938507, "percentage": 79.36, "elapsed_time": "2 days, 11:43:35", "remaining_time": "15:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7641, "total_steps": 9627, "loss": 1.7793, "learning_rate": 1.0138214640431454e-05, "epoch": 0.7937052041134309, "percentage": 79.37, "elapsed_time": "2 days, 11:44:06", "remaining_time": "15:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7642, "total_steps": 9627, "loss": 1.7664, "learning_rate": 1.0128366968741387e-05, "epoch": 0.7938090786330113, "percentage": 79.38, "elapsed_time": "2 days, 11:44:38", "remaining_time": "15:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7643, "total_steps": 9627, "loss": 1.6902, "learning_rate": 1.0118523543069226e-05, "epoch": 0.7939129531525917, "percentage": 79.39, "elapsed_time": "2 days, 11:45:09", "remaining_time": "15:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7644, "total_steps": 9627, "loss": 1.6312, "learning_rate": 1.0108684364463222e-05, "epoch": 0.794016827672172, "percentage": 79.4, "elapsed_time": "2 days, 11:45:41", "remaining_time": "15:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7645, "total_steps": 9627, "loss": 1.6194, "learning_rate": 1.0098849433971169e-05, "epoch": 0.7941207021917523, "percentage": 79.41, "elapsed_time": "2 days, 11:46:12", "remaining_time": "15:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7646, "total_steps": 9627, "loss": 1.6965, "learning_rate": 1.0089018752640394e-05, "epoch": 0.7942245767113327, "percentage": 79.42, "elapsed_time": "2 days, 11:46:44", "remaining_time": "15:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7647, "total_steps": 9627, "loss": 1.7115, "learning_rate": 1.0079192321517838e-05, "epoch": 0.794328451230913, "percentage": 79.43, "elapsed_time": "2 days, 11:47:14", "remaining_time": "15:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7648, "total_steps": 9627, "loss": 1.4832, "learning_rate": 1.0069370141649876e-05, "epoch": 0.7944323257504934, "percentage": 79.44, "elapsed_time": "2 days, 11:47:46", "remaining_time": "15:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7649, "total_steps": 9627, "loss": 1.6654, "learning_rate": 1.0059552214082536e-05, "epoch": 0.7945362002700738, "percentage": 79.45, "elapsed_time": "2 days, 11:48:18", "remaining_time": "15:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7650, "total_steps": 9627, "loss": 1.6049, "learning_rate": 1.0049738539861332e-05, "epoch": 0.7946400747896541, "percentage": 79.46, "elapsed_time": "2 days, 11:48:50", "remaining_time": "15:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7651, "total_steps": 9627, "loss": 1.7055, "learning_rate": 1.0039929120031355e-05, "epoch": 0.7947439493092344, "percentage": 79.47, "elapsed_time": "2 days, 11:49:21", "remaining_time": "15:27:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7652, "total_steps": 9627, "loss": 1.7024, "learning_rate": 1.0030123955637227e-05, "epoch": 0.7948478238288148, "percentage": 79.48, "elapsed_time": "2 days, 11:49:52", "remaining_time": "15:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7653, "total_steps": 9627, "loss": 1.7098, "learning_rate": 1.0020323047723108e-05, "epoch": 0.7949516983483952, "percentage": 79.5, "elapsed_time": "2 days, 11:50:23", "remaining_time": "15:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7654, "total_steps": 9627, "loss": 1.5875, "learning_rate": 1.0010526397332754e-05, "epoch": 0.7950555728679755, "percentage": 79.51, "elapsed_time": "2 days, 11:50:55", "remaining_time": "15:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7655, "total_steps": 9627, "loss": 1.6725, "learning_rate": 1.0000734005509382e-05, "epoch": 0.7951594473875558, "percentage": 79.52, "elapsed_time": "2 days, 11:51:26", "remaining_time": "15:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7656, "total_steps": 9627, "loss": 1.6157, "learning_rate": 9.990945873295848e-06, "epoch": 0.7952633219071362, "percentage": 79.53, "elapsed_time": "2 days, 11:51:58", "remaining_time": "15:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7657, "total_steps": 9627, "loss": 1.7816, "learning_rate": 9.981162001734496e-06, "epoch": 0.7953671964267165, "percentage": 79.54, "elapsed_time": "2 days, 11:52:29", "remaining_time": "15:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7658, "total_steps": 9627, "loss": 1.6609, "learning_rate": 9.97138239186723e-06, "epoch": 0.7954710709462969, "percentage": 79.55, "elapsed_time": "2 days, 11:53:00", "remaining_time": "15:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7659, "total_steps": 9627, "loss": 1.5903, "learning_rate": 9.961607044735505e-06, "epoch": 0.7955749454658773, "percentage": 79.56, "elapsed_time": "2 days, 11:53:32", "remaining_time": "15:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7660, "total_steps": 9627, "loss": 1.655, "learning_rate": 9.951835961380317e-06, "epoch": 0.7956788199854575, "percentage": 79.57, "elapsed_time": "2 days, 11:54:04", "remaining_time": "15:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7661, "total_steps": 9627, "loss": 1.5481, "learning_rate": 9.942069142842214e-06, "epoch": 0.7957826945050379, "percentage": 79.58, "elapsed_time": "2 days, 11:54:36", "remaining_time": "15:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7662, "total_steps": 9627, "loss": 1.6456, "learning_rate": 9.932306590161266e-06, "epoch": 0.7958865690246183, "percentage": 79.59, "elapsed_time": "2 days, 11:55:07", "remaining_time": "15:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7663, "total_steps": 9627, "loss": 1.6836, "learning_rate": 9.922548304377154e-06, "epoch": 0.7959904435441986, "percentage": 79.6, "elapsed_time": "2 days, 11:55:39", "remaining_time": "15:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7664, "total_steps": 9627, "loss": 1.5107, "learning_rate": 9.91279428652901e-06, "epoch": 0.796094318063779, "percentage": 79.61, "elapsed_time": "2 days, 11:56:12", "remaining_time": "15:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7665, "total_steps": 9627, "loss": 1.6828, "learning_rate": 9.903044537655587e-06, "epoch": 0.7961981925833593, "percentage": 79.62, "elapsed_time": "2 days, 11:56:44", "remaining_time": "15:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7666, "total_steps": 9627, "loss": 1.5791, "learning_rate": 9.893299058795175e-06, "epoch": 0.7963020671029396, "percentage": 79.63, "elapsed_time": "2 days, 11:57:14", "remaining_time": "15:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7667, "total_steps": 9627, "loss": 1.6213, "learning_rate": 9.883557850985537e-06, "epoch": 0.79640594162252, "percentage": 79.64, "elapsed_time": "2 days, 11:57:46", "remaining_time": "15:19:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7668, "total_steps": 9627, "loss": 1.7171, "learning_rate": 9.873820915264082e-06, "epoch": 0.7965098161421004, "percentage": 79.65, "elapsed_time": "2 days, 11:58:18", "remaining_time": "15:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7669, "total_steps": 9627, "loss": 1.5873, "learning_rate": 9.864088252667702e-06, "epoch": 0.7966136906616806, "percentage": 79.66, "elapsed_time": "2 days, 11:58:49", "remaining_time": "15:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7670, "total_steps": 9627, "loss": 1.8697, "learning_rate": 9.854359864232854e-06, "epoch": 0.796717565181261, "percentage": 79.67, "elapsed_time": "2 days, 11:59:20", "remaining_time": "15:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7671, "total_steps": 9627, "loss": 1.6293, "learning_rate": 9.84463575099553e-06, "epoch": 0.7968214397008414, "percentage": 79.68, "elapsed_time": "2 days, 11:59:52", "remaining_time": "15:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7672, "total_steps": 9627, "loss": 1.7457, "learning_rate": 9.834915913991272e-06, "epoch": 0.7969253142204217, "percentage": 79.69, "elapsed_time": "2 days, 12:00:24", "remaining_time": "15:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7673, "total_steps": 9627, "loss": 1.5509, "learning_rate": 9.825200354255171e-06, "epoch": 0.7970291887400021, "percentage": 79.7, "elapsed_time": "2 days, 12:00:56", "remaining_time": "15:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7674, "total_steps": 9627, "loss": 1.6039, "learning_rate": 9.815489072821848e-06, "epoch": 0.7971330632595824, "percentage": 79.71, "elapsed_time": "2 days, 12:01:26", "remaining_time": "15:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7675, "total_steps": 9627, "loss": 1.5862, "learning_rate": 9.805782070725494e-06, "epoch": 0.7972369377791628, "percentage": 79.72, "elapsed_time": "2 days, 12:01:59", "remaining_time": "15:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7676, "total_steps": 9627, "loss": 1.6685, "learning_rate": 9.796079348999831e-06, "epoch": 0.7973408122987431, "percentage": 79.73, "elapsed_time": "2 days, 12:02:31", "remaining_time": "15:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7677, "total_steps": 9627, "loss": 1.6917, "learning_rate": 9.786380908678112e-06, "epoch": 0.7974446868183235, "percentage": 79.74, "elapsed_time": "2 days, 12:03:03", "remaining_time": "15:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7678, "total_steps": 9627, "loss": 1.6786, "learning_rate": 9.77668675079314e-06, "epoch": 0.7975485613379039, "percentage": 79.75, "elapsed_time": "2 days, 12:03:33", "remaining_time": "15:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7679, "total_steps": 9627, "loss": 1.5424, "learning_rate": 9.766996876377283e-06, "epoch": 0.7976524358574841, "percentage": 79.77, "elapsed_time": "2 days, 12:04:04", "remaining_time": "15:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7680, "total_steps": 9627, "loss": 1.6682, "learning_rate": 9.757311286462429e-06, "epoch": 0.7977563103770645, "percentage": 79.78, "elapsed_time": "2 days, 12:04:37", "remaining_time": "15:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7681, "total_steps": 9627, "loss": 1.7237, "learning_rate": 9.747629982080003e-06, "epoch": 0.7978601848966449, "percentage": 79.79, "elapsed_time": "2 days, 12:05:08", "remaining_time": "15:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7682, "total_steps": 9627, "loss": 1.7689, "learning_rate": 9.737952964261027e-06, "epoch": 0.7979640594162252, "percentage": 79.8, "elapsed_time": "2 days, 12:05:40", "remaining_time": "15:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7683, "total_steps": 9627, "loss": 1.6688, "learning_rate": 9.728280234035981e-06, "epoch": 0.7980679339358056, "percentage": 79.81, "elapsed_time": "2 days, 12:06:12", "remaining_time": "15:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7684, "total_steps": 9627, "loss": 1.7833, "learning_rate": 9.718611792434973e-06, "epoch": 0.7981718084553859, "percentage": 79.82, "elapsed_time": "2 days, 12:06:44", "remaining_time": "15:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7685, "total_steps": 9627, "loss": 1.6129, "learning_rate": 9.708947640487598e-06, "epoch": 0.7982756829749662, "percentage": 79.83, "elapsed_time": "2 days, 12:07:14", "remaining_time": "15:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7686, "total_steps": 9627, "loss": 1.7152, "learning_rate": 9.699287779223022e-06, "epoch": 0.7983795574945466, "percentage": 79.84, "elapsed_time": "2 days, 12:07:46", "remaining_time": "15:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7687, "total_steps": 9627, "loss": 1.5439, "learning_rate": 9.689632209669935e-06, "epoch": 0.798483432014127, "percentage": 79.85, "elapsed_time": "2 days, 12:08:18", "remaining_time": "15:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7688, "total_steps": 9627, "loss": 1.6193, "learning_rate": 9.679980932856591e-06, "epoch": 0.7985873065337072, "percentage": 79.86, "elapsed_time": "2 days, 12:08:50", "remaining_time": "15:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7689, "total_steps": 9627, "loss": 1.5908, "learning_rate": 9.670333949810761e-06, "epoch": 0.7986911810532876, "percentage": 79.87, "elapsed_time": "2 days, 12:09:23", "remaining_time": "15:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7690, "total_steps": 9627, "loss": 1.6236, "learning_rate": 9.660691261559774e-06, "epoch": 0.798795055572868, "percentage": 79.88, "elapsed_time": "2 days, 12:09:53", "remaining_time": "15:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7691, "total_steps": 9627, "loss": 1.5387, "learning_rate": 9.65105286913054e-06, "epoch": 0.7988989300924483, "percentage": 79.89, "elapsed_time": "2 days, 12:10:25", "remaining_time": "15:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7692, "total_steps": 9627, "loss": 1.583, "learning_rate": 9.641418773549405e-06, "epoch": 0.7990028046120287, "percentage": 79.9, "elapsed_time": "2 days, 12:10:56", "remaining_time": "15:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7693, "total_steps": 9627, "loss": 1.593, "learning_rate": 9.631788975842381e-06, "epoch": 0.799106679131609, "percentage": 79.91, "elapsed_time": "2 days, 12:11:26", "remaining_time": "15:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7694, "total_steps": 9627, "loss": 1.6916, "learning_rate": 9.622163477034957e-06, "epoch": 0.7992105536511893, "percentage": 79.92, "elapsed_time": "2 days, 12:11:59", "remaining_time": "15:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7695, "total_steps": 9627, "loss": 1.6192, "learning_rate": 9.612542278152142e-06, "epoch": 0.7993144281707697, "percentage": 79.93, "elapsed_time": "2 days, 12:12:31", "remaining_time": "15:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7696, "total_steps": 9627, "loss": 1.6866, "learning_rate": 9.602925380218547e-06, "epoch": 0.7994183026903501, "percentage": 79.94, "elapsed_time": "2 days, 12:13:01", "remaining_time": "15:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7697, "total_steps": 9627, "loss": 1.7376, "learning_rate": 9.593312784258297e-06, "epoch": 0.7995221772099304, "percentage": 79.95, "elapsed_time": "2 days, 12:13:34", "remaining_time": "15:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7698, "total_steps": 9627, "loss": 1.6386, "learning_rate": 9.583704491295042e-06, "epoch": 0.7996260517295107, "percentage": 79.96, "elapsed_time": "2 days, 12:14:04", "remaining_time": "15:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7699, "total_steps": 9627, "loss": 1.7478, "learning_rate": 9.574100502352007e-06, "epoch": 0.7997299262490911, "percentage": 79.97, "elapsed_time": "2 days, 12:14:37", "remaining_time": "15:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7700, "total_steps": 9627, "loss": 1.4819, "learning_rate": 9.564500818451916e-06, "epoch": 0.7998338007686715, "percentage": 79.98, "elapsed_time": "2 days, 12:15:08", "remaining_time": "15:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7701, "total_steps": 9627, "loss": 1.5952, "learning_rate": 9.554905440617108e-06, "epoch": 0.7999376752882518, "percentage": 79.99, "elapsed_time": "2 days, 12:15:39", "remaining_time": "15:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7702, "total_steps": 9627, "loss": 1.7333, "learning_rate": 9.545314369869362e-06, "epoch": 0.8000415498078322, "percentage": 80.0, "elapsed_time": "2 days, 12:16:11", "remaining_time": "15:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7703, "total_steps": 9627, "loss": 1.7021, "learning_rate": 9.535727607230088e-06, "epoch": 0.8001454243274125, "percentage": 80.01, "elapsed_time": "2 days, 12:16:41", "remaining_time": "15:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7704, "total_steps": 9627, "loss": 1.5992, "learning_rate": 9.52614515372019e-06, "epoch": 0.8002492988469928, "percentage": 80.02, "elapsed_time": "2 days, 12:17:13", "remaining_time": "15:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7705, "total_steps": 9627, "loss": 1.2576, "learning_rate": 9.516567010360127e-06, "epoch": 0.8003531733665732, "percentage": 80.04, "elapsed_time": "2 days, 12:17:44", "remaining_time": "15:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7706, "total_steps": 9627, "loss": 1.5702, "learning_rate": 9.506993178169892e-06, "epoch": 0.8004570478861536, "percentage": 80.05, "elapsed_time": "2 days, 12:18:15", "remaining_time": "15:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7707, "total_steps": 9627, "loss": 1.5422, "learning_rate": 9.497423658169025e-06, "epoch": 0.8005609224057338, "percentage": 80.06, "elapsed_time": "2 days, 12:18:47", "remaining_time": "15:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7708, "total_steps": 9627, "loss": 1.7401, "learning_rate": 9.487858451376608e-06, "epoch": 0.8006647969253142, "percentage": 80.07, "elapsed_time": "2 days, 12:19:20", "remaining_time": "15:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7709, "total_steps": 9627, "loss": 1.7727, "learning_rate": 9.47829755881125e-06, "epoch": 0.8007686714448946, "percentage": 80.08, "elapsed_time": "2 days, 12:19:49", "remaining_time": "15:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7710, "total_steps": 9627, "loss": 1.6619, "learning_rate": 9.468740981491143e-06, "epoch": 0.8008725459644749, "percentage": 80.09, "elapsed_time": "2 days, 12:20:22", "remaining_time": "15:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7711, "total_steps": 9627, "loss": 1.5847, "learning_rate": 9.459188720433937e-06, "epoch": 0.8009764204840553, "percentage": 80.1, "elapsed_time": "2 days, 12:20:54", "remaining_time": "14:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7712, "total_steps": 9627, "loss": 1.6943, "learning_rate": 9.449640776656915e-06, "epoch": 0.8010802950036356, "percentage": 80.11, "elapsed_time": "2 days, 12:21:24", "remaining_time": "14:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7713, "total_steps": 9627, "loss": 1.5879, "learning_rate": 9.440097151176846e-06, "epoch": 0.8011841695232159, "percentage": 80.12, "elapsed_time": "2 days, 12:21:56", "remaining_time": "14:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7714, "total_steps": 9627, "loss": 1.7309, "learning_rate": 9.430557845010058e-06, "epoch": 0.8012880440427963, "percentage": 80.13, "elapsed_time": "2 days, 12:22:27", "remaining_time": "14:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7715, "total_steps": 9627, "loss": 1.7228, "learning_rate": 9.421022859172397e-06, "epoch": 0.8013919185623767, "percentage": 80.14, "elapsed_time": "2 days, 12:22:59", "remaining_time": "14:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7716, "total_steps": 9627, "loss": 1.6439, "learning_rate": 9.411492194679277e-06, "epoch": 0.801495793081957, "percentage": 80.15, "elapsed_time": "2 days, 12:23:30", "remaining_time": "14:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7717, "total_steps": 9627, "loss": 1.5571, "learning_rate": 9.401965852545636e-06, "epoch": 0.8015996676015373, "percentage": 80.16, "elapsed_time": "2 days, 12:24:02", "remaining_time": "14:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7718, "total_steps": 9627, "loss": 1.7649, "learning_rate": 9.39244383378594e-06, "epoch": 0.8017035421211177, "percentage": 80.17, "elapsed_time": "2 days, 12:24:32", "remaining_time": "14:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7719, "total_steps": 9627, "loss": 1.3555, "learning_rate": 9.38292613941425e-06, "epoch": 0.801807416640698, "percentage": 80.18, "elapsed_time": "2 days, 12:25:04", "remaining_time": "14:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7720, "total_steps": 9627, "loss": 1.6209, "learning_rate": 9.37341277044408e-06, "epoch": 0.8019112911602784, "percentage": 80.19, "elapsed_time": "2 days, 12:25:35", "remaining_time": "14:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7721, "total_steps": 9627, "loss": 1.3753, "learning_rate": 9.363903727888556e-06, "epoch": 0.8020151656798588, "percentage": 80.2, "elapsed_time": "2 days, 12:26:06", "remaining_time": "14:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7722, "total_steps": 9627, "loss": 1.4721, "learning_rate": 9.354399012760328e-06, "epoch": 0.802119040199439, "percentage": 80.21, "elapsed_time": "2 days, 12:26:39", "remaining_time": "14:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7723, "total_steps": 9627, "loss": 1.5033, "learning_rate": 9.34489862607153e-06, "epoch": 0.8022229147190194, "percentage": 80.22, "elapsed_time": "2 days, 12:27:11", "remaining_time": "14:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7724, "total_steps": 9627, "loss": 1.8149, "learning_rate": 9.335402568833923e-06, "epoch": 0.8023267892385998, "percentage": 80.23, "elapsed_time": "2 days, 12:27:41", "remaining_time": "14:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7725, "total_steps": 9627, "loss": 1.7166, "learning_rate": 9.325910842058733e-06, "epoch": 0.8024306637581802, "percentage": 80.24, "elapsed_time": "2 days, 12:28:12", "remaining_time": "14:53:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7726, "total_steps": 9627, "loss": 1.4822, "learning_rate": 9.316423446756788e-06, "epoch": 0.8025345382777604, "percentage": 80.25, "elapsed_time": "2 days, 12:28:43", "remaining_time": "14:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7727, "total_steps": 9627, "loss": 1.7386, "learning_rate": 9.306940383938395e-06, "epoch": 0.8026384127973408, "percentage": 80.26, "elapsed_time": "2 days, 12:29:15", "remaining_time": "14:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7728, "total_steps": 9627, "loss": 1.6013, "learning_rate": 9.297461654613415e-06, "epoch": 0.8027422873169212, "percentage": 80.27, "elapsed_time": "2 days, 12:29:47", "remaining_time": "14:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7729, "total_steps": 9627, "loss": 1.6137, "learning_rate": 9.28798725979131e-06, "epoch": 0.8028461618365015, "percentage": 80.28, "elapsed_time": "2 days, 12:30:17", "remaining_time": "14:51:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7730, "total_steps": 9627, "loss": 1.8171, "learning_rate": 9.278517200480963e-06, "epoch": 0.8029500363560819, "percentage": 80.3, "elapsed_time": "2 days, 12:30:49", "remaining_time": "14:51:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7731, "total_steps": 9627, "loss": 1.6836, "learning_rate": 9.26905147769091e-06, "epoch": 0.8030539108756622, "percentage": 80.31, "elapsed_time": "2 days, 12:31:20", "remaining_time": "14:50:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7732, "total_steps": 9627, "loss": 1.9295, "learning_rate": 9.25959009242916e-06, "epoch": 0.8031577853952425, "percentage": 80.32, "elapsed_time": "2 days, 12:31:51", "remaining_time": "14:50:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7733, "total_steps": 9627, "loss": 1.8385, "learning_rate": 9.25013304570328e-06, "epoch": 0.8032616599148229, "percentage": 80.33, "elapsed_time": "2 days, 12:32:23", "remaining_time": "14:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7734, "total_steps": 9627, "loss": 1.5867, "learning_rate": 9.24068033852037e-06, "epoch": 0.8033655344344033, "percentage": 80.34, "elapsed_time": "2 days, 12:32:53", "remaining_time": "14:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7735, "total_steps": 9627, "loss": 1.6309, "learning_rate": 9.231231971887066e-06, "epoch": 0.8034694089539836, "percentage": 80.35, "elapsed_time": "2 days, 12:33:25", "remaining_time": "14:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7736, "total_steps": 9627, "loss": 1.5253, "learning_rate": 9.221787946809552e-06, "epoch": 0.8035732834735639, "percentage": 80.36, "elapsed_time": "2 days, 12:33:56", "remaining_time": "14:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7737, "total_steps": 9627, "loss": 1.5669, "learning_rate": 9.212348264293519e-06, "epoch": 0.8036771579931443, "percentage": 80.37, "elapsed_time": "2 days, 12:34:27", "remaining_time": "14:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7738, "total_steps": 9627, "loss": 1.6559, "learning_rate": 9.202912925344276e-06, "epoch": 0.8037810325127246, "percentage": 80.38, "elapsed_time": "2 days, 12:34:58", "remaining_time": "14:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7739, "total_steps": 9627, "loss": 1.7244, "learning_rate": 9.19348193096654e-06, "epoch": 0.803884907032305, "percentage": 80.39, "elapsed_time": "2 days, 12:35:29", "remaining_time": "14:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7740, "total_steps": 9627, "loss": 1.5402, "learning_rate": 9.184055282164699e-06, "epoch": 0.8039887815518854, "percentage": 80.4, "elapsed_time": "2 days, 12:36:02", "remaining_time": "14:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7741, "total_steps": 9627, "loss": 1.6772, "learning_rate": 9.174632979942587e-06, "epoch": 0.8040926560714656, "percentage": 80.41, "elapsed_time": "2 days, 12:36:33", "remaining_time": "14:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7742, "total_steps": 9627, "loss": 1.7684, "learning_rate": 9.165215025303614e-06, "epoch": 0.804196530591046, "percentage": 80.42, "elapsed_time": "2 days, 12:37:03", "remaining_time": "14:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7743, "total_steps": 9627, "loss": 1.8452, "learning_rate": 9.15580141925072e-06, "epoch": 0.8043004051106264, "percentage": 80.43, "elapsed_time": "2 days, 12:37:35", "remaining_time": "14:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7744, "total_steps": 9627, "loss": 1.7204, "learning_rate": 9.146392162786377e-06, "epoch": 0.8044042796302067, "percentage": 80.44, "elapsed_time": "2 days, 12:38:06", "remaining_time": "14:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7745, "total_steps": 9627, "loss": 1.4458, "learning_rate": 9.136987256912594e-06, "epoch": 0.804508154149787, "percentage": 80.45, "elapsed_time": "2 days, 12:38:37", "remaining_time": "14:44:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7746, "total_steps": 9627, "loss": 1.7218, "learning_rate": 9.127586702630913e-06, "epoch": 0.8046120286693674, "percentage": 80.46, "elapsed_time": "2 days, 12:39:09", "remaining_time": "14:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7747, "total_steps": 9627, "loss": 1.7473, "learning_rate": 9.118190500942459e-06, "epoch": 0.8047159031889477, "percentage": 80.47, "elapsed_time": "2 days, 12:39:40", "remaining_time": "14:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7748, "total_steps": 9627, "loss": 1.6519, "learning_rate": 9.108798652847811e-06, "epoch": 0.8048197777085281, "percentage": 80.48, "elapsed_time": "2 days, 12:40:11", "remaining_time": "14:42:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7749, "total_steps": 9627, "loss": 1.5866, "learning_rate": 9.099411159347133e-06, "epoch": 0.8049236522281085, "percentage": 80.49, "elapsed_time": "2 days, 12:40:42", "remaining_time": "14:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7750, "total_steps": 9627, "loss": 1.8477, "learning_rate": 9.090028021440155e-06, "epoch": 0.8050275267476887, "percentage": 80.5, "elapsed_time": "2 days, 12:41:14", "remaining_time": "14:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7751, "total_steps": 9627, "loss": 1.6118, "learning_rate": 9.080649240126054e-06, "epoch": 0.8051314012672691, "percentage": 80.51, "elapsed_time": "2 days, 12:41:46", "remaining_time": "14:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7752, "total_steps": 9627, "loss": 1.5275, "learning_rate": 9.07127481640364e-06, "epoch": 0.8052352757868495, "percentage": 80.52, "elapsed_time": "2 days, 12:42:17", "remaining_time": "14:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7753, "total_steps": 9627, "loss": 1.6641, "learning_rate": 9.061904751271193e-06, "epoch": 0.8053391503064299, "percentage": 80.53, "elapsed_time": "2 days, 12:42:48", "remaining_time": "14:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7754, "total_steps": 9627, "loss": 1.7141, "learning_rate": 9.052539045726583e-06, "epoch": 0.8054430248260102, "percentage": 80.54, "elapsed_time": "2 days, 12:43:18", "remaining_time": "14:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7755, "total_steps": 9627, "loss": 1.6593, "learning_rate": 9.043177700767148e-06, "epoch": 0.8055468993455905, "percentage": 80.55, "elapsed_time": "2 days, 12:43:51", "remaining_time": "14:39:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7756, "total_steps": 9627, "loss": 1.6844, "learning_rate": 9.033820717389802e-06, "epoch": 0.8056507738651709, "percentage": 80.57, "elapsed_time": "2 days, 12:44:22", "remaining_time": "14:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7757, "total_steps": 9627, "loss": 1.6062, "learning_rate": 9.024468096591022e-06, "epoch": 0.8057546483847512, "percentage": 80.58, "elapsed_time": "2 days, 12:44:52", "remaining_time": "14:38:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7758, "total_steps": 9627, "loss": 1.6187, "learning_rate": 9.015119839366748e-06, "epoch": 0.8058585229043316, "percentage": 80.59, "elapsed_time": "2 days, 12:45:25", "remaining_time": "14:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7759, "total_steps": 9627, "loss": 1.6813, "learning_rate": 9.005775946712524e-06, "epoch": 0.805962397423912, "percentage": 80.6, "elapsed_time": "2 days, 12:45:56", "remaining_time": "14:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7760, "total_steps": 9627, "loss": 1.8797, "learning_rate": 8.9964364196234e-06, "epoch": 0.8060662719434922, "percentage": 80.61, "elapsed_time": "2 days, 12:46:26", "remaining_time": "14:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7761, "total_steps": 9627, "loss": 1.6896, "learning_rate": 8.987101259093955e-06, "epoch": 0.8061701464630726, "percentage": 80.62, "elapsed_time": "2 days, 12:46:57", "remaining_time": "14:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7762, "total_steps": 9627, "loss": 1.574, "learning_rate": 8.977770466118313e-06, "epoch": 0.806274020982653, "percentage": 80.63, "elapsed_time": "2 days, 12:47:29", "remaining_time": "14:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7763, "total_steps": 9627, "loss": 1.5353, "learning_rate": 8.968444041690132e-06, "epoch": 0.8063778955022333, "percentage": 80.64, "elapsed_time": "2 days, 12:47:59", "remaining_time": "14:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7764, "total_steps": 9627, "loss": 1.494, "learning_rate": 8.959121986802599e-06, "epoch": 0.8064817700218136, "percentage": 80.65, "elapsed_time": "2 days, 12:48:31", "remaining_time": "14:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7765, "total_steps": 9627, "loss": 1.6712, "learning_rate": 8.949804302448433e-06, "epoch": 0.806585644541394, "percentage": 80.66, "elapsed_time": "2 days, 12:49:03", "remaining_time": "14:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7766, "total_steps": 9627, "loss": 1.6931, "learning_rate": 8.940490989619932e-06, "epoch": 0.8066895190609743, "percentage": 80.67, "elapsed_time": "2 days, 12:49:33", "remaining_time": "14:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7767, "total_steps": 9627, "loss": 1.616, "learning_rate": 8.931182049308833e-06, "epoch": 0.8067933935805547, "percentage": 80.68, "elapsed_time": "2 days, 12:50:05", "remaining_time": "14:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7768, "total_steps": 9627, "loss": 1.5328, "learning_rate": 8.921877482506518e-06, "epoch": 0.8068972681001351, "percentage": 80.69, "elapsed_time": "2 days, 12:50:35", "remaining_time": "14:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7769, "total_steps": 9627, "loss": 1.5393, "learning_rate": 8.912577290203822e-06, "epoch": 0.8070011426197153, "percentage": 80.7, "elapsed_time": "2 days, 12:51:07", "remaining_time": "14:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7770, "total_steps": 9627, "loss": 1.5114, "learning_rate": 8.90328147339115e-06, "epoch": 0.8071050171392957, "percentage": 80.71, "elapsed_time": "2 days, 12:51:39", "remaining_time": "14:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7771, "total_steps": 9627, "loss": 1.6231, "learning_rate": 8.893990033058442e-06, "epoch": 0.8072088916588761, "percentage": 80.72, "elapsed_time": "2 days, 12:52:09", "remaining_time": "14:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7772, "total_steps": 9627, "loss": 1.6152, "learning_rate": 8.884702970195152e-06, "epoch": 0.8073127661784564, "percentage": 80.73, "elapsed_time": "2 days, 12:52:40", "remaining_time": "14:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7773, "total_steps": 9627, "loss": 1.7177, "learning_rate": 8.875420285790281e-06, "epoch": 0.8074166406980368, "percentage": 80.74, "elapsed_time": "2 days, 12:53:13", "remaining_time": "14:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7774, "total_steps": 9627, "loss": 1.6195, "learning_rate": 8.866141980832354e-06, "epoch": 0.8075205152176171, "percentage": 80.75, "elapsed_time": "2 days, 12:53:44", "remaining_time": "14:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7775, "total_steps": 9627, "loss": 1.4594, "learning_rate": 8.856868056309475e-06, "epoch": 0.8076243897371974, "percentage": 80.76, "elapsed_time": "2 days, 12:54:15", "remaining_time": "14:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7776, "total_steps": 9627, "loss": 1.7521, "learning_rate": 8.84759851320921e-06, "epoch": 0.8077282642567778, "percentage": 80.77, "elapsed_time": "2 days, 12:54:46", "remaining_time": "14:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7777, "total_steps": 9627, "loss": 1.5742, "learning_rate": 8.838333352518685e-06, "epoch": 0.8078321387763582, "percentage": 80.78, "elapsed_time": "2 days, 12:55:17", "remaining_time": "14:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7778, "total_steps": 9627, "loss": 1.6479, "learning_rate": 8.829072575224601e-06, "epoch": 0.8079360132959386, "percentage": 80.79, "elapsed_time": "2 days, 12:55:49", "remaining_time": "14:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7779, "total_steps": 9627, "loss": 1.4088, "learning_rate": 8.819816182313139e-06, "epoch": 0.8080398878155188, "percentage": 80.8, "elapsed_time": "2 days, 12:56:19", "remaining_time": "14:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7780, "total_steps": 9627, "loss": 1.5949, "learning_rate": 8.810564174770043e-06, "epoch": 0.8081437623350992, "percentage": 80.81, "elapsed_time": "2 days, 12:56:50", "remaining_time": "14:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7781, "total_steps": 9627, "loss": 1.6899, "learning_rate": 8.801316553580551e-06, "epoch": 0.8082476368546796, "percentage": 80.82, "elapsed_time": "2 days, 12:57:22", "remaining_time": "14:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7782, "total_steps": 9627, "loss": 1.5462, "learning_rate": 8.792073319729516e-06, "epoch": 0.8083515113742599, "percentage": 80.84, "elapsed_time": "2 days, 12:57:54", "remaining_time": "14:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7783, "total_steps": 9627, "loss": 1.8192, "learning_rate": 8.782834474201217e-06, "epoch": 0.8084553858938403, "percentage": 80.85, "elapsed_time": "2 days, 12:58:24", "remaining_time": "14:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7784, "total_steps": 9627, "loss": 1.5268, "learning_rate": 8.773600017979538e-06, "epoch": 0.8085592604134206, "percentage": 80.86, "elapsed_time": "2 days, 12:58:55", "remaining_time": "14:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7785, "total_steps": 9627, "loss": 1.7217, "learning_rate": 8.764369952047896e-06, "epoch": 0.8086631349330009, "percentage": 80.87, "elapsed_time": "2 days, 12:59:26", "remaining_time": "14:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7786, "total_steps": 9627, "loss": 1.7892, "learning_rate": 8.755144277389183e-06, "epoch": 0.8087670094525813, "percentage": 80.88, "elapsed_time": "2 days, 12:59:56", "remaining_time": "14:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7787, "total_steps": 9627, "loss": 1.5297, "learning_rate": 8.745922994985895e-06, "epoch": 0.8088708839721617, "percentage": 80.89, "elapsed_time": "2 days, 13:00:29", "remaining_time": "14:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7788, "total_steps": 9627, "loss": 1.7274, "learning_rate": 8.736706105820008e-06, "epoch": 0.8089747584917419, "percentage": 80.9, "elapsed_time": "2 days, 13:01:00", "remaining_time": "14:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7789, "total_steps": 9627, "loss": 1.597, "learning_rate": 8.727493610873062e-06, "epoch": 0.8090786330113223, "percentage": 80.91, "elapsed_time": "2 days, 13:01:30", "remaining_time": "14:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7790, "total_steps": 9627, "loss": 1.7429, "learning_rate": 8.718285511126106e-06, "epoch": 0.8091825075309027, "percentage": 80.92, "elapsed_time": "2 days, 13:02:02", "remaining_time": "14:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7791, "total_steps": 9627, "loss": 1.6746, "learning_rate": 8.709081807559732e-06, "epoch": 0.809286382050483, "percentage": 80.93, "elapsed_time": "2 days, 13:02:33", "remaining_time": "14:23:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7792, "total_steps": 9627, "loss": 1.7955, "learning_rate": 8.699882501154067e-06, "epoch": 0.8093902565700634, "percentage": 80.94, "elapsed_time": "2 days, 13:03:04", "remaining_time": "14:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7793, "total_steps": 9627, "loss": 1.741, "learning_rate": 8.690687592888747e-06, "epoch": 0.8094941310896437, "percentage": 80.95, "elapsed_time": "2 days, 13:03:35", "remaining_time": "14:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7794, "total_steps": 9627, "loss": 1.5883, "learning_rate": 8.681497083742995e-06, "epoch": 0.809598005609224, "percentage": 80.96, "elapsed_time": "2 days, 13:04:05", "remaining_time": "14:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7795, "total_steps": 9627, "loss": 1.7313, "learning_rate": 8.672310974695485e-06, "epoch": 0.8097018801288044, "percentage": 80.97, "elapsed_time": "2 days, 13:04:36", "remaining_time": "14:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7796, "total_steps": 9627, "loss": 1.6054, "learning_rate": 8.663129266724501e-06, "epoch": 0.8098057546483848, "percentage": 80.98, "elapsed_time": "2 days, 13:05:07", "remaining_time": "14:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7797, "total_steps": 9627, "loss": 1.9036, "learning_rate": 8.65395196080781e-06, "epoch": 0.809909629167965, "percentage": 80.99, "elapsed_time": "2 days, 13:05:38", "remaining_time": "14:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7798, "total_steps": 9627, "loss": 1.7245, "learning_rate": 8.644779057922725e-06, "epoch": 0.8100135036875454, "percentage": 81.0, "elapsed_time": "2 days, 13:06:10", "remaining_time": "14:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7799, "total_steps": 9627, "loss": 1.6524, "learning_rate": 8.635610559046087e-06, "epoch": 0.8101173782071258, "percentage": 81.01, "elapsed_time": "2 days, 13:06:40", "remaining_time": "14:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7800, "total_steps": 9627, "loss": 1.6953, "learning_rate": 8.62644646515427e-06, "epoch": 0.8102212527267061, "percentage": 81.02, "elapsed_time": "2 days, 13:07:11", "remaining_time": "14:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7801, "total_steps": 9627, "loss": 1.5696, "learning_rate": 8.617286777223177e-06, "epoch": 0.8103251272462865, "percentage": 81.03, "elapsed_time": "2 days, 13:07:42", "remaining_time": "14:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7802, "total_steps": 9627, "loss": 1.5954, "learning_rate": 8.608131496228228e-06, "epoch": 0.8104290017658669, "percentage": 81.04, "elapsed_time": "2 days, 13:08:14", "remaining_time": "14:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7803, "total_steps": 9627, "loss": 2.0503, "learning_rate": 8.598980623144427e-06, "epoch": 0.8105328762854472, "percentage": 81.05, "elapsed_time": "2 days, 13:08:44", "remaining_time": "14:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7804, "total_steps": 9627, "loss": 1.8498, "learning_rate": 8.589834158946253e-06, "epoch": 0.8106367508050275, "percentage": 81.06, "elapsed_time": "2 days, 13:09:15", "remaining_time": "14:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7805, "total_steps": 9627, "loss": 1.6659, "learning_rate": 8.580692104607712e-06, "epoch": 0.8107406253246079, "percentage": 81.07, "elapsed_time": "2 days, 13:09:46", "remaining_time": "14:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7806, "total_steps": 9627, "loss": 1.625, "learning_rate": 8.571554461102389e-06, "epoch": 0.8108444998441883, "percentage": 81.08, "elapsed_time": "2 days, 13:10:17", "remaining_time": "14:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7807, "total_steps": 9627, "loss": 1.7467, "learning_rate": 8.562421229403356e-06, "epoch": 0.8109483743637685, "percentage": 81.09, "elapsed_time": "2 days, 13:10:48", "remaining_time": "14:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7808, "total_steps": 9627, "loss": 1.6585, "learning_rate": 8.553292410483243e-06, "epoch": 0.8110522488833489, "percentage": 81.11, "elapsed_time": "2 days, 13:11:19", "remaining_time": "14:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7809, "total_steps": 9627, "loss": 1.6903, "learning_rate": 8.544168005314191e-06, "epoch": 0.8111561234029293, "percentage": 81.12, "elapsed_time": "2 days, 13:11:50", "remaining_time": "14:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7810, "total_steps": 9627, "loss": 1.6525, "learning_rate": 8.535048014867875e-06, "epoch": 0.8112599979225096, "percentage": 81.13, "elapsed_time": "2 days, 13:12:20", "remaining_time": "14:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7811, "total_steps": 9627, "loss": 1.4948, "learning_rate": 8.525932440115509e-06, "epoch": 0.81136387244209, "percentage": 81.14, "elapsed_time": "2 days, 13:12:51", "remaining_time": "14:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7812, "total_steps": 9627, "loss": 1.5873, "learning_rate": 8.516821282027814e-06, "epoch": 0.8114677469616703, "percentage": 81.15, "elapsed_time": "2 days, 13:13:22", "remaining_time": "14:13:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7813, "total_steps": 9627, "loss": 1.5856, "learning_rate": 8.507714541575096e-06, "epoch": 0.8115716214812506, "percentage": 81.16, "elapsed_time": "2 days, 13:13:53", "remaining_time": "14:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7814, "total_steps": 9627, "loss": 1.6061, "learning_rate": 8.498612219727104e-06, "epoch": 0.811675496000831, "percentage": 81.17, "elapsed_time": "2 days, 13:14:24", "remaining_time": "14:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7815, "total_steps": 9627, "loss": 1.6078, "learning_rate": 8.4895143174532e-06, "epoch": 0.8117793705204114, "percentage": 81.18, "elapsed_time": "2 days, 13:14:55", "remaining_time": "14:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7816, "total_steps": 9627, "loss": 1.6971, "learning_rate": 8.480420835722224e-06, "epoch": 0.8118832450399917, "percentage": 81.19, "elapsed_time": "2 days, 13:15:26", "remaining_time": "14:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7817, "total_steps": 9627, "loss": 1.7409, "learning_rate": 8.471331775502566e-06, "epoch": 0.811987119559572, "percentage": 81.2, "elapsed_time": "2 days, 13:15:56", "remaining_time": "14:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7818, "total_steps": 9627, "loss": 1.6476, "learning_rate": 8.462247137762142e-06, "epoch": 0.8120909940791524, "percentage": 81.21, "elapsed_time": "2 days, 13:16:27", "remaining_time": "14:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7819, "total_steps": 9627, "loss": 1.6937, "learning_rate": 8.453166923468387e-06, "epoch": 0.8121948685987327, "percentage": 81.22, "elapsed_time": "2 days, 13:16:59", "remaining_time": "14:10:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7820, "total_steps": 9627, "loss": 1.7928, "learning_rate": 8.444091133588273e-06, "epoch": 0.8122987431183131, "percentage": 81.23, "elapsed_time": "2 days, 13:17:30", "remaining_time": "14:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7821, "total_steps": 9627, "loss": 1.6076, "learning_rate": 8.435019769088298e-06, "epoch": 0.8124026176378935, "percentage": 81.24, "elapsed_time": "2 days, 13:18:00", "remaining_time": "14:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7822, "total_steps": 9627, "loss": 1.8033, "learning_rate": 8.42595283093452e-06, "epoch": 0.8125064921574737, "percentage": 81.25, "elapsed_time": "2 days, 13:18:32", "remaining_time": "14:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7823, "total_steps": 9627, "loss": 1.613, "learning_rate": 8.416890320092451e-06, "epoch": 0.8126103666770541, "percentage": 81.26, "elapsed_time": "2 days, 13:19:02", "remaining_time": "14:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7824, "total_steps": 9627, "loss": 1.8238, "learning_rate": 8.407832237527214e-06, "epoch": 0.8127142411966345, "percentage": 81.27, "elapsed_time": "2 days, 13:19:34", "remaining_time": "14:07:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7825, "total_steps": 9627, "loss": 1.6164, "learning_rate": 8.398778584203414e-06, "epoch": 0.8128181157162148, "percentage": 81.28, "elapsed_time": "2 days, 13:20:05", "remaining_time": "14:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7826, "total_steps": 9627, "loss": 1.6903, "learning_rate": 8.389729361085192e-06, "epoch": 0.8129219902357951, "percentage": 81.29, "elapsed_time": "2 days, 13:20:36", "remaining_time": "14:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7827, "total_steps": 9627, "loss": 1.5846, "learning_rate": 8.380684569136222e-06, "epoch": 0.8130258647553755, "percentage": 81.3, "elapsed_time": "2 days, 13:21:06", "remaining_time": "14:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7828, "total_steps": 9627, "loss": 1.4752, "learning_rate": 8.371644209319702e-06, "epoch": 0.8131297392749558, "percentage": 81.31, "elapsed_time": "2 days, 13:21:39", "remaining_time": "14:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7829, "total_steps": 9627, "loss": 1.6837, "learning_rate": 8.362608282598355e-06, "epoch": 0.8132336137945362, "percentage": 81.32, "elapsed_time": "2 days, 13:22:08", "remaining_time": "14:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7830, "total_steps": 9627, "loss": 1.6555, "learning_rate": 8.353576789934436e-06, "epoch": 0.8133374883141166, "percentage": 81.33, "elapsed_time": "2 days, 13:22:39", "remaining_time": "14:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7831, "total_steps": 9627, "loss": 1.7406, "learning_rate": 8.344549732289741e-06, "epoch": 0.813441362833697, "percentage": 81.34, "elapsed_time": "2 days, 13:23:10", "remaining_time": "14:04:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7832, "total_steps": 9627, "loss": 1.7404, "learning_rate": 8.33552711062559e-06, "epoch": 0.8135452373532772, "percentage": 81.35, "elapsed_time": "2 days, 13:23:41", "remaining_time": "14:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7833, "total_steps": 9627, "loss": 1.4813, "learning_rate": 8.326508925902781e-06, "epoch": 0.8136491118728576, "percentage": 81.36, "elapsed_time": "2 days, 13:24:14", "remaining_time": "14:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7834, "total_steps": 9627, "loss": 1.3518, "learning_rate": 8.31749517908172e-06, "epoch": 0.813752986392438, "percentage": 81.38, "elapsed_time": "2 days, 13:24:45", "remaining_time": "14:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7835, "total_steps": 9627, "loss": 1.723, "learning_rate": 8.308485871122284e-06, "epoch": 0.8138568609120183, "percentage": 81.39, "elapsed_time": "2 days, 13:25:15", "remaining_time": "14:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7836, "total_steps": 9627, "loss": 1.8044, "learning_rate": 8.2994810029839e-06, "epoch": 0.8139607354315986, "percentage": 81.4, "elapsed_time": "2 days, 13:25:47", "remaining_time": "14:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7837, "total_steps": 9627, "loss": 1.6315, "learning_rate": 8.290480575625508e-06, "epoch": 0.814064609951179, "percentage": 81.41, "elapsed_time": "2 days, 13:26:17", "remaining_time": "14:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7838, "total_steps": 9627, "loss": 1.6415, "learning_rate": 8.28148459000559e-06, "epoch": 0.8141684844707593, "percentage": 81.42, "elapsed_time": "2 days, 13:26:50", "remaining_time": "14:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7839, "total_steps": 9627, "loss": 1.7884, "learning_rate": 8.272493047082147e-06, "epoch": 0.8142723589903397, "percentage": 81.43, "elapsed_time": "2 days, 13:27:21", "remaining_time": "14:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7840, "total_steps": 9627, "loss": 1.6999, "learning_rate": 8.263505947812694e-06, "epoch": 0.8143762335099201, "percentage": 81.44, "elapsed_time": "2 days, 13:27:51", "remaining_time": "14:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7841, "total_steps": 9627, "loss": 1.7044, "learning_rate": 8.254523293154325e-06, "epoch": 0.8144801080295003, "percentage": 81.45, "elapsed_time": "2 days, 13:28:23", "remaining_time": "14:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7842, "total_steps": 9627, "loss": 1.6382, "learning_rate": 8.245545084063572e-06, "epoch": 0.8145839825490807, "percentage": 81.46, "elapsed_time": "2 days, 13:28:53", "remaining_time": "13:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7843, "total_steps": 9627, "loss": 1.657, "learning_rate": 8.236571321496584e-06, "epoch": 0.8146878570686611, "percentage": 81.47, "elapsed_time": "2 days, 13:29:25", "remaining_time": "13:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7844, "total_steps": 9627, "loss": 1.6226, "learning_rate": 8.227602006408986e-06, "epoch": 0.8147917315882414, "percentage": 81.48, "elapsed_time": "2 days, 13:29:55", "remaining_time": "13:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7845, "total_steps": 9627, "loss": 1.6346, "learning_rate": 8.218637139755931e-06, "epoch": 0.8148956061078217, "percentage": 81.49, "elapsed_time": "2 days, 13:30:26", "remaining_time": "13:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7846, "total_steps": 9627, "loss": 1.6784, "learning_rate": 8.209676722492116e-06, "epoch": 0.8149994806274021, "percentage": 81.5, "elapsed_time": "2 days, 13:30:58", "remaining_time": "13:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7847, "total_steps": 9627, "loss": 1.6905, "learning_rate": 8.200720755571755e-06, "epoch": 0.8151033551469824, "percentage": 81.51, "elapsed_time": "2 days, 13:31:29", "remaining_time": "13:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7848, "total_steps": 9627, "loss": 1.8831, "learning_rate": 8.191769239948588e-06, "epoch": 0.8152072296665628, "percentage": 81.52, "elapsed_time": "2 days, 13:31:59", "remaining_time": "13:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7849, "total_steps": 9627, "loss": 1.6919, "learning_rate": 8.182822176575865e-06, "epoch": 0.8153111041861432, "percentage": 81.53, "elapsed_time": "2 days, 13:32:31", "remaining_time": "13:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7850, "total_steps": 9627, "loss": 1.6247, "learning_rate": 8.173879566406418e-06, "epoch": 0.8154149787057234, "percentage": 81.54, "elapsed_time": "2 days, 13:33:02", "remaining_time": "13:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7851, "total_steps": 9627, "loss": 1.662, "learning_rate": 8.164941410392519e-06, "epoch": 0.8155188532253038, "percentage": 81.55, "elapsed_time": "2 days, 13:33:33", "remaining_time": "13:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7852, "total_steps": 9627, "loss": 1.5751, "learning_rate": 8.15600770948604e-06, "epoch": 0.8156227277448842, "percentage": 81.56, "elapsed_time": "2 days, 13:34:04", "remaining_time": "13:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7853, "total_steps": 9627, "loss": 1.5519, "learning_rate": 8.147078464638346e-06, "epoch": 0.8157266022644645, "percentage": 81.57, "elapsed_time": "2 days, 13:34:35", "remaining_time": "13:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7854, "total_steps": 9627, "loss": 1.7116, "learning_rate": 8.138153676800336e-06, "epoch": 0.8158304767840449, "percentage": 81.58, "elapsed_time": "2 days, 13:35:06", "remaining_time": "13:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7855, "total_steps": 9627, "loss": 1.5981, "learning_rate": 8.129233346922422e-06, "epoch": 0.8159343513036252, "percentage": 81.59, "elapsed_time": "2 days, 13:35:36", "remaining_time": "13:53:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7856, "total_steps": 9627, "loss": 1.7425, "learning_rate": 8.120317475954536e-06, "epoch": 0.8160382258232056, "percentage": 81.6, "elapsed_time": "2 days, 13:36:08", "remaining_time": "13:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7857, "total_steps": 9627, "loss": 1.5632, "learning_rate": 8.111406064846194e-06, "epoch": 0.8161421003427859, "percentage": 81.61, "elapsed_time": "2 days, 13:36:38", "remaining_time": "13:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7858, "total_steps": 9627, "loss": 1.5863, "learning_rate": 8.102499114546335e-06, "epoch": 0.8162459748623663, "percentage": 81.62, "elapsed_time": "2 days, 13:37:08", "remaining_time": "13:52:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7859, "total_steps": 9627, "loss": 1.7937, "learning_rate": 8.093596626003519e-06, "epoch": 0.8163498493819467, "percentage": 81.63, "elapsed_time": "2 days, 13:37:41", "remaining_time": "13:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7860, "total_steps": 9627, "loss": 1.745, "learning_rate": 8.084698600165796e-06, "epoch": 0.8164537239015269, "percentage": 81.65, "elapsed_time": "2 days, 13:38:11", "remaining_time": "13:51:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7861, "total_steps": 9627, "loss": 1.528, "learning_rate": 8.075805037980688e-06, "epoch": 0.8165575984211073, "percentage": 81.66, "elapsed_time": "2 days, 13:38:42", "remaining_time": "13:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7862, "total_steps": 9627, "loss": 1.6715, "learning_rate": 8.066915940395341e-06, "epoch": 0.8166614729406877, "percentage": 81.67, "elapsed_time": "2 days, 13:39:14", "remaining_time": "13:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7863, "total_steps": 9627, "loss": 1.5871, "learning_rate": 8.058031308356357e-06, "epoch": 0.816765347460268, "percentage": 81.68, "elapsed_time": "2 days, 13:39:44", "remaining_time": "13:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7864, "total_steps": 9627, "loss": 1.8095, "learning_rate": 8.049151142809874e-06, "epoch": 0.8168692219798483, "percentage": 81.69, "elapsed_time": "2 days, 13:40:14", "remaining_time": "13:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7865, "total_steps": 9627, "loss": 1.712, "learning_rate": 8.040275444701567e-06, "epoch": 0.8169730964994287, "percentage": 81.7, "elapsed_time": "2 days, 13:40:45", "remaining_time": "13:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7866, "total_steps": 9627, "loss": 1.8676, "learning_rate": 8.031404214976628e-06, "epoch": 0.817076971019009, "percentage": 81.71, "elapsed_time": "2 days, 13:41:16", "remaining_time": "13:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7867, "total_steps": 9627, "loss": 1.5683, "learning_rate": 8.02253745457977e-06, "epoch": 0.8171808455385894, "percentage": 81.72, "elapsed_time": "2 days, 13:41:46", "remaining_time": "13:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7868, "total_steps": 9627, "loss": 1.6236, "learning_rate": 8.013675164455225e-06, "epoch": 0.8172847200581698, "percentage": 81.73, "elapsed_time": "2 days, 13:42:19", "remaining_time": "13:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7869, "total_steps": 9627, "loss": 1.677, "learning_rate": 8.004817345546794e-06, "epoch": 0.81738859457775, "percentage": 81.74, "elapsed_time": "2 days, 13:42:50", "remaining_time": "13:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7870, "total_steps": 9627, "loss": 1.6949, "learning_rate": 7.995963998797717e-06, "epoch": 0.8174924690973304, "percentage": 81.75, "elapsed_time": "2 days, 13:43:20", "remaining_time": "13:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7871, "total_steps": 9627, "loss": 1.6774, "learning_rate": 7.98711512515084e-06, "epoch": 0.8175963436169108, "percentage": 81.76, "elapsed_time": "2 days, 13:43:50", "remaining_time": "13:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7872, "total_steps": 9627, "loss": 1.4368, "learning_rate": 7.978270725548493e-06, "epoch": 0.8177002181364911, "percentage": 81.77, "elapsed_time": "2 days, 13:44:22", "remaining_time": "13:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7873, "total_steps": 9627, "loss": 1.6731, "learning_rate": 7.969430800932526e-06, "epoch": 0.8178040926560715, "percentage": 81.78, "elapsed_time": "2 days, 13:44:53", "remaining_time": "13:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7874, "total_steps": 9627, "loss": 1.7251, "learning_rate": 7.960595352244332e-06, "epoch": 0.8179079671756518, "percentage": 81.79, "elapsed_time": "2 days, 13:45:23", "remaining_time": "13:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7875, "total_steps": 9627, "loss": 1.8268, "learning_rate": 7.951764380424808e-06, "epoch": 0.8180118416952321, "percentage": 81.8, "elapsed_time": "2 days, 13:45:54", "remaining_time": "13:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7876, "total_steps": 9627, "loss": 1.4004, "learning_rate": 7.942937886414392e-06, "epoch": 0.8181157162148125, "percentage": 81.81, "elapsed_time": "2 days, 13:46:25", "remaining_time": "13:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7877, "total_steps": 9627, "loss": 1.6694, "learning_rate": 7.934115871153025e-06, "epoch": 0.8182195907343929, "percentage": 81.82, "elapsed_time": "2 days, 13:46:56", "remaining_time": "13:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7878, "total_steps": 9627, "loss": 1.5698, "learning_rate": 7.925298335580211e-06, "epoch": 0.8183234652539731, "percentage": 81.83, "elapsed_time": "2 days, 13:47:28", "remaining_time": "13:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7879, "total_steps": 9627, "loss": 1.6886, "learning_rate": 7.916485280634906e-06, "epoch": 0.8184273397735535, "percentage": 81.84, "elapsed_time": "2 days, 13:47:58", "remaining_time": "13:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7880, "total_steps": 9627, "loss": 1.8019, "learning_rate": 7.907676707255668e-06, "epoch": 0.8185312142931339, "percentage": 81.85, "elapsed_time": "2 days, 13:48:30", "remaining_time": "13:42:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7881, "total_steps": 9627, "loss": 1.5613, "learning_rate": 7.898872616380526e-06, "epoch": 0.8186350888127143, "percentage": 81.86, "elapsed_time": "2 days, 13:49:00", "remaining_time": "13:41:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7882, "total_steps": 9627, "loss": 1.6753, "learning_rate": 7.890073008947047e-06, "epoch": 0.8187389633322946, "percentage": 81.87, "elapsed_time": "2 days, 13:49:32", "remaining_time": "13:41:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7883, "total_steps": 9627, "loss": 1.4869, "learning_rate": 7.881277885892324e-06, "epoch": 0.818842837851875, "percentage": 81.88, "elapsed_time": "2 days, 13:50:02", "remaining_time": "13:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7884, "total_steps": 9627, "loss": 1.641, "learning_rate": 7.87248724815296e-06, "epoch": 0.8189467123714553, "percentage": 81.89, "elapsed_time": "2 days, 13:50:33", "remaining_time": "13:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7885, "total_steps": 9627, "loss": 1.708, "learning_rate": 7.863701096665116e-06, "epoch": 0.8190505868910356, "percentage": 81.91, "elapsed_time": "2 days, 13:51:05", "remaining_time": "13:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7886, "total_steps": 9627, "loss": 1.545, "learning_rate": 7.854919432364406e-06, "epoch": 0.819154461410616, "percentage": 81.92, "elapsed_time": "2 days, 13:51:34", "remaining_time": "13:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7887, "total_steps": 9627, "loss": 1.6084, "learning_rate": 7.846142256186046e-06, "epoch": 0.8192583359301964, "percentage": 81.93, "elapsed_time": "2 days, 13:52:07", "remaining_time": "13:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7888, "total_steps": 9627, "loss": 1.4237, "learning_rate": 7.837369569064734e-06, "epoch": 0.8193622104497766, "percentage": 81.94, "elapsed_time": "2 days, 13:52:37", "remaining_time": "13:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7889, "total_steps": 9627, "loss": 1.7202, "learning_rate": 7.828601371934657e-06, "epoch": 0.819466084969357, "percentage": 81.95, "elapsed_time": "2 days, 13:53:08", "remaining_time": "13:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7890, "total_steps": 9627, "loss": 1.8862, "learning_rate": 7.819837665729596e-06, "epoch": 0.8195699594889374, "percentage": 81.96, "elapsed_time": "2 days, 13:53:40", "remaining_time": "13:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7891, "total_steps": 9627, "loss": 1.776, "learning_rate": 7.811078451382808e-06, "epoch": 0.8196738340085177, "percentage": 81.97, "elapsed_time": "2 days, 13:54:09", "remaining_time": "13:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7892, "total_steps": 9627, "loss": 1.7542, "learning_rate": 7.802323729827077e-06, "epoch": 0.8197777085280981, "percentage": 81.98, "elapsed_time": "2 days, 13:54:41", "remaining_time": "13:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7893, "total_steps": 9627, "loss": 1.3346, "learning_rate": 7.79357350199471e-06, "epoch": 0.8198815830476784, "percentage": 81.99, "elapsed_time": "2 days, 13:55:11", "remaining_time": "13:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7894, "total_steps": 9627, "loss": 1.6569, "learning_rate": 7.784827768817548e-06, "epoch": 0.8199854575672587, "percentage": 82.0, "elapsed_time": "2 days, 13:55:42", "remaining_time": "13:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7895, "total_steps": 9627, "loss": 1.5361, "learning_rate": 7.77608653122694e-06, "epoch": 0.8200893320868391, "percentage": 82.01, "elapsed_time": "2 days, 13:56:14", "remaining_time": "13:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7896, "total_steps": 9627, "loss": 1.5803, "learning_rate": 7.767349790153738e-06, "epoch": 0.8201932066064195, "percentage": 82.02, "elapsed_time": "2 days, 13:56:44", "remaining_time": "13:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7897, "total_steps": 9627, "loss": 1.6642, "learning_rate": 7.758617546528386e-06, "epoch": 0.8202970811259997, "percentage": 82.03, "elapsed_time": "2 days, 13:57:14", "remaining_time": "13:34:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7898, "total_steps": 9627, "loss": 1.8093, "learning_rate": 7.74988980128074e-06, "epoch": 0.8204009556455801, "percentage": 82.04, "elapsed_time": "2 days, 13:57:46", "remaining_time": "13:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7899, "total_steps": 9627, "loss": 1.7515, "learning_rate": 7.741166555340284e-06, "epoch": 0.8205048301651605, "percentage": 82.05, "elapsed_time": "2 days, 13:58:17", "remaining_time": "13:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7900, "total_steps": 9627, "loss": 1.6826, "learning_rate": 7.732447809635956e-06, "epoch": 0.8206087046847408, "percentage": 82.06, "elapsed_time": "2 days, 13:58:47", "remaining_time": "13:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7901, "total_steps": 9627, "loss": 1.6249, "learning_rate": 7.723733565096236e-06, "epoch": 0.8207125792043212, "percentage": 82.07, "elapsed_time": "2 days, 13:59:19", "remaining_time": "13:32:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7902, "total_steps": 9627, "loss": 1.563, "learning_rate": 7.715023822649126e-06, "epoch": 0.8208164537239016, "percentage": 82.08, "elapsed_time": "2 days, 13:59:49", "remaining_time": "13:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7903, "total_steps": 9627, "loss": 1.787, "learning_rate": 7.706318583222144e-06, "epoch": 0.8209203282434818, "percentage": 82.09, "elapsed_time": "2 days, 14:00:20", "remaining_time": "13:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7904, "total_steps": 9627, "loss": 1.6397, "learning_rate": 7.697617847742328e-06, "epoch": 0.8210242027630622, "percentage": 82.1, "elapsed_time": "2 days, 14:00:52", "remaining_time": "13:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7905, "total_steps": 9627, "loss": 1.6617, "learning_rate": 7.688921617136224e-06, "epoch": 0.8211280772826426, "percentage": 82.11, "elapsed_time": "2 days, 14:01:22", "remaining_time": "13:30:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7906, "total_steps": 9627, "loss": 1.5171, "learning_rate": 7.68022989232996e-06, "epoch": 0.8212319518022229, "percentage": 82.12, "elapsed_time": "2 days, 14:01:53", "remaining_time": "13:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7907, "total_steps": 9627, "loss": 1.7494, "learning_rate": 7.671542674249077e-06, "epoch": 0.8213358263218032, "percentage": 82.13, "elapsed_time": "2 days, 14:02:23", "remaining_time": "13:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7908, "total_steps": 9627, "loss": 1.6006, "learning_rate": 7.662859963818737e-06, "epoch": 0.8214397008413836, "percentage": 82.14, "elapsed_time": "2 days, 14:02:56", "remaining_time": "13:29:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7909, "total_steps": 9627, "loss": 1.4621, "learning_rate": 7.65418176196357e-06, "epoch": 0.821543575360964, "percentage": 82.15, "elapsed_time": "2 days, 14:03:26", "remaining_time": "13:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7910, "total_steps": 9627, "loss": 1.5073, "learning_rate": 7.645508069607731e-06, "epoch": 0.8216474498805443, "percentage": 82.16, "elapsed_time": "2 days, 14:03:56", "remaining_time": "13:28:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7911, "total_steps": 9627, "loss": 1.9018, "learning_rate": 7.636838887674908e-06, "epoch": 0.8217513244001247, "percentage": 82.18, "elapsed_time": "2 days, 14:04:28", "remaining_time": "13:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7912, "total_steps": 9627, "loss": 1.6646, "learning_rate": 7.6281742170882854e-06, "epoch": 0.821855198919705, "percentage": 82.19, "elapsed_time": "2 days, 14:04:58", "remaining_time": "13:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7913, "total_steps": 9627, "loss": 1.482, "learning_rate": 7.619514058770622e-06, "epoch": 0.8219590734392853, "percentage": 82.2, "elapsed_time": "2 days, 14:05:29", "remaining_time": "13:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7914, "total_steps": 9627, "loss": 1.7999, "learning_rate": 7.610858413644106e-06, "epoch": 0.8220629479588657, "percentage": 82.21, "elapsed_time": "2 days, 14:06:00", "remaining_time": "13:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7915, "total_steps": 9627, "loss": 1.6357, "learning_rate": 7.60220728263053e-06, "epoch": 0.8221668224784461, "percentage": 82.22, "elapsed_time": "2 days, 14:06:32", "remaining_time": "13:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7916, "total_steps": 9627, "loss": 1.7431, "learning_rate": 7.5935606666511785e-06, "epoch": 0.8222706969980264, "percentage": 82.23, "elapsed_time": "2 days, 14:07:02", "remaining_time": "13:25:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7917, "total_steps": 9627, "loss": 1.8379, "learning_rate": 7.584918566626808e-06, "epoch": 0.8223745715176067, "percentage": 82.24, "elapsed_time": "2 days, 14:07:32", "remaining_time": "13:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7918, "total_steps": 9627, "loss": 1.7044, "learning_rate": 7.576280983477768e-06, "epoch": 0.8224784460371871, "percentage": 82.25, "elapsed_time": "2 days, 14:08:05", "remaining_time": "13:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7919, "total_steps": 9627, "loss": 1.6908, "learning_rate": 7.5676479181238935e-06, "epoch": 0.8225823205567674, "percentage": 82.26, "elapsed_time": "2 days, 14:08:35", "remaining_time": "13:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7920, "total_steps": 9627, "loss": 1.7343, "learning_rate": 7.5590193714845215e-06, "epoch": 0.8226861950763478, "percentage": 82.27, "elapsed_time": "2 days, 14:09:05", "remaining_time": "13:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7921, "total_steps": 9627, "loss": 1.6858, "learning_rate": 7.5503953444785395e-06, "epoch": 0.8227900695959282, "percentage": 82.28, "elapsed_time": "2 days, 14:09:36", "remaining_time": "13:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7922, "total_steps": 9627, "loss": 1.4288, "learning_rate": 7.541775838024335e-06, "epoch": 0.8228939441155084, "percentage": 82.29, "elapsed_time": "2 days, 14:10:07", "remaining_time": "13:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7923, "total_steps": 9627, "loss": 1.6902, "learning_rate": 7.533160853039811e-06, "epoch": 0.8229978186350888, "percentage": 82.3, "elapsed_time": "2 days, 14:10:38", "remaining_time": "13:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7924, "total_steps": 9627, "loss": 1.6764, "learning_rate": 7.5245503904423974e-06, "epoch": 0.8231016931546692, "percentage": 82.31, "elapsed_time": "2 days, 14:11:10", "remaining_time": "13:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7925, "total_steps": 9627, "loss": 1.5257, "learning_rate": 7.515944451149065e-06, "epoch": 0.8232055676742495, "percentage": 82.32, "elapsed_time": "2 days, 14:11:39", "remaining_time": "13:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7926, "total_steps": 9627, "loss": 1.7414, "learning_rate": 7.507343036076236e-06, "epoch": 0.8233094421938298, "percentage": 82.33, "elapsed_time": "2 days, 14:12:12", "remaining_time": "13:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7927, "total_steps": 9627, "loss": 1.6366, "learning_rate": 7.498746146139934e-06, "epoch": 0.8234133167134102, "percentage": 82.34, "elapsed_time": "2 days, 14:12:42", "remaining_time": "13:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7928, "total_steps": 9627, "loss": 1.5959, "learning_rate": 7.490153782255643e-06, "epoch": 0.8235171912329905, "percentage": 82.35, "elapsed_time": "2 days, 14:13:13", "remaining_time": "13:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7929, "total_steps": 9627, "loss": 1.8361, "learning_rate": 7.481565945338381e-06, "epoch": 0.8236210657525709, "percentage": 82.36, "elapsed_time": "2 days, 14:13:45", "remaining_time": "13:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7930, "total_steps": 9627, "loss": 1.592, "learning_rate": 7.472982636302694e-06, "epoch": 0.8237249402721513, "percentage": 82.37, "elapsed_time": "2 days, 14:14:15", "remaining_time": "13:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7931, "total_steps": 9627, "loss": 1.7912, "learning_rate": 7.464403856062629e-06, "epoch": 0.8238288147917315, "percentage": 82.38, "elapsed_time": "2 days, 14:14:47", "remaining_time": "13:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7932, "total_steps": 9627, "loss": 1.7699, "learning_rate": 7.455829605531767e-06, "epoch": 0.8239326893113119, "percentage": 82.39, "elapsed_time": "2 days, 14:15:18", "remaining_time": "13:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7933, "total_steps": 9627, "loss": 1.5568, "learning_rate": 7.4472598856231815e-06, "epoch": 0.8240365638308923, "percentage": 82.4, "elapsed_time": "2 days, 14:15:48", "remaining_time": "13:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7934, "total_steps": 9627, "loss": 1.5514, "learning_rate": 7.438694697249504e-06, "epoch": 0.8241404383504727, "percentage": 82.41, "elapsed_time": "2 days, 14:16:19", "remaining_time": "13:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7935, "total_steps": 9627, "loss": 1.6633, "learning_rate": 7.430134041322856e-06, "epoch": 0.824244312870053, "percentage": 82.42, "elapsed_time": "2 days, 14:16:51", "remaining_time": "13:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7936, "total_steps": 9627, "loss": 1.8486, "learning_rate": 7.421577918754868e-06, "epoch": 0.8243481873896333, "percentage": 82.43, "elapsed_time": "2 days, 14:17:21", "remaining_time": "13:16:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7937, "total_steps": 9627, "loss": 1.6866, "learning_rate": 7.413026330456713e-06, "epoch": 0.8244520619092137, "percentage": 82.45, "elapsed_time": "2 days, 14:17:52", "remaining_time": "13:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7938, "total_steps": 9627, "loss": 1.6298, "learning_rate": 7.404479277339055e-06, "epoch": 0.824555936428794, "percentage": 82.46, "elapsed_time": "2 days, 14:18:23", "remaining_time": "13:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7939, "total_steps": 9627, "loss": 1.6743, "learning_rate": 7.3959367603121055e-06, "epoch": 0.8246598109483744, "percentage": 82.47, "elapsed_time": "2 days, 14:18:53", "remaining_time": "13:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7940, "total_steps": 9627, "loss": 1.5683, "learning_rate": 7.387398780285548e-06, "epoch": 0.8247636854679548, "percentage": 82.48, "elapsed_time": "2 days, 14:19:25", "remaining_time": "13:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7941, "total_steps": 9627, "loss": 1.5644, "learning_rate": 7.378865338168655e-06, "epoch": 0.824867559987535, "percentage": 82.49, "elapsed_time": "2 days, 14:19:56", "remaining_time": "13:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7942, "total_steps": 9627, "loss": 1.8986, "learning_rate": 7.370336434870123e-06, "epoch": 0.8249714345071154, "percentage": 82.5, "elapsed_time": "2 days, 14:20:26", "remaining_time": "13:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7943, "total_steps": 9627, "loss": 1.6532, "learning_rate": 7.361812071298246e-06, "epoch": 0.8250753090266958, "percentage": 82.51, "elapsed_time": "2 days, 14:20:57", "remaining_time": "13:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7944, "total_steps": 9627, "loss": 1.6532, "learning_rate": 7.353292248360805e-06, "epoch": 0.8251791835462761, "percentage": 82.52, "elapsed_time": "2 days, 14:21:29", "remaining_time": "13:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7945, "total_steps": 9627, "loss": 1.7635, "learning_rate": 7.344776966965061e-06, "epoch": 0.8252830580658564, "percentage": 82.53, "elapsed_time": "2 days, 14:21:59", "remaining_time": "13:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7946, "total_steps": 9627, "loss": 1.5736, "learning_rate": 7.336266228017857e-06, "epoch": 0.8253869325854368, "percentage": 82.54, "elapsed_time": "2 days, 14:22:30", "remaining_time": "13:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7947, "total_steps": 9627, "loss": 1.7677, "learning_rate": 7.327760032425507e-06, "epoch": 0.8254908071050171, "percentage": 82.55, "elapsed_time": "2 days, 14:23:02", "remaining_time": "13:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7948, "total_steps": 9627, "loss": 1.541, "learning_rate": 7.319258381093863e-06, "epoch": 0.8255946816245975, "percentage": 82.56, "elapsed_time": "2 days, 14:23:32", "remaining_time": "13:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7949, "total_steps": 9627, "loss": 1.6897, "learning_rate": 7.310761274928274e-06, "epoch": 0.8256985561441779, "percentage": 82.57, "elapsed_time": "2 days, 14:24:02", "remaining_time": "13:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7950, "total_steps": 9627, "loss": 1.6534, "learning_rate": 7.302268714833621e-06, "epoch": 0.8258024306637581, "percentage": 82.58, "elapsed_time": "2 days, 14:24:34", "remaining_time": "13:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7951, "total_steps": 9627, "loss": 1.4829, "learning_rate": 7.2937807017142975e-06, "epoch": 0.8259063051833385, "percentage": 82.59, "elapsed_time": "2 days, 14:25:05", "remaining_time": "13:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7952, "total_steps": 9627, "loss": 1.7697, "learning_rate": 7.285297236474198e-06, "epoch": 0.8260101797029189, "percentage": 82.6, "elapsed_time": "2 days, 14:25:36", "remaining_time": "13:08:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7953, "total_steps": 9627, "loss": 1.4717, "learning_rate": 7.27681832001677e-06, "epoch": 0.8261140542224992, "percentage": 82.61, "elapsed_time": "2 days, 14:26:07", "remaining_time": "13:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7954, "total_steps": 9627, "loss": 1.5658, "learning_rate": 7.268343953244921e-06, "epoch": 0.8262179287420796, "percentage": 82.62, "elapsed_time": "2 days, 14:26:38", "remaining_time": "13:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7955, "total_steps": 9627, "loss": 1.7525, "learning_rate": 7.259874137061135e-06, "epoch": 0.8263218032616599, "percentage": 82.63, "elapsed_time": "2 days, 14:27:08", "remaining_time": "13:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7956, "total_steps": 9627, "loss": 1.6619, "learning_rate": 7.2514088723673605e-06, "epoch": 0.8264256777812402, "percentage": 82.64, "elapsed_time": "2 days, 14:27:39", "remaining_time": "13:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7957, "total_steps": 9627, "loss": 1.7732, "learning_rate": 7.2429481600650936e-06, "epoch": 0.8265295523008206, "percentage": 82.65, "elapsed_time": "2 days, 14:28:10", "remaining_time": "13:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7958, "total_steps": 9627, "loss": 1.762, "learning_rate": 7.234492001055332e-06, "epoch": 0.826633426820401, "percentage": 82.66, "elapsed_time": "2 days, 14:28:41", "remaining_time": "13:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7959, "total_steps": 9627, "loss": 1.5749, "learning_rate": 7.2260403962385706e-06, "epoch": 0.8267373013399814, "percentage": 82.67, "elapsed_time": "2 days, 14:29:13", "remaining_time": "13:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7960, "total_steps": 9627, "loss": 1.7171, "learning_rate": 7.217593346514884e-06, "epoch": 0.8268411758595616, "percentage": 82.68, "elapsed_time": "2 days, 14:29:43", "remaining_time": "13:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7961, "total_steps": 9627, "loss": 1.6369, "learning_rate": 7.209150852783769e-06, "epoch": 0.826945050379142, "percentage": 82.69, "elapsed_time": "2 days, 14:30:14", "remaining_time": "13:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7962, "total_steps": 9627, "loss": 1.6839, "learning_rate": 7.200712915944313e-06, "epoch": 0.8270489248987224, "percentage": 82.7, "elapsed_time": "2 days, 14:30:44", "remaining_time": "13:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7963, "total_steps": 9627, "loss": 1.7524, "learning_rate": 7.192279536895091e-06, "epoch": 0.8271527994183027, "percentage": 82.72, "elapsed_time": "2 days, 14:31:16", "remaining_time": "13:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7964, "total_steps": 9627, "loss": 1.6049, "learning_rate": 7.183850716534179e-06, "epoch": 0.827256673937883, "percentage": 82.73, "elapsed_time": "2 days, 14:31:46", "remaining_time": "13:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7965, "total_steps": 9627, "loss": 1.5222, "learning_rate": 7.175426455759193e-06, "epoch": 0.8273605484574634, "percentage": 82.74, "elapsed_time": "2 days, 14:32:17", "remaining_time": "13:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7966, "total_steps": 9627, "loss": 1.7086, "learning_rate": 7.167006755467237e-06, "epoch": 0.8274644229770437, "percentage": 82.75, "elapsed_time": "2 days, 14:32:47", "remaining_time": "13:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7967, "total_steps": 9627, "loss": 1.7143, "learning_rate": 7.15859161655496e-06, "epoch": 0.8275682974966241, "percentage": 82.76, "elapsed_time": "2 days, 14:33:18", "remaining_time": "13:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7968, "total_steps": 9627, "loss": 1.3494, "learning_rate": 7.150181039918485e-06, "epoch": 0.8276721720162045, "percentage": 82.77, "elapsed_time": "2 days, 14:33:49", "remaining_time": "13:01:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7969, "total_steps": 9627, "loss": 1.5688, "learning_rate": 7.141775026453506e-06, "epoch": 0.8277760465357847, "percentage": 82.78, "elapsed_time": "2 days, 14:34:21", "remaining_time": "13:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7970, "total_steps": 9627, "loss": 1.7456, "learning_rate": 7.133373577055163e-06, "epoch": 0.8278799210553651, "percentage": 82.79, "elapsed_time": "2 days, 14:34:51", "remaining_time": "13:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7971, "total_steps": 9627, "loss": 1.5706, "learning_rate": 7.124976692618168e-06, "epoch": 0.8279837955749455, "percentage": 82.8, "elapsed_time": "2 days, 14:35:23", "remaining_time": "13:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7972, "total_steps": 9627, "loss": 1.6361, "learning_rate": 7.116584374036733e-06, "epoch": 0.8280876700945258, "percentage": 82.81, "elapsed_time": "2 days, 14:35:53", "remaining_time": "12:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7973, "total_steps": 9627, "loss": 1.5935, "learning_rate": 7.108196622204538e-06, "epoch": 0.8281915446141062, "percentage": 82.82, "elapsed_time": "2 days, 14:36:24", "remaining_time": "12:59:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7974, "total_steps": 9627, "loss": 1.4914, "learning_rate": 7.099813438014841e-06, "epoch": 0.8282954191336865, "percentage": 82.83, "elapsed_time": "2 days, 14:36:56", "remaining_time": "12:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7975, "total_steps": 9627, "loss": 1.6914, "learning_rate": 7.091434822360377e-06, "epoch": 0.8283992936532668, "percentage": 82.84, "elapsed_time": "2 days, 14:37:26", "remaining_time": "12:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7976, "total_steps": 9627, "loss": 1.7179, "learning_rate": 7.083060776133404e-06, "epoch": 0.8285031681728472, "percentage": 82.85, "elapsed_time": "2 days, 14:37:57", "remaining_time": "12:57:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7977, "total_steps": 9627, "loss": 1.7011, "learning_rate": 7.0746913002257e-06, "epoch": 0.8286070426924276, "percentage": 82.86, "elapsed_time": "2 days, 14:38:27", "remaining_time": "12:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7978, "total_steps": 9627, "loss": 1.6866, "learning_rate": 7.066326395528539e-06, "epoch": 0.8287109172120078, "percentage": 82.87, "elapsed_time": "2 days, 14:38:58", "remaining_time": "12:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7979, "total_steps": 9627, "loss": 1.6695, "learning_rate": 7.05796606293272e-06, "epoch": 0.8288147917315882, "percentage": 82.88, "elapsed_time": "2 days, 14:39:29", "remaining_time": "12:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7980, "total_steps": 9627, "loss": 1.7386, "learning_rate": 7.049610303328541e-06, "epoch": 0.8289186662511686, "percentage": 82.89, "elapsed_time": "2 days, 14:40:00", "remaining_time": "12:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7981, "total_steps": 9627, "loss": 1.6829, "learning_rate": 7.04125911760587e-06, "epoch": 0.8290225407707489, "percentage": 82.9, "elapsed_time": "2 days, 14:40:30", "remaining_time": "12:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7982, "total_steps": 9627, "loss": 1.5823, "learning_rate": 7.032912506653983e-06, "epoch": 0.8291264152903293, "percentage": 82.91, "elapsed_time": "2 days, 14:41:01", "remaining_time": "12:55:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7983, "total_steps": 9627, "loss": 1.5883, "learning_rate": 7.024570471361769e-06, "epoch": 0.8292302898099096, "percentage": 82.92, "elapsed_time": "2 days, 14:41:32", "remaining_time": "12:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7984, "total_steps": 9627, "loss": 1.4265, "learning_rate": 7.016233012617579e-06, "epoch": 0.82933416432949, "percentage": 82.93, "elapsed_time": "2 days, 14:42:04", "remaining_time": "12:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7985, "total_steps": 9627, "loss": 1.7404, "learning_rate": 7.0079001313092865e-06, "epoch": 0.8294380388490703, "percentage": 82.94, "elapsed_time": "2 days, 14:42:33", "remaining_time": "12:53:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7986, "total_steps": 9627, "loss": 1.6176, "learning_rate": 6.99957182832428e-06, "epoch": 0.8295419133686507, "percentage": 82.95, "elapsed_time": "2 days, 14:43:05", "remaining_time": "12:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7987, "total_steps": 9627, "loss": 1.6707, "learning_rate": 6.9912481045494475e-06, "epoch": 0.8296457878882311, "percentage": 82.96, "elapsed_time": "2 days, 14:43:36", "remaining_time": "12:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7988, "total_steps": 9627, "loss": 1.6712, "learning_rate": 6.9829289608712264e-06, "epoch": 0.8297496624078113, "percentage": 82.97, "elapsed_time": "2 days, 14:44:06", "remaining_time": "12:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7989, "total_steps": 9627, "loss": 1.6211, "learning_rate": 6.974614398175511e-06, "epoch": 0.8298535369273917, "percentage": 82.99, "elapsed_time": "2 days, 14:44:37", "remaining_time": "12:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7990, "total_steps": 9627, "loss": 1.6593, "learning_rate": 6.966304417347758e-06, "epoch": 0.8299574114469721, "percentage": 83.0, "elapsed_time": "2 days, 14:45:07", "remaining_time": "12:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7991, "total_steps": 9627, "loss": 1.6225, "learning_rate": 6.95799901927291e-06, "epoch": 0.8300612859665524, "percentage": 83.01, "elapsed_time": "2 days, 14:45:39", "remaining_time": "12:50:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7992, "total_steps": 9627, "loss": 1.5756, "learning_rate": 6.949698204835426e-06, "epoch": 0.8301651604861328, "percentage": 83.02, "elapsed_time": "2 days, 14:46:10", "remaining_time": "12:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7993, "total_steps": 9627, "loss": 1.6939, "learning_rate": 6.941401974919276e-06, "epoch": 0.8302690350057131, "percentage": 83.03, "elapsed_time": "2 days, 14:46:40", "remaining_time": "12:50:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7994, "total_steps": 9627, "loss": 1.7476, "learning_rate": 6.9331103304079494e-06, "epoch": 0.8303729095252934, "percentage": 83.04, "elapsed_time": "2 days, 14:47:10", "remaining_time": "12:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7995, "total_steps": 9627, "loss": 1.449, "learning_rate": 6.924823272184439e-06, "epoch": 0.8304767840448738, "percentage": 83.05, "elapsed_time": "2 days, 14:47:42", "remaining_time": "12:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7996, "total_steps": 9627, "loss": 1.6482, "learning_rate": 6.916540801131232e-06, "epoch": 0.8305806585644542, "percentage": 83.06, "elapsed_time": "2 days, 14:48:12", "remaining_time": "12:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7997, "total_steps": 9627, "loss": 1.5417, "learning_rate": 6.908262918130392e-06, "epoch": 0.8306845330840344, "percentage": 83.07, "elapsed_time": "2 days, 14:48:43", "remaining_time": "12:48:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7998, "total_steps": 9627, "loss": 1.5201, "learning_rate": 6.899989624063402e-06, "epoch": 0.8307884076036148, "percentage": 83.08, "elapsed_time": "2 days, 14:49:13", "remaining_time": "12:47:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7999, "total_steps": 9627, "loss": 1.7178, "learning_rate": 6.8917209198113345e-06, "epoch": 0.8308922821231952, "percentage": 83.09, "elapsed_time": "2 days, 14:49:43", "remaining_time": "12:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8000, "total_steps": 9627, "loss": 1.5518, "learning_rate": 6.883456806254746e-06, "epoch": 0.8309961566427755, "percentage": 83.1, "elapsed_time": "2 days, 14:50:16", "remaining_time": "12:46:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8001, "total_steps": 9627, "loss": 1.6246, "learning_rate": 6.87519728427366e-06, "epoch": 0.8311000311623559, "percentage": 83.11, "elapsed_time": "2 days, 14:50:46", "remaining_time": "12:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8002, "total_steps": 9627, "loss": 1.7103, "learning_rate": 6.866942354747685e-06, "epoch": 0.8312039056819363, "percentage": 83.12, "elapsed_time": "2 days, 14:51:19", "remaining_time": "12:45:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8003, "total_steps": 9627, "loss": 1.5555, "learning_rate": 6.8586920185559015e-06, "epoch": 0.8313077802015165, "percentage": 83.13, "elapsed_time": "2 days, 14:51:49", "remaining_time": "12:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8004, "total_steps": 9627, "loss": 1.5676, "learning_rate": 6.850446276576905e-06, "epoch": 0.8314116547210969, "percentage": 83.14, "elapsed_time": "2 days, 14:52:20", "remaining_time": "12:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8005, "total_steps": 9627, "loss": 1.5645, "learning_rate": 6.8422051296888e-06, "epoch": 0.8315155292406773, "percentage": 83.15, "elapsed_time": "2 days, 14:52:51", "remaining_time": "12:44:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8006, "total_steps": 9627, "loss": 1.4893, "learning_rate": 6.833968578769201e-06, "epoch": 0.8316194037602576, "percentage": 83.16, "elapsed_time": "2 days, 14:53:21", "remaining_time": "12:44:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8007, "total_steps": 9627, "loss": 1.5007, "learning_rate": 6.825736624695245e-06, "epoch": 0.8317232782798379, "percentage": 83.17, "elapsed_time": "2 days, 14:53:52", "remaining_time": "12:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8008, "total_steps": 9627, "loss": 1.3456, "learning_rate": 6.817509268343553e-06, "epoch": 0.8318271527994183, "percentage": 83.18, "elapsed_time": "2 days, 14:54:23", "remaining_time": "12:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8009, "total_steps": 9627, "loss": 1.5847, "learning_rate": 6.809286510590307e-06, "epoch": 0.8319310273189986, "percentage": 83.19, "elapsed_time": "2 days, 14:54:53", "remaining_time": "12:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8010, "total_steps": 9627, "loss": 1.7015, "learning_rate": 6.80106835231113e-06, "epoch": 0.832034901838579, "percentage": 83.2, "elapsed_time": "2 days, 14:55:25", "remaining_time": "12:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8011, "total_steps": 9627, "loss": 1.6057, "learning_rate": 6.792854794381215e-06, "epoch": 0.8321387763581594, "percentage": 83.21, "elapsed_time": "2 days, 14:55:55", "remaining_time": "12:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8012, "total_steps": 9627, "loss": 1.6555, "learning_rate": 6.784645837675241e-06, "epoch": 0.8322426508777397, "percentage": 83.22, "elapsed_time": "2 days, 14:56:26", "remaining_time": "12:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8013, "total_steps": 9627, "loss": 1.6785, "learning_rate": 6.776441483067386e-06, "epoch": 0.83234652539732, "percentage": 83.23, "elapsed_time": "2 days, 14:56:57", "remaining_time": "12:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8014, "total_steps": 9627, "loss": 1.6525, "learning_rate": 6.768241731431363e-06, "epoch": 0.8324503999169004, "percentage": 83.25, "elapsed_time": "2 days, 14:57:27", "remaining_time": "12:40:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8015, "total_steps": 9627, "loss": 1.6921, "learning_rate": 6.760046583640362e-06, "epoch": 0.8325542744364808, "percentage": 83.26, "elapsed_time": "2 days, 14:57:59", "remaining_time": "12:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8016, "total_steps": 9627, "loss": 1.7602, "learning_rate": 6.751856040567134e-06, "epoch": 0.832658148956061, "percentage": 83.27, "elapsed_time": "2 days, 14:58:31", "remaining_time": "12:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8017, "total_steps": 9627, "loss": 1.9422, "learning_rate": 6.7436701030838715e-06, "epoch": 0.8327620234756414, "percentage": 83.28, "elapsed_time": "2 days, 14:59:00", "remaining_time": "12:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8018, "total_steps": 9627, "loss": 1.7875, "learning_rate": 6.735488772062337e-06, "epoch": 0.8328658979952218, "percentage": 83.29, "elapsed_time": "2 days, 14:59:31", "remaining_time": "12:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8019, "total_steps": 9627, "loss": 1.5723, "learning_rate": 6.727312048373774e-06, "epoch": 0.8329697725148021, "percentage": 83.3, "elapsed_time": "2 days, 15:00:02", "remaining_time": "12:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8020, "total_steps": 9627, "loss": 1.536, "learning_rate": 6.71913993288894e-06, "epoch": 0.8330736470343825, "percentage": 83.31, "elapsed_time": "2 days, 15:00:32", "remaining_time": "12:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8021, "total_steps": 9627, "loss": 1.5312, "learning_rate": 6.710972426478096e-06, "epoch": 0.8331775215539629, "percentage": 83.32, "elapsed_time": "2 days, 15:01:03", "remaining_time": "12:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8022, "total_steps": 9627, "loss": 1.6728, "learning_rate": 6.7028095300110225e-06, "epoch": 0.8332813960735431, "percentage": 83.33, "elapsed_time": "2 days, 15:01:34", "remaining_time": "12:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8023, "total_steps": 9627, "loss": 1.4944, "learning_rate": 6.6946512443570085e-06, "epoch": 0.8333852705931235, "percentage": 83.34, "elapsed_time": "2 days, 15:02:04", "remaining_time": "12:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8024, "total_steps": 9627, "loss": 1.5726, "learning_rate": 6.686497570384825e-06, "epoch": 0.8334891451127039, "percentage": 83.35, "elapsed_time": "2 days, 15:02:35", "remaining_time": "12:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8025, "total_steps": 9627, "loss": 1.6453, "learning_rate": 6.678348508962812e-06, "epoch": 0.8335930196322842, "percentage": 83.36, "elapsed_time": "2 days, 15:03:06", "remaining_time": "12:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8026, "total_steps": 9627, "loss": 1.6386, "learning_rate": 6.670204060958746e-06, "epoch": 0.8336968941518645, "percentage": 83.37, "elapsed_time": "2 days, 15:03:36", "remaining_time": "12:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8027, "total_steps": 9627, "loss": 1.6229, "learning_rate": 6.662064227239967e-06, "epoch": 0.8338007686714449, "percentage": 83.38, "elapsed_time": "2 days, 15:04:07", "remaining_time": "12:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8028, "total_steps": 9627, "loss": 1.7046, "learning_rate": 6.653929008673315e-06, "epoch": 0.8339046431910252, "percentage": 83.39, "elapsed_time": "2 days, 15:04:39", "remaining_time": "12:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8029, "total_steps": 9627, "loss": 1.6751, "learning_rate": 6.645798406125087e-06, "epoch": 0.8340085177106056, "percentage": 83.4, "elapsed_time": "2 days, 15:05:09", "remaining_time": "12:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8030, "total_steps": 9627, "loss": 1.4603, "learning_rate": 6.637672420461161e-06, "epoch": 0.834112392230186, "percentage": 83.41, "elapsed_time": "2 days, 15:05:39", "remaining_time": "12:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8031, "total_steps": 9627, "loss": 1.4504, "learning_rate": 6.629551052546884e-06, "epoch": 0.8342162667497662, "percentage": 83.42, "elapsed_time": "2 days, 15:06:11", "remaining_time": "12:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8032, "total_steps": 9627, "loss": 1.6946, "learning_rate": 6.6214343032471204e-06, "epoch": 0.8343201412693466, "percentage": 83.43, "elapsed_time": "2 days, 15:06:41", "remaining_time": "12:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8033, "total_steps": 9627, "loss": 1.7209, "learning_rate": 6.613322173426239e-06, "epoch": 0.834424015788927, "percentage": 83.44, "elapsed_time": "2 days, 15:07:11", "remaining_time": "12:31:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8034, "total_steps": 9627, "loss": 1.8021, "learning_rate": 6.605214663948111e-06, "epoch": 0.8345278903085073, "percentage": 83.45, "elapsed_time": "2 days, 15:07:41", "remaining_time": "12:31:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8035, "total_steps": 9627, "loss": 1.6669, "learning_rate": 6.597111775676135e-06, "epoch": 0.8346317648280877, "percentage": 83.46, "elapsed_time": "2 days, 15:08:13", "remaining_time": "12:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8036, "total_steps": 9627, "loss": 1.5882, "learning_rate": 6.589013509473185e-06, "epoch": 0.834735639347668, "percentage": 83.47, "elapsed_time": "2 days, 15:08:44", "remaining_time": "12:30:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8037, "total_steps": 9627, "loss": 1.4626, "learning_rate": 6.58091986620169e-06, "epoch": 0.8348395138672484, "percentage": 83.48, "elapsed_time": "2 days, 15:09:14", "remaining_time": "12:29:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8038, "total_steps": 9627, "loss": 1.676, "learning_rate": 6.5728308467235435e-06, "epoch": 0.8349433883868287, "percentage": 83.49, "elapsed_time": "2 days, 15:09:45", "remaining_time": "12:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8039, "total_steps": 9627, "loss": 1.3398, "learning_rate": 6.5647464519001725e-06, "epoch": 0.8350472629064091, "percentage": 83.5, "elapsed_time": "2 days, 15:10:16", "remaining_time": "12:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8040, "total_steps": 9627, "loss": 1.5381, "learning_rate": 6.556666682592494e-06, "epoch": 0.8351511374259895, "percentage": 83.52, "elapsed_time": "2 days, 15:10:47", "remaining_time": "12:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8041, "total_steps": 9627, "loss": 1.6253, "learning_rate": 6.548591539660942e-06, "epoch": 0.8352550119455697, "percentage": 83.53, "elapsed_time": "2 days, 15:11:18", "remaining_time": "12:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8042, "total_steps": 9627, "loss": 1.7125, "learning_rate": 6.540521023965457e-06, "epoch": 0.8353588864651501, "percentage": 83.54, "elapsed_time": "2 days, 15:11:49", "remaining_time": "12:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8043, "total_steps": 9627, "loss": 1.645, "learning_rate": 6.532455136365478e-06, "epoch": 0.8354627609847305, "percentage": 83.55, "elapsed_time": "2 days, 15:12:20", "remaining_time": "12:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8044, "total_steps": 9627, "loss": 1.6461, "learning_rate": 6.524393877719987e-06, "epoch": 0.8355666355043108, "percentage": 83.56, "elapsed_time": "2 days, 15:12:50", "remaining_time": "12:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8045, "total_steps": 9627, "loss": 1.8415, "learning_rate": 6.516337248887399e-06, "epoch": 0.8356705100238911, "percentage": 83.57, "elapsed_time": "2 days, 15:13:21", "remaining_time": "12:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8046, "total_steps": 9627, "loss": 1.4099, "learning_rate": 6.5082852507257265e-06, "epoch": 0.8357743845434715, "percentage": 83.58, "elapsed_time": "2 days, 15:13:52", "remaining_time": "12:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8047, "total_steps": 9627, "loss": 1.6968, "learning_rate": 6.500237884092425e-06, "epoch": 0.8358782590630518, "percentage": 83.59, "elapsed_time": "2 days, 15:14:23", "remaining_time": "12:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8048, "total_steps": 9627, "loss": 1.66, "learning_rate": 6.492195149844471e-06, "epoch": 0.8359821335826322, "percentage": 83.6, "elapsed_time": "2 days, 15:14:53", "remaining_time": "12:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8049, "total_steps": 9627, "loss": 1.657, "learning_rate": 6.484157048838368e-06, "epoch": 0.8360860081022126, "percentage": 83.61, "elapsed_time": "2 days, 15:15:23", "remaining_time": "12:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8050, "total_steps": 9627, "loss": 1.7264, "learning_rate": 6.476123581930099e-06, "epoch": 0.8361898826217928, "percentage": 83.62, "elapsed_time": "2 days, 15:15:55", "remaining_time": "12:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8051, "total_steps": 9627, "loss": 1.798, "learning_rate": 6.468094749975167e-06, "epoch": 0.8362937571413732, "percentage": 83.63, "elapsed_time": "2 days, 15:16:25", "remaining_time": "12:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8052, "total_steps": 9627, "loss": 1.5829, "learning_rate": 6.460070553828573e-06, "epoch": 0.8363976316609536, "percentage": 83.64, "elapsed_time": "2 days, 15:16:56", "remaining_time": "12:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8053, "total_steps": 9627, "loss": 1.5542, "learning_rate": 6.4520509943448656e-06, "epoch": 0.8365015061805339, "percentage": 83.65, "elapsed_time": "2 days, 15:17:26", "remaining_time": "12:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8054, "total_steps": 9627, "loss": 1.5923, "learning_rate": 6.444036072378018e-06, "epoch": 0.8366053807001143, "percentage": 83.66, "elapsed_time": "2 days, 15:17:58", "remaining_time": "12:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8055, "total_steps": 9627, "loss": 1.6131, "learning_rate": 6.436025788781586e-06, "epoch": 0.8367092552196946, "percentage": 83.67, "elapsed_time": "2 days, 15:18:28", "remaining_time": "12:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8056, "total_steps": 9627, "loss": 1.5907, "learning_rate": 6.428020144408608e-06, "epoch": 0.8368131297392749, "percentage": 83.68, "elapsed_time": "2 days, 15:18:59", "remaining_time": "12:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8057, "total_steps": 9627, "loss": 1.6621, "learning_rate": 6.420019140111588e-06, "epoch": 0.8369170042588553, "percentage": 83.69, "elapsed_time": "2 days, 15:19:29", "remaining_time": "12:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8058, "total_steps": 9627, "loss": 1.5021, "learning_rate": 6.412022776742604e-06, "epoch": 0.8370208787784357, "percentage": 83.7, "elapsed_time": "2 days, 15:20:00", "remaining_time": "12:19:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8059, "total_steps": 9627, "loss": 1.6401, "learning_rate": 6.404031055153198e-06, "epoch": 0.8371247532980159, "percentage": 83.71, "elapsed_time": "2 days, 15:20:31", "remaining_time": "12:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8060, "total_steps": 9627, "loss": 1.4499, "learning_rate": 6.396043976194416e-06, "epoch": 0.8372286278175963, "percentage": 83.72, "elapsed_time": "2 days, 15:21:02", "remaining_time": "12:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8061, "total_steps": 9627, "loss": 1.6367, "learning_rate": 6.3880615407168335e-06, "epoch": 0.8373325023371767, "percentage": 83.73, "elapsed_time": "2 days, 15:21:31", "remaining_time": "12:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8062, "total_steps": 9627, "loss": 1.5884, "learning_rate": 6.380083749570498e-06, "epoch": 0.8374363768567571, "percentage": 83.74, "elapsed_time": "2 days, 15:22:03", "remaining_time": "12:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8063, "total_steps": 9627, "loss": 1.4089, "learning_rate": 6.372110603605014e-06, "epoch": 0.8375402513763374, "percentage": 83.75, "elapsed_time": "2 days, 15:22:33", "remaining_time": "12:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8064, "total_steps": 9627, "loss": 1.6824, "learning_rate": 6.364142103669418e-06, "epoch": 0.8376441258959177, "percentage": 83.76, "elapsed_time": "2 days, 15:23:04", "remaining_time": "12:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8065, "total_steps": 9627, "loss": 1.7319, "learning_rate": 6.356178250612327e-06, "epoch": 0.8377480004154981, "percentage": 83.77, "elapsed_time": "2 days, 15:23:36", "remaining_time": "12:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8066, "total_steps": 9627, "loss": 1.6687, "learning_rate": 6.348219045281822e-06, "epoch": 0.8378518749350784, "percentage": 83.79, "elapsed_time": "2 days, 15:24:06", "remaining_time": "12:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8067, "total_steps": 9627, "loss": 1.6577, "learning_rate": 6.340264488525488e-06, "epoch": 0.8379557494546588, "percentage": 83.8, "elapsed_time": "2 days, 15:24:37", "remaining_time": "12:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8068, "total_steps": 9627, "loss": 1.7371, "learning_rate": 6.332314581190424e-06, "epoch": 0.8380596239742392, "percentage": 83.81, "elapsed_time": "2 days, 15:25:07", "remaining_time": "12:15:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8069, "total_steps": 9627, "loss": 1.8348, "learning_rate": 6.324369324123242e-06, "epoch": 0.8381634984938194, "percentage": 83.82, "elapsed_time": "2 days, 15:25:38", "remaining_time": "12:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8070, "total_steps": 9627, "loss": 1.7954, "learning_rate": 6.316428718170036e-06, "epoch": 0.8382673730133998, "percentage": 83.83, "elapsed_time": "2 days, 15:26:08", "remaining_time": "12:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8071, "total_steps": 9627, "loss": 1.4829, "learning_rate": 6.308492764176421e-06, "epoch": 0.8383712475329802, "percentage": 83.84, "elapsed_time": "2 days, 15:26:39", "remaining_time": "12:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8072, "total_steps": 9627, "loss": 1.469, "learning_rate": 6.300561462987542e-06, "epoch": 0.8384751220525605, "percentage": 83.85, "elapsed_time": "2 days, 15:27:10", "remaining_time": "12:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8073, "total_steps": 9627, "loss": 1.5294, "learning_rate": 6.292634815447978e-06, "epoch": 0.8385789965721409, "percentage": 83.86, "elapsed_time": "2 days, 15:27:41", "remaining_time": "12:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8074, "total_steps": 9627, "loss": 1.5216, "learning_rate": 6.2847128224018835e-06, "epoch": 0.8386828710917212, "percentage": 83.87, "elapsed_time": "2 days, 15:28:10", "remaining_time": "12:12:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8075, "total_steps": 9627, "loss": 1.7961, "learning_rate": 6.276795484692882e-06, "epoch": 0.8387867456113015, "percentage": 83.88, "elapsed_time": "2 days, 15:28:43", "remaining_time": "12:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8076, "total_steps": 9627, "loss": 1.6753, "learning_rate": 6.268882803164106e-06, "epoch": 0.8388906201308819, "percentage": 83.89, "elapsed_time": "2 days, 15:29:13", "remaining_time": "12:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8077, "total_steps": 9627, "loss": 1.4427, "learning_rate": 6.260974778658202e-06, "epoch": 0.8389944946504623, "percentage": 83.9, "elapsed_time": "2 days, 15:29:43", "remaining_time": "12:11:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8078, "total_steps": 9627, "loss": 1.7915, "learning_rate": 6.253071412017298e-06, "epoch": 0.8390983691700425, "percentage": 83.91, "elapsed_time": "2 days, 15:30:14", "remaining_time": "12:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8079, "total_steps": 9627, "loss": 1.8103, "learning_rate": 6.2451727040830525e-06, "epoch": 0.8392022436896229, "percentage": 83.92, "elapsed_time": "2 days, 15:30:44", "remaining_time": "12:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8080, "total_steps": 9627, "loss": 1.4995, "learning_rate": 6.237278655696605e-06, "epoch": 0.8393061182092033, "percentage": 83.93, "elapsed_time": "2 days, 15:31:16", "remaining_time": "12:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8081, "total_steps": 9627, "loss": 1.737, "learning_rate": 6.229389267698638e-06, "epoch": 0.8394099927287836, "percentage": 83.94, "elapsed_time": "2 days, 15:31:45", "remaining_time": "12:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8082, "total_steps": 9627, "loss": 1.5779, "learning_rate": 6.2215045409292794e-06, "epoch": 0.839513867248364, "percentage": 83.95, "elapsed_time": "2 days, 15:32:17", "remaining_time": "12:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8083, "total_steps": 9627, "loss": 1.6885, "learning_rate": 6.213624476228191e-06, "epoch": 0.8396177417679443, "percentage": 83.96, "elapsed_time": "2 days, 15:32:47", "remaining_time": "12:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8084, "total_steps": 9627, "loss": 1.5655, "learning_rate": 6.205749074434569e-06, "epoch": 0.8397216162875246, "percentage": 83.97, "elapsed_time": "2 days, 15:33:17", "remaining_time": "12:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8085, "total_steps": 9627, "loss": 1.5628, "learning_rate": 6.197878336387042e-06, "epoch": 0.839825490807105, "percentage": 83.98, "elapsed_time": "2 days, 15:33:47", "remaining_time": "12:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8086, "total_steps": 9627, "loss": 1.5581, "learning_rate": 6.190012262923811e-06, "epoch": 0.8399293653266854, "percentage": 83.99, "elapsed_time": "2 days, 15:34:20", "remaining_time": "12:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8087, "total_steps": 9627, "loss": 1.8488, "learning_rate": 6.182150854882546e-06, "epoch": 0.8400332398462657, "percentage": 84.0, "elapsed_time": "2 days, 15:34:49", "remaining_time": "12:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8088, "total_steps": 9627, "loss": 1.5469, "learning_rate": 6.1742941131004205e-06, "epoch": 0.840137114365846, "percentage": 84.01, "elapsed_time": "2 days, 15:35:21", "remaining_time": "12:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8089, "total_steps": 9627, "loss": 1.756, "learning_rate": 6.166442038414122e-06, "epoch": 0.8402409888854264, "percentage": 84.02, "elapsed_time": "2 days, 15:35:50", "remaining_time": "12:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8090, "total_steps": 9627, "loss": 1.5767, "learning_rate": 6.1585946316598195e-06, "epoch": 0.8403448634050068, "percentage": 84.03, "elapsed_time": "2 days, 15:36:21", "remaining_time": "12:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8091, "total_steps": 9627, "loss": 1.3907, "learning_rate": 6.150751893673229e-06, "epoch": 0.8404487379245871, "percentage": 84.04, "elapsed_time": "2 days, 15:36:53", "remaining_time": "12:04:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8092, "total_steps": 9627, "loss": 1.8505, "learning_rate": 6.142913825289509e-06, "epoch": 0.8405526124441675, "percentage": 84.06, "elapsed_time": "2 days, 15:37:23", "remaining_time": "12:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8093, "total_steps": 9627, "loss": 1.5951, "learning_rate": 6.135080427343376e-06, "epoch": 0.8406564869637478, "percentage": 84.07, "elapsed_time": "2 days, 15:37:53", "remaining_time": "12:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8094, "total_steps": 9627, "loss": 1.7048, "learning_rate": 6.1272517006690174e-06, "epoch": 0.8407603614833281, "percentage": 84.08, "elapsed_time": "2 days, 15:38:24", "remaining_time": "12:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8095, "total_steps": 9627, "loss": 1.6959, "learning_rate": 6.1194276461001345e-06, "epoch": 0.8408642360029085, "percentage": 84.09, "elapsed_time": "2 days, 15:38:55", "remaining_time": "12:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8096, "total_steps": 9627, "loss": 1.6371, "learning_rate": 6.111608264469926e-06, "epoch": 0.8409681105224889, "percentage": 84.1, "elapsed_time": "2 days, 15:39:24", "remaining_time": "12:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8097, "total_steps": 9627, "loss": 1.6457, "learning_rate": 6.103793556611093e-06, "epoch": 0.8410719850420691, "percentage": 84.11, "elapsed_time": "2 days, 15:39:56", "remaining_time": "12:01:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8098, "total_steps": 9627, "loss": 1.5726, "learning_rate": 6.095983523355841e-06, "epoch": 0.8411758595616495, "percentage": 84.12, "elapsed_time": "2 days, 15:40:26", "remaining_time": "12:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8099, "total_steps": 9627, "loss": 1.6642, "learning_rate": 6.088178165535874e-06, "epoch": 0.8412797340812299, "percentage": 84.13, "elapsed_time": "2 days, 15:40:56", "remaining_time": "12:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8100, "total_steps": 9627, "loss": 1.6482, "learning_rate": 6.080377483982424e-06, "epoch": 0.8413836086008102, "percentage": 84.14, "elapsed_time": "2 days, 15:41:27", "remaining_time": "12:00:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8101, "total_steps": 9627, "loss": 1.5789, "learning_rate": 6.072581479526168e-06, "epoch": 0.8414874831203906, "percentage": 84.15, "elapsed_time": "2 days, 15:41:58", "remaining_time": "11:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8102, "total_steps": 9627, "loss": 1.7686, "learning_rate": 6.064790152997346e-06, "epoch": 0.841591357639971, "percentage": 84.16, "elapsed_time": "2 days, 15:42:28", "remaining_time": "11:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8103, "total_steps": 9627, "loss": 1.4962, "learning_rate": 6.0570035052256615e-06, "epoch": 0.8416952321595512, "percentage": 84.17, "elapsed_time": "2 days, 15:42:59", "remaining_time": "11:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8104, "total_steps": 9627, "loss": 1.5899, "learning_rate": 6.049221537040339e-06, "epoch": 0.8417991066791316, "percentage": 84.18, "elapsed_time": "2 days, 15:43:29", "remaining_time": "11:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8105, "total_steps": 9627, "loss": 1.7044, "learning_rate": 6.041444249270089e-06, "epoch": 0.841902981198712, "percentage": 84.19, "elapsed_time": "2 days, 15:43:59", "remaining_time": "11:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8106, "total_steps": 9627, "loss": 1.6839, "learning_rate": 6.033671642743144e-06, "epoch": 0.8420068557182923, "percentage": 84.2, "elapsed_time": "2 days, 15:44:29", "remaining_time": "11:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8107, "total_steps": 9627, "loss": 1.6526, "learning_rate": 6.025903718287212e-06, "epoch": 0.8421107302378726, "percentage": 84.21, "elapsed_time": "2 days, 15:45:00", "remaining_time": "11:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8108, "total_steps": 9627, "loss": 1.6792, "learning_rate": 6.018140476729517e-06, "epoch": 0.842214604757453, "percentage": 84.22, "elapsed_time": "2 days, 15:45:30", "remaining_time": "11:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8109, "total_steps": 9627, "loss": 1.7154, "learning_rate": 6.010381918896807e-06, "epoch": 0.8423184792770333, "percentage": 84.23, "elapsed_time": "2 days, 15:46:02", "remaining_time": "11:56:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8110, "total_steps": 9627, "loss": 1.6739, "learning_rate": 6.002628045615283e-06, "epoch": 0.8424223537966137, "percentage": 84.24, "elapsed_time": "2 days, 15:46:31", "remaining_time": "11:55:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8111, "total_steps": 9627, "loss": 1.7719, "learning_rate": 5.994878857710667e-06, "epoch": 0.8425262283161941, "percentage": 84.25, "elapsed_time": "2 days, 15:47:02", "remaining_time": "11:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8112, "total_steps": 9627, "loss": 1.6761, "learning_rate": 5.9871343560082225e-06, "epoch": 0.8426301028357743, "percentage": 84.26, "elapsed_time": "2 days, 15:47:32", "remaining_time": "11:54:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8113, "total_steps": 9627, "loss": 1.4098, "learning_rate": 5.9793945413326335e-06, "epoch": 0.8427339773553547, "percentage": 84.27, "elapsed_time": "2 days, 15:48:03", "remaining_time": "11:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8114, "total_steps": 9627, "loss": 1.6621, "learning_rate": 5.9716594145081625e-06, "epoch": 0.8428378518749351, "percentage": 84.28, "elapsed_time": "2 days, 15:48:33", "remaining_time": "11:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8115, "total_steps": 9627, "loss": 1.7382, "learning_rate": 5.963928976358518e-06, "epoch": 0.8429417263945155, "percentage": 84.29, "elapsed_time": "2 days, 15:49:03", "remaining_time": "11:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8116, "total_steps": 9627, "loss": 1.7194, "learning_rate": 5.956203227706963e-06, "epoch": 0.8430456009140957, "percentage": 84.3, "elapsed_time": "2 days, 15:49:35", "remaining_time": "11:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8117, "total_steps": 9627, "loss": 1.7364, "learning_rate": 5.948482169376202e-06, "epoch": 0.8431494754336761, "percentage": 84.31, "elapsed_time": "2 days, 15:50:05", "remaining_time": "11:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8118, "total_steps": 9627, "loss": 1.4118, "learning_rate": 5.940765802188458e-06, "epoch": 0.8432533499532565, "percentage": 84.33, "elapsed_time": "2 days, 15:50:35", "remaining_time": "11:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8119, "total_steps": 9627, "loss": 1.3972, "learning_rate": 5.933054126965509e-06, "epoch": 0.8433572244728368, "percentage": 84.34, "elapsed_time": "2 days, 15:51:07", "remaining_time": "11:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8120, "total_steps": 9627, "loss": 1.8372, "learning_rate": 5.925347144528537e-06, "epoch": 0.8434610989924172, "percentage": 84.35, "elapsed_time": "2 days, 15:51:36", "remaining_time": "11:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8121, "total_steps": 9627, "loss": 1.7691, "learning_rate": 5.917644855698306e-06, "epoch": 0.8435649735119976, "percentage": 84.36, "elapsed_time": "2 days, 15:52:06", "remaining_time": "11:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8122, "total_steps": 9627, "loss": 1.6897, "learning_rate": 5.9099472612950455e-06, "epoch": 0.8436688480315778, "percentage": 84.37, "elapsed_time": "2 days, 15:52:37", "remaining_time": "11:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8123, "total_steps": 9627, "loss": 1.7894, "learning_rate": 5.902254362138487e-06, "epoch": 0.8437727225511582, "percentage": 84.38, "elapsed_time": "2 days, 15:53:06", "remaining_time": "11:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8124, "total_steps": 9627, "loss": 1.5154, "learning_rate": 5.894566159047865e-06, "epoch": 0.8438765970707386, "percentage": 84.39, "elapsed_time": "2 days, 15:53:38", "remaining_time": "11:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8125, "total_steps": 9627, "loss": 1.613, "learning_rate": 5.886882652841907e-06, "epoch": 0.8439804715903189, "percentage": 84.4, "elapsed_time": "2 days, 15:54:08", "remaining_time": "11:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8126, "total_steps": 9627, "loss": 1.6085, "learning_rate": 5.879203844338848e-06, "epoch": 0.8440843461098992, "percentage": 84.41, "elapsed_time": "2 days, 15:54:38", "remaining_time": "11:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8127, "total_steps": 9627, "loss": 1.6069, "learning_rate": 5.871529734356423e-06, "epoch": 0.8441882206294796, "percentage": 84.42, "elapsed_time": "2 days, 15:55:09", "remaining_time": "11:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8128, "total_steps": 9627, "loss": 1.539, "learning_rate": 5.863860323711879e-06, "epoch": 0.8442920951490599, "percentage": 84.43, "elapsed_time": "2 days, 15:55:39", "remaining_time": "11:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8129, "total_steps": 9627, "loss": 1.3045, "learning_rate": 5.856195613221921e-06, "epoch": 0.8443959696686403, "percentage": 84.44, "elapsed_time": "2 days, 15:56:08", "remaining_time": "11:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8130, "total_steps": 9627, "loss": 1.5672, "learning_rate": 5.848535603702798e-06, "epoch": 0.8444998441882207, "percentage": 84.45, "elapsed_time": "2 days, 15:56:38", "remaining_time": "11:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8131, "total_steps": 9627, "loss": 1.7033, "learning_rate": 5.840880295970247e-06, "epoch": 0.8446037187078009, "percentage": 84.46, "elapsed_time": "2 days, 15:57:10", "remaining_time": "11:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8132, "total_steps": 9627, "loss": 1.7776, "learning_rate": 5.833229690839481e-06, "epoch": 0.8447075932273813, "percentage": 84.47, "elapsed_time": "2 days, 15:57:39", "remaining_time": "11:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8133, "total_steps": 9627, "loss": 1.7372, "learning_rate": 5.825583789125244e-06, "epoch": 0.8448114677469617, "percentage": 84.48, "elapsed_time": "2 days, 15:58:11", "remaining_time": "11:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8134, "total_steps": 9627, "loss": 1.7629, "learning_rate": 5.817942591641762e-06, "epoch": 0.844915342266542, "percentage": 84.49, "elapsed_time": "2 days, 15:58:41", "remaining_time": "11:44:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8135, "total_steps": 9627, "loss": 1.6475, "learning_rate": 5.810306099202755e-06, "epoch": 0.8450192167861224, "percentage": 84.5, "elapsed_time": "2 days, 15:59:11", "remaining_time": "11:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8136, "total_steps": 9627, "loss": 1.477, "learning_rate": 5.802674312621448e-06, "epoch": 0.8451230913057027, "percentage": 84.51, "elapsed_time": "2 days, 15:59:40", "remaining_time": "11:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8137, "total_steps": 9627, "loss": 1.586, "learning_rate": 5.795047232710599e-06, "epoch": 0.845226965825283, "percentage": 84.52, "elapsed_time": "2 days, 16:00:10", "remaining_time": "11:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8138, "total_steps": 9627, "loss": 1.5229, "learning_rate": 5.787424860282392e-06, "epoch": 0.8453308403448634, "percentage": 84.53, "elapsed_time": "2 days, 16:00:41", "remaining_time": "11:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8139, "total_steps": 9627, "loss": 1.7491, "learning_rate": 5.779807196148556e-06, "epoch": 0.8454347148644438, "percentage": 84.54, "elapsed_time": "2 days, 16:01:11", "remaining_time": "11:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8140, "total_steps": 9627, "loss": 1.5724, "learning_rate": 5.772194241120338e-06, "epoch": 0.8455385893840242, "percentage": 84.55, "elapsed_time": "2 days, 16:01:41", "remaining_time": "11:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8141, "total_steps": 9627, "loss": 1.7322, "learning_rate": 5.764585996008437e-06, "epoch": 0.8456424639036044, "percentage": 84.56, "elapsed_time": "2 days, 16:02:11", "remaining_time": "11:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8142, "total_steps": 9627, "loss": 1.763, "learning_rate": 5.756982461623084e-06, "epoch": 0.8457463384231848, "percentage": 84.57, "elapsed_time": "2 days, 16:02:41", "remaining_time": "11:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8143, "total_steps": 9627, "loss": 1.9331, "learning_rate": 5.749383638773986e-06, "epoch": 0.8458502129427652, "percentage": 84.59, "elapsed_time": "2 days, 16:03:10", "remaining_time": "11:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8144, "total_steps": 9627, "loss": 1.6423, "learning_rate": 5.7417895282703635e-06, "epoch": 0.8459540874623455, "percentage": 84.6, "elapsed_time": "2 days, 16:03:41", "remaining_time": "11:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8145, "total_steps": 9627, "loss": 1.5123, "learning_rate": 5.734200130920925e-06, "epoch": 0.8460579619819258, "percentage": 84.61, "elapsed_time": "2 days, 16:04:11", "remaining_time": "11:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8146, "total_steps": 9627, "loss": 1.4982, "learning_rate": 5.726615447533878e-06, "epoch": 0.8461618365015062, "percentage": 84.62, "elapsed_time": "2 days, 16:04:41", "remaining_time": "11:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8147, "total_steps": 9627, "loss": 1.8708, "learning_rate": 5.719035478916967e-06, "epoch": 0.8462657110210865, "percentage": 84.63, "elapsed_time": "2 days, 16:05:13", "remaining_time": "11:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8148, "total_steps": 9627, "loss": 1.5868, "learning_rate": 5.711460225877346e-06, "epoch": 0.8463695855406669, "percentage": 84.64, "elapsed_time": "2 days, 16:05:42", "remaining_time": "11:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8149, "total_steps": 9627, "loss": 1.4511, "learning_rate": 5.703889689221758e-06, "epoch": 0.8464734600602473, "percentage": 84.65, "elapsed_time": "2 days, 16:06:12", "remaining_time": "11:37:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8150, "total_steps": 9627, "loss": 1.6854, "learning_rate": 5.696323869756398e-06, "epoch": 0.8465773345798275, "percentage": 84.66, "elapsed_time": "2 days, 16:06:42", "remaining_time": "11:37:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8151, "total_steps": 9627, "loss": 1.6919, "learning_rate": 5.68876276828696e-06, "epoch": 0.8466812090994079, "percentage": 84.67, "elapsed_time": "2 days, 16:07:14", "remaining_time": "11:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8152, "total_steps": 9627, "loss": 1.5359, "learning_rate": 5.681206385618648e-06, "epoch": 0.8467850836189883, "percentage": 84.68, "elapsed_time": "2 days, 16:07:44", "remaining_time": "11:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8153, "total_steps": 9627, "loss": 1.8919, "learning_rate": 5.6736547225561545e-06, "epoch": 0.8468889581385686, "percentage": 84.69, "elapsed_time": "2 days, 16:08:14", "remaining_time": "11:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8154, "total_steps": 9627, "loss": 1.5971, "learning_rate": 5.6661077799036785e-06, "epoch": 0.846992832658149, "percentage": 84.7, "elapsed_time": "2 days, 16:08:44", "remaining_time": "11:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8155, "total_steps": 9627, "loss": 1.6858, "learning_rate": 5.65856555846489e-06, "epoch": 0.8470967071777293, "percentage": 84.71, "elapsed_time": "2 days, 16:09:14", "remaining_time": "11:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8156, "total_steps": 9627, "loss": 1.673, "learning_rate": 5.6510280590430174e-06, "epoch": 0.8472005816973096, "percentage": 84.72, "elapsed_time": "2 days, 16:09:44", "remaining_time": "11:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8157, "total_steps": 9627, "loss": 1.5692, "learning_rate": 5.643495282440703e-06, "epoch": 0.84730445621689, "percentage": 84.73, "elapsed_time": "2 days, 16:10:14", "remaining_time": "11:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8158, "total_steps": 9627, "loss": 1.5003, "learning_rate": 5.635967229460154e-06, "epoch": 0.8474083307364704, "percentage": 84.74, "elapsed_time": "2 days, 16:10:45", "remaining_time": "11:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8159, "total_steps": 9627, "loss": 1.6919, "learning_rate": 5.628443900903041e-06, "epoch": 0.8475122052560506, "percentage": 84.75, "elapsed_time": "2 days, 16:11:16", "remaining_time": "11:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8160, "total_steps": 9627, "loss": 1.602, "learning_rate": 5.62092529757054e-06, "epoch": 0.847616079775631, "percentage": 84.76, "elapsed_time": "2 days, 16:11:46", "remaining_time": "11:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8161, "total_steps": 9627, "loss": 1.6129, "learning_rate": 5.613411420263331e-06, "epoch": 0.8477199542952114, "percentage": 84.77, "elapsed_time": "2 days, 16:12:16", "remaining_time": "11:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8162, "total_steps": 9627, "loss": 1.572, "learning_rate": 5.605902269781571e-06, "epoch": 0.8478238288147917, "percentage": 84.78, "elapsed_time": "2 days, 16:12:46", "remaining_time": "11:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8163, "total_steps": 9627, "loss": 1.6821, "learning_rate": 5.598397846924935e-06, "epoch": 0.8479277033343721, "percentage": 84.79, "elapsed_time": "2 days, 16:13:16", "remaining_time": "11:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8164, "total_steps": 9627, "loss": 1.6375, "learning_rate": 5.590898152492574e-06, "epoch": 0.8480315778539524, "percentage": 84.8, "elapsed_time": "2 days, 16:13:46", "remaining_time": "11:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8165, "total_steps": 9627, "loss": 1.7255, "learning_rate": 5.583403187283159e-06, "epoch": 0.8481354523735328, "percentage": 84.81, "elapsed_time": "2 days, 16:14:17", "remaining_time": "11:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8166, "total_steps": 9627, "loss": 1.7604, "learning_rate": 5.575912952094858e-06, "epoch": 0.8482393268931131, "percentage": 84.82, "elapsed_time": "2 days, 16:14:46", "remaining_time": "11:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8167, "total_steps": 9627, "loss": 1.7037, "learning_rate": 5.568427447725283e-06, "epoch": 0.8483432014126935, "percentage": 84.83, "elapsed_time": "2 days, 16:15:17", "remaining_time": "11:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8168, "total_steps": 9627, "loss": 1.8658, "learning_rate": 5.560946674971618e-06, "epoch": 0.8484470759322739, "percentage": 84.84, "elapsed_time": "2 days, 16:15:48", "remaining_time": "11:28:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8169, "total_steps": 9627, "loss": 1.5678, "learning_rate": 5.553470634630492e-06, "epoch": 0.8485509504518541, "percentage": 84.86, "elapsed_time": "2 days, 16:16:18", "remaining_time": "11:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8170, "total_steps": 9627, "loss": 1.6442, "learning_rate": 5.5459993274980525e-06, "epoch": 0.8486548249714345, "percentage": 84.87, "elapsed_time": "2 days, 16:16:49", "remaining_time": "11:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8171, "total_steps": 9627, "loss": 1.6004, "learning_rate": 5.538532754369924e-06, "epoch": 0.8487586994910149, "percentage": 84.88, "elapsed_time": "2 days, 16:17:19", "remaining_time": "11:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8172, "total_steps": 9627, "loss": 1.5942, "learning_rate": 5.531070916041247e-06, "epoch": 0.8488625740105952, "percentage": 84.89, "elapsed_time": "2 days, 16:17:50", "remaining_time": "11:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8173, "total_steps": 9627, "loss": 1.6922, "learning_rate": 5.523613813306644e-06, "epoch": 0.8489664485301756, "percentage": 84.9, "elapsed_time": "2 days, 16:18:20", "remaining_time": "11:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8174, "total_steps": 9627, "loss": 1.6135, "learning_rate": 5.516161446960233e-06, "epoch": 0.8490703230497559, "percentage": 84.91, "elapsed_time": "2 days, 16:18:50", "remaining_time": "11:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8175, "total_steps": 9627, "loss": 1.5972, "learning_rate": 5.508713817795658e-06, "epoch": 0.8491741975693362, "percentage": 84.92, "elapsed_time": "2 days, 16:19:20", "remaining_time": "11:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8176, "total_steps": 9627, "loss": 1.5106, "learning_rate": 5.501270926606e-06, "epoch": 0.8492780720889166, "percentage": 84.93, "elapsed_time": "2 days, 16:19:50", "remaining_time": "11:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8177, "total_steps": 9627, "loss": 1.9156, "learning_rate": 5.493832774183894e-06, "epoch": 0.849381946608497, "percentage": 84.94, "elapsed_time": "2 days, 16:20:20", "remaining_time": "11:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8178, "total_steps": 9627, "loss": 1.592, "learning_rate": 5.4863993613214314e-06, "epoch": 0.8494858211280772, "percentage": 84.95, "elapsed_time": "2 days, 16:20:51", "remaining_time": "11:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8179, "total_steps": 9627, "loss": 1.6454, "learning_rate": 5.478970688810225e-06, "epoch": 0.8495896956476576, "percentage": 84.96, "elapsed_time": "2 days, 16:21:22", "remaining_time": "11:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8180, "total_steps": 9627, "loss": 1.7903, "learning_rate": 5.471546757441359e-06, "epoch": 0.849693570167238, "percentage": 84.97, "elapsed_time": "2 days, 16:21:52", "remaining_time": "11:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8181, "total_steps": 9627, "loss": 1.5594, "learning_rate": 5.464127568005423e-06, "epoch": 0.8497974446868183, "percentage": 84.98, "elapsed_time": "2 days, 16:22:22", "remaining_time": "11:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8182, "total_steps": 9627, "loss": 1.6509, "learning_rate": 5.456713121292517e-06, "epoch": 0.8499013192063987, "percentage": 84.99, "elapsed_time": "2 days, 16:22:52", "remaining_time": "11:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8183, "total_steps": 9627, "loss": 1.4437, "learning_rate": 5.4493034180921944e-06, "epoch": 0.850005193725979, "percentage": 85.0, "elapsed_time": "2 days, 16:23:23", "remaining_time": "11:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8184, "total_steps": 9627, "loss": 1.689, "learning_rate": 5.441898459193573e-06, "epoch": 0.8501090682455593, "percentage": 85.01, "elapsed_time": "2 days, 16:23:54", "remaining_time": "11:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8185, "total_steps": 9627, "loss": 1.6464, "learning_rate": 5.434498245385184e-06, "epoch": 0.8502129427651397, "percentage": 85.02, "elapsed_time": "2 days, 16:24:23", "remaining_time": "11:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8186, "total_steps": 9627, "loss": 1.4614, "learning_rate": 5.427102777455112e-06, "epoch": 0.8503168172847201, "percentage": 85.03, "elapsed_time": "2 days, 16:24:54", "remaining_time": "11:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8187, "total_steps": 9627, "loss": 1.5345, "learning_rate": 5.419712056190912e-06, "epoch": 0.8504206918043004, "percentage": 85.04, "elapsed_time": "2 days, 16:25:24", "remaining_time": "11:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8188, "total_steps": 9627, "loss": 1.5901, "learning_rate": 5.412326082379637e-06, "epoch": 0.8505245663238807, "percentage": 85.05, "elapsed_time": "2 days, 16:25:54", "remaining_time": "11:19:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8189, "total_steps": 9627, "loss": 1.5966, "learning_rate": 5.404944856807842e-06, "epoch": 0.8506284408434611, "percentage": 85.06, "elapsed_time": "2 days, 16:26:25", "remaining_time": "11:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8190, "total_steps": 9627, "loss": 1.6621, "learning_rate": 5.3975683802615586e-06, "epoch": 0.8507323153630414, "percentage": 85.07, "elapsed_time": "2 days, 16:26:55", "remaining_time": "11:18:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8191, "total_steps": 9627, "loss": 1.6508, "learning_rate": 5.390196653526336e-06, "epoch": 0.8508361898826218, "percentage": 85.08, "elapsed_time": "2 days, 16:27:25", "remaining_time": "11:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8192, "total_steps": 9627, "loss": 1.6648, "learning_rate": 5.382829677387186e-06, "epoch": 0.8509400644022022, "percentage": 85.09, "elapsed_time": "2 days, 16:27:55", "remaining_time": "11:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8193, "total_steps": 9627, "loss": 1.7252, "learning_rate": 5.375467452628663e-06, "epoch": 0.8510439389217825, "percentage": 85.1, "elapsed_time": "2 days, 16:28:26", "remaining_time": "11:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8194, "total_steps": 9627, "loss": 1.6036, "learning_rate": 5.368109980034775e-06, "epoch": 0.8511478134413628, "percentage": 85.11, "elapsed_time": "2 days, 16:28:56", "remaining_time": "11:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8195, "total_steps": 9627, "loss": 1.5241, "learning_rate": 5.360757260389015e-06, "epoch": 0.8512516879609432, "percentage": 85.13, "elapsed_time": "2 days, 16:29:26", "remaining_time": "11:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8196, "total_steps": 9627, "loss": 1.568, "learning_rate": 5.353409294474421e-06, "epoch": 0.8513555624805236, "percentage": 85.14, "elapsed_time": "2 days, 16:29:56", "remaining_time": "11:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8197, "total_steps": 9627, "loss": 1.5569, "learning_rate": 5.346066083073475e-06, "epoch": 0.8514594370001038, "percentage": 85.15, "elapsed_time": "2 days, 16:30:26", "remaining_time": "11:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8198, "total_steps": 9627, "loss": 1.6933, "learning_rate": 5.338727626968182e-06, "epoch": 0.8515633115196842, "percentage": 85.16, "elapsed_time": "2 days, 16:30:57", "remaining_time": "11:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8199, "total_steps": 9627, "loss": 1.7458, "learning_rate": 5.331393926940021e-06, "epoch": 0.8516671860392646, "percentage": 85.17, "elapsed_time": "2 days, 16:31:27", "remaining_time": "11:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8200, "total_steps": 9627, "loss": 1.6325, "learning_rate": 5.324064983769978e-06, "epoch": 0.8517710605588449, "percentage": 85.18, "elapsed_time": "2 days, 16:31:58", "remaining_time": "11:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8201, "total_steps": 9627, "loss": 1.7025, "learning_rate": 5.316740798238534e-06, "epoch": 0.8518749350784253, "percentage": 85.19, "elapsed_time": "2 days, 16:32:28", "remaining_time": "11:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8202, "total_steps": 9627, "loss": 1.7289, "learning_rate": 5.309421371125639e-06, "epoch": 0.8519788095980056, "percentage": 85.2, "elapsed_time": "2 days, 16:32:58", "remaining_time": "11:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8203, "total_steps": 9627, "loss": 1.6378, "learning_rate": 5.302106703210785e-06, "epoch": 0.8520826841175859, "percentage": 85.21, "elapsed_time": "2 days, 16:33:28", "remaining_time": "11:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8204, "total_steps": 9627, "loss": 1.8429, "learning_rate": 5.294796795272894e-06, "epoch": 0.8521865586371663, "percentage": 85.22, "elapsed_time": "2 days, 16:33:59", "remaining_time": "11:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8205, "total_steps": 9627, "loss": 1.515, "learning_rate": 5.287491648090437e-06, "epoch": 0.8522904331567467, "percentage": 85.23, "elapsed_time": "2 days, 16:34:28", "remaining_time": "11:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8206, "total_steps": 9627, "loss": 1.4383, "learning_rate": 5.280191262441353e-06, "epoch": 0.852394307676327, "percentage": 85.24, "elapsed_time": "2 days, 16:34:59", "remaining_time": "11:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8207, "total_steps": 9627, "loss": 1.6824, "learning_rate": 5.27289563910307e-06, "epoch": 0.8524981821959073, "percentage": 85.25, "elapsed_time": "2 days, 16:35:29", "remaining_time": "11:10:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8208, "total_steps": 9627, "loss": 1.525, "learning_rate": 5.265604778852512e-06, "epoch": 0.8526020567154877, "percentage": 85.26, "elapsed_time": "2 days, 16:36:00", "remaining_time": "11:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8209, "total_steps": 9627, "loss": 1.6278, "learning_rate": 5.258318682466107e-06, "epoch": 0.852705931235068, "percentage": 85.27, "elapsed_time": "2 days, 16:36:30", "remaining_time": "11:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8210, "total_steps": 9627, "loss": 1.563, "learning_rate": 5.2510373507197675e-06, "epoch": 0.8528098057546484, "percentage": 85.28, "elapsed_time": "2 days, 16:37:01", "remaining_time": "11:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8211, "total_steps": 9627, "loss": 1.5489, "learning_rate": 5.243760784388879e-06, "epoch": 0.8529136802742288, "percentage": 85.29, "elapsed_time": "2 days, 16:37:31", "remaining_time": "11:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8212, "total_steps": 9627, "loss": 1.7528, "learning_rate": 5.236488984248378e-06, "epoch": 0.853017554793809, "percentage": 85.3, "elapsed_time": "2 days, 16:38:00", "remaining_time": "11:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8213, "total_steps": 9627, "loss": 1.5852, "learning_rate": 5.229221951072611e-06, "epoch": 0.8531214293133894, "percentage": 85.31, "elapsed_time": "2 days, 16:38:30", "remaining_time": "11:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8214, "total_steps": 9627, "loss": 1.7859, "learning_rate": 5.221959685635491e-06, "epoch": 0.8532253038329698, "percentage": 85.32, "elapsed_time": "2 days, 16:39:00", "remaining_time": "11:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8215, "total_steps": 9627, "loss": 1.6043, "learning_rate": 5.2147021887103796e-06, "epoch": 0.8533291783525501, "percentage": 85.33, "elapsed_time": "2 days, 16:39:32", "remaining_time": "11:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8216, "total_steps": 9627, "loss": 1.7065, "learning_rate": 5.207449461070146e-06, "epoch": 0.8534330528721304, "percentage": 85.34, "elapsed_time": "2 days, 16:40:02", "remaining_time": "11:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8217, "total_steps": 9627, "loss": 1.8633, "learning_rate": 5.2002015034871564e-06, "epoch": 0.8535369273917108, "percentage": 85.35, "elapsed_time": "2 days, 16:40:32", "remaining_time": "11:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8218, "total_steps": 9627, "loss": 1.7325, "learning_rate": 5.1929583167332375e-06, "epoch": 0.8536408019112912, "percentage": 85.36, "elapsed_time": "2 days, 16:41:02", "remaining_time": "11:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8219, "total_steps": 9627, "loss": 1.8017, "learning_rate": 5.185719901579772e-06, "epoch": 0.8537446764308715, "percentage": 85.37, "elapsed_time": "2 days, 16:41:31", "remaining_time": "11:04:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8220, "total_steps": 9627, "loss": 1.8846, "learning_rate": 5.178486258797555e-06, "epoch": 0.8538485509504519, "percentage": 85.38, "elapsed_time": "2 days, 16:42:02", "remaining_time": "11:04:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8221, "total_steps": 9627, "loss": 1.7558, "learning_rate": 5.171257389156936e-06, "epoch": 0.8539524254700323, "percentage": 85.4, "elapsed_time": "2 days, 16:42:32", "remaining_time": "11:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8222, "total_steps": 9627, "loss": 1.6539, "learning_rate": 5.164033293427739e-06, "epoch": 0.8540562999896125, "percentage": 85.41, "elapsed_time": "2 days, 16:43:02", "remaining_time": "11:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8223, "total_steps": 9627, "loss": 1.769, "learning_rate": 5.156813972379243e-06, "epoch": 0.8541601745091929, "percentage": 85.42, "elapsed_time": "2 days, 16:43:33", "remaining_time": "11:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8224, "total_steps": 9627, "loss": 1.5509, "learning_rate": 5.1495994267802775e-06, "epoch": 0.8542640490287733, "percentage": 85.43, "elapsed_time": "2 days, 16:44:03", "remaining_time": "11:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8225, "total_steps": 9627, "loss": 1.7014, "learning_rate": 5.142389657399127e-06, "epoch": 0.8543679235483536, "percentage": 85.44, "elapsed_time": "2 days, 16:44:33", "remaining_time": "11:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8226, "total_steps": 9627, "loss": 1.602, "learning_rate": 5.135184665003573e-06, "epoch": 0.8544717980679339, "percentage": 85.45, "elapsed_time": "2 days, 16:45:03", "remaining_time": "11:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8227, "total_steps": 9627, "loss": 1.7716, "learning_rate": 5.127984450360895e-06, "epoch": 0.8545756725875143, "percentage": 85.46, "elapsed_time": "2 days, 16:45:32", "remaining_time": "11:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8228, "total_steps": 9627, "loss": 1.6233, "learning_rate": 5.120789014237859e-06, "epoch": 0.8546795471070946, "percentage": 85.47, "elapsed_time": "2 days, 16:46:04", "remaining_time": "11:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8229, "total_steps": 9627, "loss": 1.5956, "learning_rate": 5.113598357400723e-06, "epoch": 0.854783421626675, "percentage": 85.48, "elapsed_time": "2 days, 16:46:34", "remaining_time": "11:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8230, "total_steps": 9627, "loss": 1.5542, "learning_rate": 5.106412480615219e-06, "epoch": 0.8548872961462554, "percentage": 85.49, "elapsed_time": "2 days, 16:47:03", "remaining_time": "10:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8231, "total_steps": 9627, "loss": 1.6801, "learning_rate": 5.09923138464663e-06, "epoch": 0.8549911706658356, "percentage": 85.5, "elapsed_time": "2 days, 16:47:34", "remaining_time": "10:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8232, "total_steps": 9627, "loss": 1.6589, "learning_rate": 5.092055070259632e-06, "epoch": 0.855095045185416, "percentage": 85.51, "elapsed_time": "2 days, 16:48:04", "remaining_time": "10:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8233, "total_steps": 9627, "loss": 1.6403, "learning_rate": 5.0848835382184875e-06, "epoch": 0.8551989197049964, "percentage": 85.52, "elapsed_time": "2 days, 16:48:34", "remaining_time": "10:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8234, "total_steps": 9627, "loss": 1.7067, "learning_rate": 5.077716789286896e-06, "epoch": 0.8553027942245767, "percentage": 85.53, "elapsed_time": "2 days, 16:49:04", "remaining_time": "10:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8235, "total_steps": 9627, "loss": 1.667, "learning_rate": 5.070554824228052e-06, "epoch": 0.855406668744157, "percentage": 85.54, "elapsed_time": "2 days, 16:49:34", "remaining_time": "10:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8236, "total_steps": 9627, "loss": 1.4978, "learning_rate": 5.063397643804662e-06, "epoch": 0.8555105432637374, "percentage": 85.55, "elapsed_time": "2 days, 16:50:03", "remaining_time": "10:57:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8237, "total_steps": 9627, "loss": 1.5833, "learning_rate": 5.056245248778902e-06, "epoch": 0.8556144177833177, "percentage": 85.56, "elapsed_time": "2 days, 16:50:34", "remaining_time": "10:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8238, "total_steps": 9627, "loss": 1.4775, "learning_rate": 5.049097639912454e-06, "epoch": 0.8557182923028981, "percentage": 85.57, "elapsed_time": "2 days, 16:51:05", "remaining_time": "10:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8239, "total_steps": 9627, "loss": 1.612, "learning_rate": 5.04195481796646e-06, "epoch": 0.8558221668224785, "percentage": 85.58, "elapsed_time": "2 days, 16:51:34", "remaining_time": "10:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8240, "total_steps": 9627, "loss": 1.5282, "learning_rate": 5.034816783701613e-06, "epoch": 0.8559260413420587, "percentage": 85.59, "elapsed_time": "2 days, 16:52:05", "remaining_time": "10:55:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8241, "total_steps": 9627, "loss": 1.5708, "learning_rate": 5.027683537878014e-06, "epoch": 0.8560299158616391, "percentage": 85.6, "elapsed_time": "2 days, 16:52:34", "remaining_time": "10:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8242, "total_steps": 9627, "loss": 1.6524, "learning_rate": 5.0205550812553345e-06, "epoch": 0.8561337903812195, "percentage": 85.61, "elapsed_time": "2 days, 16:53:05", "remaining_time": "10:54:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8243, "total_steps": 9627, "loss": 1.8134, "learning_rate": 5.01343141459269e-06, "epoch": 0.8562376649007999, "percentage": 85.62, "elapsed_time": "2 days, 16:53:35", "remaining_time": "10:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8244, "total_steps": 9627, "loss": 1.9862, "learning_rate": 5.0063125386486834e-06, "epoch": 0.8563415394203802, "percentage": 85.63, "elapsed_time": "2 days, 16:54:05", "remaining_time": "10:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8245, "total_steps": 9627, "loss": 1.8108, "learning_rate": 4.999198454181431e-06, "epoch": 0.8564454139399605, "percentage": 85.64, "elapsed_time": "2 days, 16:54:35", "remaining_time": "10:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8246, "total_steps": 9627, "loss": 1.6589, "learning_rate": 4.99208916194851e-06, "epoch": 0.8565492884595409, "percentage": 85.65, "elapsed_time": "2 days, 16:55:04", "remaining_time": "10:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8247, "total_steps": 9627, "loss": 1.7302, "learning_rate": 4.984984662707043e-06, "epoch": 0.8566531629791212, "percentage": 85.67, "elapsed_time": "2 days, 16:55:34", "remaining_time": "10:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8248, "total_steps": 9627, "loss": 1.564, "learning_rate": 4.977884957213558e-06, "epoch": 0.8567570374987016, "percentage": 85.68, "elapsed_time": "2 days, 16:56:05", "remaining_time": "10:51:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8249, "total_steps": 9627, "loss": 1.7149, "learning_rate": 4.970790046224144e-06, "epoch": 0.856860912018282, "percentage": 85.69, "elapsed_time": "2 days, 16:56:34", "remaining_time": "10:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8250, "total_steps": 9627, "loss": 1.5095, "learning_rate": 4.963699930494364e-06, "epoch": 0.8569647865378622, "percentage": 85.7, "elapsed_time": "2 days, 16:57:06", "remaining_time": "10:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8251, "total_steps": 9627, "loss": 1.5314, "learning_rate": 4.95661461077922e-06, "epoch": 0.8570686610574426, "percentage": 85.71, "elapsed_time": "2 days, 16:57:35", "remaining_time": "10:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8252, "total_steps": 9627, "loss": 1.5747, "learning_rate": 4.94953408783328e-06, "epoch": 0.857172535577023, "percentage": 85.72, "elapsed_time": "2 days, 16:58:05", "remaining_time": "10:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8253, "total_steps": 9627, "loss": 1.628, "learning_rate": 4.942458362410557e-06, "epoch": 0.8572764100966033, "percentage": 85.73, "elapsed_time": "2 days, 16:58:35", "remaining_time": "10:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8254, "total_steps": 9627, "loss": 1.5326, "learning_rate": 4.935387435264549e-06, "epoch": 0.8573802846161837, "percentage": 85.74, "elapsed_time": "2 days, 16:59:04", "remaining_time": "10:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8255, "total_steps": 9627, "loss": 1.7157, "learning_rate": 4.928321307148265e-06, "epoch": 0.857484159135764, "percentage": 85.75, "elapsed_time": "2 days, 16:59:36", "remaining_time": "10:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8256, "total_steps": 9627, "loss": 1.8348, "learning_rate": 4.921259978814191e-06, "epoch": 0.8575880336553443, "percentage": 85.76, "elapsed_time": "2 days, 17:00:06", "remaining_time": "10:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8257, "total_steps": 9627, "loss": 1.521, "learning_rate": 4.914203451014299e-06, "epoch": 0.8576919081749247, "percentage": 85.77, "elapsed_time": "2 days, 17:00:35", "remaining_time": "10:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8258, "total_steps": 9627, "loss": 1.6885, "learning_rate": 4.907151724500048e-06, "epoch": 0.8577957826945051, "percentage": 85.78, "elapsed_time": "2 days, 17:01:06", "remaining_time": "10:46:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8259, "total_steps": 9627, "loss": 1.746, "learning_rate": 4.9001048000224205e-06, "epoch": 0.8578996572140853, "percentage": 85.79, "elapsed_time": "2 days, 17:01:36", "remaining_time": "10:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8260, "total_steps": 9627, "loss": 1.794, "learning_rate": 4.893062678331817e-06, "epoch": 0.8580035317336657, "percentage": 85.8, "elapsed_time": "2 days, 17:02:06", "remaining_time": "10:45:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8261, "total_steps": 9627, "loss": 1.6533, "learning_rate": 4.886025360178204e-06, "epoch": 0.8581074062532461, "percentage": 85.81, "elapsed_time": "2 days, 17:02:36", "remaining_time": "10:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8262, "total_steps": 9627, "loss": 1.6403, "learning_rate": 4.878992846310987e-06, "epoch": 0.8582112807728264, "percentage": 85.82, "elapsed_time": "2 days, 17:03:06", "remaining_time": "10:44:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8263, "total_steps": 9627, "loss": 1.7938, "learning_rate": 4.8719651374790735e-06, "epoch": 0.8583151552924068, "percentage": 85.83, "elapsed_time": "2 days, 17:03:36", "remaining_time": "10:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8264, "total_steps": 9627, "loss": 1.5834, "learning_rate": 4.864942234430858e-06, "epoch": 0.8584190298119871, "percentage": 85.84, "elapsed_time": "2 days, 17:04:07", "remaining_time": "10:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8265, "total_steps": 9627, "loss": 1.6952, "learning_rate": 4.857924137914233e-06, "epoch": 0.8585229043315674, "percentage": 85.85, "elapsed_time": "2 days, 17:04:37", "remaining_time": "10:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8266, "total_steps": 9627, "loss": 1.658, "learning_rate": 4.85091084867656e-06, "epoch": 0.8586267788511478, "percentage": 85.86, "elapsed_time": "2 days, 17:05:07", "remaining_time": "10:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8267, "total_steps": 9627, "loss": 1.6903, "learning_rate": 4.843902367464698e-06, "epoch": 0.8587306533707282, "percentage": 85.87, "elapsed_time": "2 days, 17:05:36", "remaining_time": "10:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8268, "total_steps": 9627, "loss": 1.7291, "learning_rate": 4.8368986950250275e-06, "epoch": 0.8588345278903085, "percentage": 85.88, "elapsed_time": "2 days, 17:06:06", "remaining_time": "10:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8269, "total_steps": 9627, "loss": 1.5672, "learning_rate": 4.829899832103335e-06, "epoch": 0.8589384024098888, "percentage": 85.89, "elapsed_time": "2 days, 17:06:36", "remaining_time": "10:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8270, "total_steps": 9627, "loss": 1.5287, "learning_rate": 4.82290577944498e-06, "epoch": 0.8590422769294692, "percentage": 85.9, "elapsed_time": "2 days, 17:07:06", "remaining_time": "10:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8271, "total_steps": 9627, "loss": 1.7356, "learning_rate": 4.815916537794763e-06, "epoch": 0.8591461514490496, "percentage": 85.91, "elapsed_time": "2 days, 17:07:36", "remaining_time": "10:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8272, "total_steps": 9627, "loss": 1.5447, "learning_rate": 4.8089321078969904e-06, "epoch": 0.8592500259686299, "percentage": 85.93, "elapsed_time": "2 days, 17:08:06", "remaining_time": "10:40:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8273, "total_steps": 9627, "loss": 1.6652, "learning_rate": 4.801952490495437e-06, "epoch": 0.8593539004882103, "percentage": 85.94, "elapsed_time": "2 days, 17:08:36", "remaining_time": "10:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8274, "total_steps": 9627, "loss": 1.6881, "learning_rate": 4.79497768633338e-06, "epoch": 0.8594577750077906, "percentage": 85.95, "elapsed_time": "2 days, 17:09:06", "remaining_time": "10:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8275, "total_steps": 9627, "loss": 1.6703, "learning_rate": 4.788007696153607e-06, "epoch": 0.8595616495273709, "percentage": 85.96, "elapsed_time": "2 days, 17:09:37", "remaining_time": "10:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8276, "total_steps": 9627, "loss": 1.7158, "learning_rate": 4.781042520698326e-06, "epoch": 0.8596655240469513, "percentage": 85.97, "elapsed_time": "2 days, 17:10:06", "remaining_time": "10:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8277, "total_steps": 9627, "loss": 1.518, "learning_rate": 4.774082160709309e-06, "epoch": 0.8597693985665317, "percentage": 85.98, "elapsed_time": "2 days, 17:10:36", "remaining_time": "10:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8278, "total_steps": 9627, "loss": 1.5671, "learning_rate": 4.767126616927769e-06, "epoch": 0.8598732730861119, "percentage": 85.99, "elapsed_time": "2 days, 17:11:06", "remaining_time": "10:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8279, "total_steps": 9627, "loss": 1.6172, "learning_rate": 4.760175890094399e-06, "epoch": 0.8599771476056923, "percentage": 86.0, "elapsed_time": "2 days, 17:11:36", "remaining_time": "10:36:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8280, "total_steps": 9627, "loss": 1.5905, "learning_rate": 4.753229980949419e-06, "epoch": 0.8600810221252727, "percentage": 86.01, "elapsed_time": "2 days, 17:12:06", "remaining_time": "10:36:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8281, "total_steps": 9627, "loss": 1.6522, "learning_rate": 4.746288890232514e-06, "epoch": 0.860184896644853, "percentage": 86.02, "elapsed_time": "2 days, 17:12:36", "remaining_time": "10:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8282, "total_steps": 9627, "loss": 1.6796, "learning_rate": 4.739352618682846e-06, "epoch": 0.8602887711644334, "percentage": 86.03, "elapsed_time": "2 days, 17:13:06", "remaining_time": "10:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8283, "total_steps": 9627, "loss": 1.6135, "learning_rate": 4.732421167039075e-06, "epoch": 0.8603926456840137, "percentage": 86.04, "elapsed_time": "2 days, 17:13:36", "remaining_time": "10:35:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8284, "total_steps": 9627, "loss": 1.4627, "learning_rate": 4.725494536039354e-06, "epoch": 0.860496520203594, "percentage": 86.05, "elapsed_time": "2 days, 17:14:05", "remaining_time": "10:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8285, "total_steps": 9627, "loss": 1.782, "learning_rate": 4.718572726421305e-06, "epoch": 0.8606003947231744, "percentage": 86.06, "elapsed_time": "2 days, 17:14:35", "remaining_time": "10:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8286, "total_steps": 9627, "loss": 1.6468, "learning_rate": 4.711655738922044e-06, "epoch": 0.8607042692427548, "percentage": 86.07, "elapsed_time": "2 days, 17:15:06", "remaining_time": "10:33:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8287, "total_steps": 9627, "loss": 1.6226, "learning_rate": 4.704743574278209e-06, "epoch": 0.860808143762335, "percentage": 86.08, "elapsed_time": "2 days, 17:15:35", "remaining_time": "10:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8288, "total_steps": 9627, "loss": 1.6135, "learning_rate": 4.697836233225838e-06, "epoch": 0.8609120182819154, "percentage": 86.09, "elapsed_time": "2 days, 17:16:05", "remaining_time": "10:32:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8289, "total_steps": 9627, "loss": 1.845, "learning_rate": 4.690933716500556e-06, "epoch": 0.8610158928014958, "percentage": 86.1, "elapsed_time": "2 days, 17:16:36", "remaining_time": "10:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8290, "total_steps": 9627, "loss": 1.7574, "learning_rate": 4.684036024837402e-06, "epoch": 0.8611197673210761, "percentage": 86.11, "elapsed_time": "2 days, 17:17:05", "remaining_time": "10:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8291, "total_steps": 9627, "loss": 1.5884, "learning_rate": 4.677143158970937e-06, "epoch": 0.8612236418406565, "percentage": 86.12, "elapsed_time": "2 days, 17:17:35", "remaining_time": "10:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8292, "total_steps": 9627, "loss": 1.6082, "learning_rate": 4.670255119635192e-06, "epoch": 0.8613275163602369, "percentage": 86.13, "elapsed_time": "2 days, 17:18:05", "remaining_time": "10:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8293, "total_steps": 9627, "loss": 1.5688, "learning_rate": 4.663371907563696e-06, "epoch": 0.8614313908798171, "percentage": 86.14, "elapsed_time": "2 days, 17:18:36", "remaining_time": "10:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8294, "total_steps": 9627, "loss": 1.7237, "learning_rate": 4.656493523489447e-06, "epoch": 0.8615352653993975, "percentage": 86.15, "elapsed_time": "2 days, 17:19:05", "remaining_time": "10:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8295, "total_steps": 9627, "loss": 1.6905, "learning_rate": 4.649619968144936e-06, "epoch": 0.8616391399189779, "percentage": 86.16, "elapsed_time": "2 days, 17:19:35", "remaining_time": "10:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8296, "total_steps": 9627, "loss": 1.5359, "learning_rate": 4.642751242262161e-06, "epoch": 0.8617430144385583, "percentage": 86.17, "elapsed_time": "2 days, 17:20:05", "remaining_time": "10:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8297, "total_steps": 9627, "loss": 1.6373, "learning_rate": 4.635887346572582e-06, "epoch": 0.8618468889581385, "percentage": 86.18, "elapsed_time": "2 days, 17:20:35", "remaining_time": "10:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8298, "total_steps": 9627, "loss": 1.7373, "learning_rate": 4.629028281807146e-06, "epoch": 0.8619507634777189, "percentage": 86.2, "elapsed_time": "2 days, 17:21:05", "remaining_time": "10:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8299, "total_steps": 9627, "loss": 1.456, "learning_rate": 4.622174048696288e-06, "epoch": 0.8620546379972993, "percentage": 86.21, "elapsed_time": "2 days, 17:21:36", "remaining_time": "10:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8300, "total_steps": 9627, "loss": 1.7349, "learning_rate": 4.615324647969932e-06, "epoch": 0.8621585125168796, "percentage": 86.22, "elapsed_time": "2 days, 17:22:05", "remaining_time": "10:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8301, "total_steps": 9627, "loss": 1.4529, "learning_rate": 4.608480080357491e-06, "epoch": 0.86226238703646, "percentage": 86.23, "elapsed_time": "2 days, 17:22:35", "remaining_time": "10:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8302, "total_steps": 9627, "loss": 1.7035, "learning_rate": 4.601640346587843e-06, "epoch": 0.8623662615560403, "percentage": 86.24, "elapsed_time": "2 days, 17:23:05", "remaining_time": "10:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8303, "total_steps": 9627, "loss": 1.6631, "learning_rate": 4.5948054473894e-06, "epoch": 0.8624701360756206, "percentage": 86.25, "elapsed_time": "2 days, 17:23:35", "remaining_time": "10:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8304, "total_steps": 9627, "loss": 1.6642, "learning_rate": 4.587975383489978e-06, "epoch": 0.862574010595201, "percentage": 86.26, "elapsed_time": "2 days, 17:24:05", "remaining_time": "10:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8305, "total_steps": 9627, "loss": 1.79, "learning_rate": 4.581150155616959e-06, "epoch": 0.8626778851147814, "percentage": 86.27, "elapsed_time": "2 days, 17:24:36", "remaining_time": "10:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8306, "total_steps": 9627, "loss": 1.7097, "learning_rate": 4.574329764497182e-06, "epoch": 0.8627817596343617, "percentage": 86.28, "elapsed_time": "2 days, 17:25:05", "remaining_time": "10:24:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8307, "total_steps": 9627, "loss": 1.6195, "learning_rate": 4.567514210856933e-06, "epoch": 0.862885634153942, "percentage": 86.29, "elapsed_time": "2 days, 17:25:35", "remaining_time": "10:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8308, "total_steps": 9627, "loss": 1.4697, "learning_rate": 4.560703495422037e-06, "epoch": 0.8629895086735224, "percentage": 86.3, "elapsed_time": "2 days, 17:26:06", "remaining_time": "10:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8309, "total_steps": 9627, "loss": 1.6035, "learning_rate": 4.553897618917785e-06, "epoch": 0.8630933831931027, "percentage": 86.31, "elapsed_time": "2 days, 17:26:35", "remaining_time": "10:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8310, "total_steps": 9627, "loss": 1.6968, "learning_rate": 4.547096582068938e-06, "epoch": 0.8631972577126831, "percentage": 86.32, "elapsed_time": "2 days, 17:27:05", "remaining_time": "10:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8311, "total_steps": 9627, "loss": 1.8258, "learning_rate": 4.540300385599761e-06, "epoch": 0.8633011322322635, "percentage": 86.33, "elapsed_time": "2 days, 17:27:35", "remaining_time": "10:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8312, "total_steps": 9627, "loss": 1.6876, "learning_rate": 4.533509030233995e-06, "epoch": 0.8634050067518437, "percentage": 86.34, "elapsed_time": "2 days, 17:28:05", "remaining_time": "10:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8313, "total_steps": 9627, "loss": 1.7243, "learning_rate": 4.5267225166948645e-06, "epoch": 0.8635088812714241, "percentage": 86.35, "elapsed_time": "2 days, 17:28:35", "remaining_time": "10:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8314, "total_steps": 9627, "loss": 1.8883, "learning_rate": 4.519940845705067e-06, "epoch": 0.8636127557910045, "percentage": 86.36, "elapsed_time": "2 days, 17:29:05", "remaining_time": "10:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8315, "total_steps": 9627, "loss": 1.4688, "learning_rate": 4.513164017986837e-06, "epoch": 0.8637166303105848, "percentage": 86.37, "elapsed_time": "2 days, 17:29:35", "remaining_time": "10:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8316, "total_steps": 9627, "loss": 1.7138, "learning_rate": 4.506392034261803e-06, "epoch": 0.8638205048301651, "percentage": 86.38, "elapsed_time": "2 days, 17:30:06", "remaining_time": "10:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8317, "total_steps": 9627, "loss": 1.6899, "learning_rate": 4.49962489525117e-06, "epoch": 0.8639243793497455, "percentage": 86.39, "elapsed_time": "2 days, 17:30:35", "remaining_time": "10:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8318, "total_steps": 9627, "loss": 1.5958, "learning_rate": 4.492862601675563e-06, "epoch": 0.8640282538693258, "percentage": 86.4, "elapsed_time": "2 days, 17:31:06", "remaining_time": "10:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8319, "total_steps": 9627, "loss": 1.8196, "learning_rate": 4.486105154255121e-06, "epoch": 0.8641321283889062, "percentage": 86.41, "elapsed_time": "2 days, 17:31:35", "remaining_time": "10:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8320, "total_steps": 9627, "loss": 1.7509, "learning_rate": 4.4793525537094595e-06, "epoch": 0.8642360029084866, "percentage": 86.42, "elapsed_time": "2 days, 17:32:06", "remaining_time": "10:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8321, "total_steps": 9627, "loss": 1.813, "learning_rate": 4.472604800757668e-06, "epoch": 0.864339877428067, "percentage": 86.43, "elapsed_time": "2 days, 17:32:36", "remaining_time": "10:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8322, "total_steps": 9627, "loss": 1.6671, "learning_rate": 4.4658618961183506e-06, "epoch": 0.8644437519476472, "percentage": 86.44, "elapsed_time": "2 days, 17:33:06", "remaining_time": "10:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8323, "total_steps": 9627, "loss": 1.5313, "learning_rate": 4.459123840509549e-06, "epoch": 0.8645476264672276, "percentage": 86.45, "elapsed_time": "2 days, 17:33:36", "remaining_time": "10:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8324, "total_steps": 9627, "loss": 1.5305, "learning_rate": 4.4523906346488345e-06, "epoch": 0.864651500986808, "percentage": 86.47, "elapsed_time": "2 days, 17:34:07", "remaining_time": "10:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8325, "total_steps": 9627, "loss": 1.5326, "learning_rate": 4.445662279253226e-06, "epoch": 0.8647553755063883, "percentage": 86.48, "elapsed_time": "2 days, 17:34:36", "remaining_time": "10:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8326, "total_steps": 9627, "loss": 1.7945, "learning_rate": 4.438938775039253e-06, "epoch": 0.8648592500259686, "percentage": 86.49, "elapsed_time": "2 days, 17:35:07", "remaining_time": "10:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8327, "total_steps": 9627, "loss": 1.7237, "learning_rate": 4.4322201227229134e-06, "epoch": 0.864963124545549, "percentage": 86.5, "elapsed_time": "2 days, 17:35:37", "remaining_time": "10:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8328, "total_steps": 9627, "loss": 1.7394, "learning_rate": 4.425506323019685e-06, "epoch": 0.8650669990651293, "percentage": 86.51, "elapsed_time": "2 days, 17:36:06", "remaining_time": "10:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8329, "total_steps": 9627, "loss": 1.6003, "learning_rate": 4.418797376644534e-06, "epoch": 0.8651708735847097, "percentage": 86.52, "elapsed_time": "2 days, 17:36:36", "remaining_time": "10:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8330, "total_steps": 9627, "loss": 1.5485, "learning_rate": 4.412093284311913e-06, "epoch": 0.8652747481042901, "percentage": 86.53, "elapsed_time": "2 days, 17:37:06", "remaining_time": "10:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8331, "total_steps": 9627, "loss": 1.5195, "learning_rate": 4.405394046735773e-06, "epoch": 0.8653786226238703, "percentage": 86.54, "elapsed_time": "2 days, 17:37:36", "remaining_time": "10:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8332, "total_steps": 9627, "loss": 1.7706, "learning_rate": 4.398699664629497e-06, "epoch": 0.8654824971434507, "percentage": 86.55, "elapsed_time": "2 days, 17:38:06", "remaining_time": "10:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8333, "total_steps": 9627, "loss": 1.6909, "learning_rate": 4.392010138706015e-06, "epoch": 0.8655863716630311, "percentage": 86.56, "elapsed_time": "2 days, 17:38:36", "remaining_time": "10:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8334, "total_steps": 9627, "loss": 1.6691, "learning_rate": 4.3853254696777036e-06, "epoch": 0.8656902461826114, "percentage": 86.57, "elapsed_time": "2 days, 17:39:07", "remaining_time": "10:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8335, "total_steps": 9627, "loss": 1.5524, "learning_rate": 4.378645658256403e-06, "epoch": 0.8657941207021917, "percentage": 86.58, "elapsed_time": "2 days, 17:39:36", "remaining_time": "10:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8336, "total_steps": 9627, "loss": 1.6553, "learning_rate": 4.371970705153489e-06, "epoch": 0.8658979952217721, "percentage": 86.59, "elapsed_time": "2 days, 17:40:07", "remaining_time": "10:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8337, "total_steps": 9627, "loss": 1.7254, "learning_rate": 4.365300611079781e-06, "epoch": 0.8660018697413524, "percentage": 86.6, "elapsed_time": "2 days, 17:40:37", "remaining_time": "10:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8338, "total_steps": 9627, "loss": 1.6613, "learning_rate": 4.358635376745601e-06, "epoch": 0.8661057442609328, "percentage": 86.61, "elapsed_time": "2 days, 17:41:06", "remaining_time": "10:09:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8339, "total_steps": 9627, "loss": 1.6243, "learning_rate": 4.351975002860731e-06, "epoch": 0.8662096187805132, "percentage": 86.62, "elapsed_time": "2 days, 17:41:36", "remaining_time": "10:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8340, "total_steps": 9627, "loss": 1.6895, "learning_rate": 4.345319490134453e-06, "epoch": 0.8663134933000934, "percentage": 86.63, "elapsed_time": "2 days, 17:42:06", "remaining_time": "10:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8341, "total_steps": 9627, "loss": 1.6746, "learning_rate": 4.338668839275534e-06, "epoch": 0.8664173678196738, "percentage": 86.64, "elapsed_time": "2 days, 17:42:36", "remaining_time": "10:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8342, "total_steps": 9627, "loss": 1.6391, "learning_rate": 4.3320230509922014e-06, "epoch": 0.8665212423392542, "percentage": 86.65, "elapsed_time": "2 days, 17:43:06", "remaining_time": "10:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8343, "total_steps": 9627, "loss": 1.5569, "learning_rate": 4.3253821259922055e-06, "epoch": 0.8666251168588345, "percentage": 86.66, "elapsed_time": "2 days, 17:43:37", "remaining_time": "10:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8344, "total_steps": 9627, "loss": 1.6763, "learning_rate": 4.318746064982721e-06, "epoch": 0.8667289913784149, "percentage": 86.67, "elapsed_time": "2 days, 17:44:06", "remaining_time": "10:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8345, "total_steps": 9627, "loss": 1.4977, "learning_rate": 4.312114868670458e-06, "epoch": 0.8668328658979952, "percentage": 86.68, "elapsed_time": "2 days, 17:44:37", "remaining_time": "10:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8346, "total_steps": 9627, "loss": 1.586, "learning_rate": 4.305488537761588e-06, "epoch": 0.8669367404175756, "percentage": 86.69, "elapsed_time": "2 days, 17:45:06", "remaining_time": "10:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8347, "total_steps": 9627, "loss": 1.6925, "learning_rate": 4.298867072961754e-06, "epoch": 0.8670406149371559, "percentage": 86.7, "elapsed_time": "2 days, 17:45:37", "remaining_time": "10:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8348, "total_steps": 9627, "loss": 1.5939, "learning_rate": 4.2922504749761005e-06, "epoch": 0.8671444894567363, "percentage": 86.71, "elapsed_time": "2 days, 17:46:08", "remaining_time": "10:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8349, "total_steps": 9627, "loss": 1.6401, "learning_rate": 4.2856387445092235e-06, "epoch": 0.8672483639763167, "percentage": 86.72, "elapsed_time": "2 days, 17:46:37", "remaining_time": "10:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8350, "total_steps": 9627, "loss": 1.4537, "learning_rate": 4.2790318822652495e-06, "epoch": 0.8673522384958969, "percentage": 86.74, "elapsed_time": "2 days, 17:47:07", "remaining_time": "10:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8351, "total_steps": 9627, "loss": 1.472, "learning_rate": 4.272429888947732e-06, "epoch": 0.8674561130154773, "percentage": 86.75, "elapsed_time": "2 days, 17:47:38", "remaining_time": "10:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8352, "total_steps": 9627, "loss": 1.7643, "learning_rate": 4.265832765259748e-06, "epoch": 0.8675599875350577, "percentage": 86.76, "elapsed_time": "2 days, 17:48:07", "remaining_time": "10:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8353, "total_steps": 9627, "loss": 1.6081, "learning_rate": 4.259240511903834e-06, "epoch": 0.867663862054638, "percentage": 86.77, "elapsed_time": "2 days, 17:48:38", "remaining_time": "10:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8354, "total_steps": 9627, "loss": 1.8201, "learning_rate": 4.252653129582013e-06, "epoch": 0.8677677365742184, "percentage": 86.78, "elapsed_time": "2 days, 17:49:08", "remaining_time": "10:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8355, "total_steps": 9627, "loss": 1.5116, "learning_rate": 4.2460706189957895e-06, "epoch": 0.8678716110937987, "percentage": 86.79, "elapsed_time": "2 days, 17:49:38", "remaining_time": "10:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8356, "total_steps": 9627, "loss": 1.772, "learning_rate": 4.239492980846155e-06, "epoch": 0.867975485613379, "percentage": 86.8, "elapsed_time": "2 days, 17:50:07", "remaining_time": "10:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8357, "total_steps": 9627, "loss": 1.9206, "learning_rate": 4.232920215833569e-06, "epoch": 0.8680793601329594, "percentage": 86.81, "elapsed_time": "2 days, 17:50:37", "remaining_time": "10:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8358, "total_steps": 9627, "loss": 1.7219, "learning_rate": 4.226352324657973e-06, "epoch": 0.8681832346525398, "percentage": 86.82, "elapsed_time": "2 days, 17:51:09", "remaining_time": "9:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8359, "total_steps": 9627, "loss": 1.8179, "learning_rate": 4.219789308018829e-06, "epoch": 0.86828710917212, "percentage": 86.83, "elapsed_time": "2 days, 17:51:39", "remaining_time": "9:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8360, "total_steps": 9627, "loss": 1.6541, "learning_rate": 4.2132311666150005e-06, "epoch": 0.8683909836917004, "percentage": 86.84, "elapsed_time": "2 days, 17:52:08", "remaining_time": "9:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8361, "total_steps": 9627, "loss": 1.5655, "learning_rate": 4.206677901144917e-06, "epoch": 0.8684948582112808, "percentage": 86.85, "elapsed_time": "2 days, 17:52:38", "remaining_time": "9:58:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8362, "total_steps": 9627, "loss": 1.707, "learning_rate": 4.200129512306439e-06, "epoch": 0.8685987327308611, "percentage": 86.86, "elapsed_time": "2 days, 17:53:08", "remaining_time": "9:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8363, "total_steps": 9627, "loss": 1.6708, "learning_rate": 4.1935860007969005e-06, "epoch": 0.8687026072504415, "percentage": 86.87, "elapsed_time": "2 days, 17:53:39", "remaining_time": "9:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8364, "total_steps": 9627, "loss": 1.5422, "learning_rate": 4.187047367313157e-06, "epoch": 0.8688064817700218, "percentage": 86.88, "elapsed_time": "2 days, 17:54:09", "remaining_time": "9:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8365, "total_steps": 9627, "loss": 1.5345, "learning_rate": 4.180513612551517e-06, "epoch": 0.8689103562896021, "percentage": 86.89, "elapsed_time": "2 days, 17:54:39", "remaining_time": "9:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8366, "total_steps": 9627, "loss": 1.5311, "learning_rate": 4.17398473720777e-06, "epoch": 0.8690142308091825, "percentage": 86.9, "elapsed_time": "2 days, 17:55:08", "remaining_time": "9:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8367, "total_steps": 9627, "loss": 1.4414, "learning_rate": 4.1674607419771915e-06, "epoch": 0.8691181053287629, "percentage": 86.91, "elapsed_time": "2 days, 17:55:38", "remaining_time": "9:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8368, "total_steps": 9627, "loss": 1.4987, "learning_rate": 4.160941627554538e-06, "epoch": 0.8692219798483432, "percentage": 86.92, "elapsed_time": "2 days, 17:56:08", "remaining_time": "9:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8369, "total_steps": 9627, "loss": 1.6341, "learning_rate": 4.154427394634036e-06, "epoch": 0.8693258543679235, "percentage": 86.93, "elapsed_time": "2 days, 17:56:39", "remaining_time": "9:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8370, "total_steps": 9627, "loss": 1.7277, "learning_rate": 4.147918043909404e-06, "epoch": 0.8694297288875039, "percentage": 86.94, "elapsed_time": "2 days, 17:57:08", "remaining_time": "9:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8371, "total_steps": 9627, "loss": 1.6332, "learning_rate": 4.14141357607386e-06, "epoch": 0.8695336034070842, "percentage": 86.95, "elapsed_time": "2 days, 17:57:39", "remaining_time": "9:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8372, "total_steps": 9627, "loss": 1.6576, "learning_rate": 4.1349139918200385e-06, "epoch": 0.8696374779266646, "percentage": 86.96, "elapsed_time": "2 days, 17:58:09", "remaining_time": "9:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8373, "total_steps": 9627, "loss": 1.517, "learning_rate": 4.1284192918401245e-06, "epoch": 0.869741352446245, "percentage": 86.97, "elapsed_time": "2 days, 17:58:39", "remaining_time": "9:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8374, "total_steps": 9627, "loss": 1.6047, "learning_rate": 4.121929476825742e-06, "epoch": 0.8698452269658253, "percentage": 86.98, "elapsed_time": "2 days, 17:59:10", "remaining_time": "9:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8375, "total_steps": 9627, "loss": 1.6017, "learning_rate": 4.1154445474680115e-06, "epoch": 0.8699491014854056, "percentage": 86.99, "elapsed_time": "2 days, 17:59:39", "remaining_time": "9:51:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8376, "total_steps": 9627, "loss": 1.7602, "learning_rate": 4.108964504457524e-06, "epoch": 0.870052976004986, "percentage": 87.01, "elapsed_time": "2 days, 18:00:10", "remaining_time": "9:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8377, "total_steps": 9627, "loss": 1.542, "learning_rate": 4.102489348484339e-06, "epoch": 0.8701568505245664, "percentage": 87.02, "elapsed_time": "2 days, 18:00:40", "remaining_time": "9:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8378, "total_steps": 9627, "loss": 1.4748, "learning_rate": 4.096019080238045e-06, "epoch": 0.8702607250441466, "percentage": 87.03, "elapsed_time": "2 days, 18:01:10", "remaining_time": "9:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8379, "total_steps": 9627, "loss": 1.6876, "learning_rate": 4.089553700407634e-06, "epoch": 0.870364599563727, "percentage": 87.04, "elapsed_time": "2 days, 18:01:39", "remaining_time": "9:50:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8380, "total_steps": 9627, "loss": 1.6637, "learning_rate": 4.083093209681649e-06, "epoch": 0.8704684740833074, "percentage": 87.05, "elapsed_time": "2 days, 18:02:09", "remaining_time": "9:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8381, "total_steps": 9627, "loss": 1.4212, "learning_rate": 4.076637608748074e-06, "epoch": 0.8705723486028877, "percentage": 87.06, "elapsed_time": "2 days, 18:02:39", "remaining_time": "9:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8382, "total_steps": 9627, "loss": 1.7361, "learning_rate": 4.070186898294375e-06, "epoch": 0.8706762231224681, "percentage": 87.07, "elapsed_time": "2 days, 18:03:09", "remaining_time": "9:48:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8383, "total_steps": 9627, "loss": 1.9468, "learning_rate": 4.063741079007505e-06, "epoch": 0.8707800976420484, "percentage": 87.08, "elapsed_time": "2 days, 18:03:39", "remaining_time": "9:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8384, "total_steps": 9627, "loss": 1.6335, "learning_rate": 4.057300151573895e-06, "epoch": 0.8708839721616287, "percentage": 87.09, "elapsed_time": "2 days, 18:04:08", "remaining_time": "9:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8385, "total_steps": 9627, "loss": 1.8369, "learning_rate": 4.050864116679454e-06, "epoch": 0.8709878466812091, "percentage": 87.1, "elapsed_time": "2 days, 18:04:38", "remaining_time": "9:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8386, "total_steps": 9627, "loss": 1.5588, "learning_rate": 4.044432975009554e-06, "epoch": 0.8710917212007895, "percentage": 87.11, "elapsed_time": "2 days, 18:05:09", "remaining_time": "9:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8387, "total_steps": 9627, "loss": 1.6729, "learning_rate": 4.038006727249094e-06, "epoch": 0.8711955957203698, "percentage": 87.12, "elapsed_time": "2 days, 18:05:39", "remaining_time": "9:46:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8388, "total_steps": 9627, "loss": 1.6353, "learning_rate": 4.031585374082381e-06, "epoch": 0.8712994702399501, "percentage": 87.13, "elapsed_time": "2 days, 18:06:09", "remaining_time": "9:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8389, "total_steps": 9627, "loss": 1.7602, "learning_rate": 4.025168916193273e-06, "epoch": 0.8714033447595305, "percentage": 87.14, "elapsed_time": "2 days, 18:06:39", "remaining_time": "9:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8390, "total_steps": 9627, "loss": 1.5152, "learning_rate": 4.0187573542650625e-06, "epoch": 0.8715072192791108, "percentage": 87.15, "elapsed_time": "2 days, 18:07:08", "remaining_time": "9:44:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8391, "total_steps": 9627, "loss": 1.775, "learning_rate": 4.01235068898051e-06, "epoch": 0.8716110937986912, "percentage": 87.16, "elapsed_time": "2 days, 18:07:38", "remaining_time": "9:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8392, "total_steps": 9627, "loss": 1.5729, "learning_rate": 4.005948921021896e-06, "epoch": 0.8717149683182716, "percentage": 87.17, "elapsed_time": "2 days, 18:08:08", "remaining_time": "9:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8393, "total_steps": 9627, "loss": 1.7396, "learning_rate": 3.99955205107096e-06, "epoch": 0.8718188428378518, "percentage": 87.18, "elapsed_time": "2 days, 18:08:39", "remaining_time": "9:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8394, "total_steps": 9627, "loss": 1.7512, "learning_rate": 3.99316007980891e-06, "epoch": 0.8719227173574322, "percentage": 87.19, "elapsed_time": "2 days, 18:09:08", "remaining_time": "9:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8395, "total_steps": 9627, "loss": 1.5736, "learning_rate": 3.9867730079164445e-06, "epoch": 0.8720265918770126, "percentage": 87.2, "elapsed_time": "2 days, 18:09:37", "remaining_time": "9:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8396, "total_steps": 9627, "loss": 1.4956, "learning_rate": 3.980390836073739e-06, "epoch": 0.8721304663965929, "percentage": 87.21, "elapsed_time": "2 days, 18:10:09", "remaining_time": "9:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8397, "total_steps": 9627, "loss": 1.5223, "learning_rate": 3.974013564960444e-06, "epoch": 0.8722343409161732, "percentage": 87.22, "elapsed_time": "2 days, 18:10:39", "remaining_time": "9:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8398, "total_steps": 9627, "loss": 1.5784, "learning_rate": 3.967641195255672e-06, "epoch": 0.8723382154357536, "percentage": 87.23, "elapsed_time": "2 days, 18:11:09", "remaining_time": "9:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8399, "total_steps": 9627, "loss": 1.652, "learning_rate": 3.9612737276380595e-06, "epoch": 0.872442089955334, "percentage": 87.24, "elapsed_time": "2 days, 18:11:39", "remaining_time": "9:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8400, "total_steps": 9627, "loss": 1.863, "learning_rate": 3.9549111627856795e-06, "epoch": 0.8725459644749143, "percentage": 87.25, "elapsed_time": "2 days, 18:12:08", "remaining_time": "9:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8401, "total_steps": 9627, "loss": 1.6226, "learning_rate": 3.948553501376096e-06, "epoch": 0.8726498389944947, "percentage": 87.26, "elapsed_time": "2 days, 18:12:39", "remaining_time": "9:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8402, "total_steps": 9627, "loss": 1.687, "learning_rate": 3.942200744086349e-06, "epoch": 0.872753713514075, "percentage": 87.28, "elapsed_time": "2 days, 18:13:09", "remaining_time": "9:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8403, "total_steps": 9627, "loss": 1.6296, "learning_rate": 3.935852891592956e-06, "epoch": 0.8728575880336553, "percentage": 87.29, "elapsed_time": "2 days, 18:13:38", "remaining_time": "9:38:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8404, "total_steps": 9627, "loss": 1.7, "learning_rate": 3.929509944571918e-06, "epoch": 0.8729614625532357, "percentage": 87.3, "elapsed_time": "2 days, 18:14:10", "remaining_time": "9:38:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8405, "total_steps": 9627, "loss": 1.627, "learning_rate": 3.9231719036987025e-06, "epoch": 0.8730653370728161, "percentage": 87.31, "elapsed_time": "2 days, 18:14:39", "remaining_time": "9:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8406, "total_steps": 9627, "loss": 1.6984, "learning_rate": 3.916838769648279e-06, "epoch": 0.8731692115923964, "percentage": 87.32, "elapsed_time": "2 days, 18:15:10", "remaining_time": "9:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8407, "total_steps": 9627, "loss": 1.5953, "learning_rate": 3.910510543095047e-06, "epoch": 0.8732730861119767, "percentage": 87.33, "elapsed_time": "2 days, 18:15:40", "remaining_time": "9:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8408, "total_steps": 9627, "loss": 1.8256, "learning_rate": 3.904187224712935e-06, "epoch": 0.8733769606315571, "percentage": 87.34, "elapsed_time": "2 days, 18:16:09", "remaining_time": "9:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8409, "total_steps": 9627, "loss": 1.6616, "learning_rate": 3.897868815175326e-06, "epoch": 0.8734808351511374, "percentage": 87.35, "elapsed_time": "2 days, 18:16:40", "remaining_time": "9:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8410, "total_steps": 9627, "loss": 1.4936, "learning_rate": 3.891555315155082e-06, "epoch": 0.8735847096707178, "percentage": 87.36, "elapsed_time": "2 days, 18:17:10", "remaining_time": "9:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8411, "total_steps": 9627, "loss": 1.5365, "learning_rate": 3.885246725324532e-06, "epoch": 0.8736885841902982, "percentage": 87.37, "elapsed_time": "2 days, 18:17:41", "remaining_time": "9:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8412, "total_steps": 9627, "loss": 1.5884, "learning_rate": 3.878943046355499e-06, "epoch": 0.8737924587098784, "percentage": 87.38, "elapsed_time": "2 days, 18:18:10", "remaining_time": "9:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8413, "total_steps": 9627, "loss": 1.6765, "learning_rate": 3.872644278919274e-06, "epoch": 0.8738963332294588, "percentage": 87.39, "elapsed_time": "2 days, 18:18:40", "remaining_time": "9:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8414, "total_steps": 9627, "loss": 1.6804, "learning_rate": 3.866350423686615e-06, "epoch": 0.8740002077490392, "percentage": 87.4, "elapsed_time": "2 days, 18:19:10", "remaining_time": "9:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8415, "total_steps": 9627, "loss": 1.7906, "learning_rate": 3.860061481327798e-06, "epoch": 0.8741040822686195, "percentage": 87.41, "elapsed_time": "2 days, 18:19:41", "remaining_time": "9:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8416, "total_steps": 9627, "loss": 1.7432, "learning_rate": 3.8537774525125195e-06, "epoch": 0.8742079567881998, "percentage": 87.42, "elapsed_time": "2 days, 18:20:10", "remaining_time": "9:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8417, "total_steps": 9627, "loss": 1.6909, "learning_rate": 3.847498337909977e-06, "epoch": 0.8743118313077802, "percentage": 87.43, "elapsed_time": "2 days, 18:20:41", "remaining_time": "9:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8418, "total_steps": 9627, "loss": 1.5617, "learning_rate": 3.8412241381888755e-06, "epoch": 0.8744157058273605, "percentage": 87.44, "elapsed_time": "2 days, 18:21:10", "remaining_time": "9:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8419, "total_steps": 9627, "loss": 1.854, "learning_rate": 3.834954854017337e-06, "epoch": 0.8745195803469409, "percentage": 87.45, "elapsed_time": "2 days, 18:21:40", "remaining_time": "9:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8420, "total_steps": 9627, "loss": 1.7667, "learning_rate": 3.828690486063013e-06, "epoch": 0.8746234548665213, "percentage": 87.46, "elapsed_time": "2 days, 18:22:11", "remaining_time": "9:30:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8421, "total_steps": 9627, "loss": 1.623, "learning_rate": 3.822431034993002e-06, "epoch": 0.8747273293861015, "percentage": 87.47, "elapsed_time": "2 days, 18:22:40", "remaining_time": "9:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8422, "total_steps": 9627, "loss": 1.6026, "learning_rate": 3.816176501473889e-06, "epoch": 0.8748312039056819, "percentage": 87.48, "elapsed_time": "2 days, 18:23:12", "remaining_time": "9:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8423, "total_steps": 9627, "loss": 1.7327, "learning_rate": 3.8099268861717275e-06, "epoch": 0.8749350784252623, "percentage": 87.49, "elapsed_time": "2 days, 18:23:41", "remaining_time": "9:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8424, "total_steps": 9627, "loss": 1.622, "learning_rate": 3.8036821897520502e-06, "epoch": 0.8750389529448427, "percentage": 87.5, "elapsed_time": "2 days, 18:24:11", "remaining_time": "9:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8425, "total_steps": 9627, "loss": 1.5021, "learning_rate": 3.7974424128798868e-06, "epoch": 0.875142827464423, "percentage": 87.51, "elapsed_time": "2 days, 18:24:40", "remaining_time": "9:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8426, "total_steps": 9627, "loss": 1.5933, "learning_rate": 3.7912075562197e-06, "epoch": 0.8752467019840033, "percentage": 87.52, "elapsed_time": "2 days, 18:25:12", "remaining_time": "9:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8427, "total_steps": 9627, "loss": 1.63, "learning_rate": 3.784977620435476e-06, "epoch": 0.8753505765035837, "percentage": 87.54, "elapsed_time": "2 days, 18:25:42", "remaining_time": "9:27:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8428, "total_steps": 9627, "loss": 1.655, "learning_rate": 3.7787526061906387e-06, "epoch": 0.875454451023164, "percentage": 87.55, "elapsed_time": "2 days, 18:26:11", "remaining_time": "9:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8429, "total_steps": 9627, "loss": 1.8994, "learning_rate": 3.7725325141481137e-06, "epoch": 0.8755583255427444, "percentage": 87.56, "elapsed_time": "2 days, 18:26:40", "remaining_time": "9:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8430, "total_steps": 9627, "loss": 1.6722, "learning_rate": 3.766317344970288e-06, "epoch": 0.8756622000623248, "percentage": 87.57, "elapsed_time": "2 days, 18:27:12", "remaining_time": "9:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8431, "total_steps": 9627, "loss": 1.6381, "learning_rate": 3.7601070993190267e-06, "epoch": 0.875766074581905, "percentage": 87.58, "elapsed_time": "2 days, 18:27:42", "remaining_time": "9:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8432, "total_steps": 9627, "loss": 1.6305, "learning_rate": 3.753901777855673e-06, "epoch": 0.8758699491014854, "percentage": 87.59, "elapsed_time": "2 days, 18:28:12", "remaining_time": "9:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8433, "total_steps": 9627, "loss": 1.6229, "learning_rate": 3.7477013812410422e-06, "epoch": 0.8759738236210658, "percentage": 87.6, "elapsed_time": "2 days, 18:28:42", "remaining_time": "9:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8434, "total_steps": 9627, "loss": 1.5569, "learning_rate": 3.7415059101354454e-06, "epoch": 0.8760776981406461, "percentage": 87.61, "elapsed_time": "2 days, 18:29:12", "remaining_time": "9:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8435, "total_steps": 9627, "loss": 1.5411, "learning_rate": 3.735315365198622e-06, "epoch": 0.8761815726602264, "percentage": 87.62, "elapsed_time": "2 days, 18:29:42", "remaining_time": "9:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8436, "total_steps": 9627, "loss": 1.5864, "learning_rate": 3.7291297470898435e-06, "epoch": 0.8762854471798068, "percentage": 87.63, "elapsed_time": "2 days, 18:30:12", "remaining_time": "9:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8437, "total_steps": 9627, "loss": 1.6638, "learning_rate": 3.7229490564678227e-06, "epoch": 0.8763893216993871, "percentage": 87.64, "elapsed_time": "2 days, 18:30:41", "remaining_time": "9:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8438, "total_steps": 9627, "loss": 1.497, "learning_rate": 3.7167732939907496e-06, "epoch": 0.8764931962189675, "percentage": 87.65, "elapsed_time": "2 days, 18:31:12", "remaining_time": "9:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8439, "total_steps": 9627, "loss": 1.5113, "learning_rate": 3.710602460316298e-06, "epoch": 0.8765970707385479, "percentage": 87.66, "elapsed_time": "2 days, 18:31:42", "remaining_time": "9:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8440, "total_steps": 9627, "loss": 1.5233, "learning_rate": 3.704436556101615e-06, "epoch": 0.8767009452581281, "percentage": 87.67, "elapsed_time": "2 days, 18:32:11", "remaining_time": "9:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8441, "total_steps": 9627, "loss": 1.6151, "learning_rate": 3.6982755820033186e-06, "epoch": 0.8768048197777085, "percentage": 87.68, "elapsed_time": "2 days, 18:32:40", "remaining_time": "9:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8442, "total_steps": 9627, "loss": 1.5301, "learning_rate": 3.6921195386774965e-06, "epoch": 0.8769086942972889, "percentage": 87.69, "elapsed_time": "2 days, 18:33:10", "remaining_time": "9:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8443, "total_steps": 9627, "loss": 1.6463, "learning_rate": 3.6859684267797455e-06, "epoch": 0.8770125688168692, "percentage": 87.7, "elapsed_time": "2 days, 18:33:40", "remaining_time": "9:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8444, "total_steps": 9627, "loss": 1.4855, "learning_rate": 3.679822246965087e-06, "epoch": 0.8771164433364496, "percentage": 87.71, "elapsed_time": "2 days, 18:34:10", "remaining_time": "9:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8445, "total_steps": 9627, "loss": 1.5532, "learning_rate": 3.673680999888035e-06, "epoch": 0.8772203178560299, "percentage": 87.72, "elapsed_time": "2 days, 18:34:40", "remaining_time": "9:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8446, "total_steps": 9627, "loss": 1.5249, "learning_rate": 3.6675446862026176e-06, "epoch": 0.8773241923756102, "percentage": 87.73, "elapsed_time": "2 days, 18:35:09", "remaining_time": "9:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8447, "total_steps": 9627, "loss": 1.6669, "learning_rate": 3.661413306562267e-06, "epoch": 0.8774280668951906, "percentage": 87.74, "elapsed_time": "2 days, 18:35:39", "remaining_time": "9:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8448, "total_steps": 9627, "loss": 1.7169, "learning_rate": 3.65528686161995e-06, "epoch": 0.877531941414771, "percentage": 87.75, "elapsed_time": "2 days, 18:36:09", "remaining_time": "9:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8449, "total_steps": 9627, "loss": 1.6258, "learning_rate": 3.649165352028083e-06, "epoch": 0.8776358159343512, "percentage": 87.76, "elapsed_time": "2 days, 18:36:39", "remaining_time": "9:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8450, "total_steps": 9627, "loss": 1.6233, "learning_rate": 3.6430487784385515e-06, "epoch": 0.8777396904539316, "percentage": 87.77, "elapsed_time": "2 days, 18:37:09", "remaining_time": "9:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8451, "total_steps": 9627, "loss": 1.6136, "learning_rate": 3.636937141502733e-06, "epoch": 0.877843564973512, "percentage": 87.78, "elapsed_time": "2 days, 18:37:38", "remaining_time": "9:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8452, "total_steps": 9627, "loss": 1.8124, "learning_rate": 3.6308304418714523e-06, "epoch": 0.8779474394930924, "percentage": 87.79, "elapsed_time": "2 days, 18:38:08", "remaining_time": "9:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8453, "total_steps": 9627, "loss": 1.708, "learning_rate": 3.6247286801950497e-06, "epoch": 0.8780513140126727, "percentage": 87.81, "elapsed_time": "2 days, 18:38:38", "remaining_time": "9:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8454, "total_steps": 9627, "loss": 1.5891, "learning_rate": 3.6186318571232893e-06, "epoch": 0.878155188532253, "percentage": 87.82, "elapsed_time": "2 days, 18:39:08", "remaining_time": "9:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8455, "total_steps": 9627, "loss": 1.6752, "learning_rate": 3.612539973305451e-06, "epoch": 0.8782590630518334, "percentage": 87.83, "elapsed_time": "2 days, 18:39:37", "remaining_time": "9:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8456, "total_steps": 9627, "loss": 1.6183, "learning_rate": 3.606453029390272e-06, "epoch": 0.8783629375714137, "percentage": 87.84, "elapsed_time": "2 days, 18:40:09", "remaining_time": "9:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8457, "total_steps": 9627, "loss": 1.9086, "learning_rate": 3.6003710260259616e-06, "epoch": 0.8784668120909941, "percentage": 87.85, "elapsed_time": "2 days, 18:40:38", "remaining_time": "9:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8458, "total_steps": 9627, "loss": 1.5987, "learning_rate": 3.5942939638602067e-06, "epoch": 0.8785706866105745, "percentage": 87.86, "elapsed_time": "2 days, 18:41:08", "remaining_time": "9:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8459, "total_steps": 9627, "loss": 1.7094, "learning_rate": 3.588221843540168e-06, "epoch": 0.8786745611301547, "percentage": 87.87, "elapsed_time": "2 days, 18:41:38", "remaining_time": "9:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8460, "total_steps": 9627, "loss": 1.6371, "learning_rate": 3.582154665712473e-06, "epoch": 0.8787784356497351, "percentage": 87.88, "elapsed_time": "2 days, 18:42:08", "remaining_time": "9:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8461, "total_steps": 9627, "loss": 1.72, "learning_rate": 3.5760924310232258e-06, "epoch": 0.8788823101693155, "percentage": 87.89, "elapsed_time": "2 days, 18:42:38", "remaining_time": "9:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8462, "total_steps": 9627, "loss": 1.769, "learning_rate": 3.5700351401180333e-06, "epoch": 0.8789861846888958, "percentage": 87.9, "elapsed_time": "2 days, 18:43:08", "remaining_time": "9:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8463, "total_steps": 9627, "loss": 1.7098, "learning_rate": 3.5639827936419123e-06, "epoch": 0.8790900592084762, "percentage": 87.91, "elapsed_time": "2 days, 18:43:38", "remaining_time": "9:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8464, "total_steps": 9627, "loss": 1.7701, "learning_rate": 3.5579353922394197e-06, "epoch": 0.8791939337280565, "percentage": 87.92, "elapsed_time": "2 days, 18:44:08", "remaining_time": "9:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8465, "total_steps": 9627, "loss": 1.7982, "learning_rate": 3.5518929365545406e-06, "epoch": 0.8792978082476368, "percentage": 87.93, "elapsed_time": "2 days, 18:44:37", "remaining_time": "9:09:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8466, "total_steps": 9627, "loss": 1.6386, "learning_rate": 3.5458554272307597e-06, "epoch": 0.8794016827672172, "percentage": 87.94, "elapsed_time": "2 days, 18:45:09", "remaining_time": "9:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8467, "total_steps": 9627, "loss": 1.6979, "learning_rate": 3.5398228649110186e-06, "epoch": 0.8795055572867976, "percentage": 87.95, "elapsed_time": "2 days, 18:45:38", "remaining_time": "9:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8468, "total_steps": 9627, "loss": 1.4209, "learning_rate": 3.533795250237737e-06, "epoch": 0.8796094318063779, "percentage": 87.96, "elapsed_time": "2 days, 18:46:08", "remaining_time": "9:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8469, "total_steps": 9627, "loss": 1.4331, "learning_rate": 3.527772583852812e-06, "epoch": 0.8797133063259582, "percentage": 87.97, "elapsed_time": "2 days, 18:46:39", "remaining_time": "9:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8470, "total_steps": 9627, "loss": 1.8114, "learning_rate": 3.521754866397603e-06, "epoch": 0.8798171808455386, "percentage": 87.98, "elapsed_time": "2 days, 18:47:09", "remaining_time": "9:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8471, "total_steps": 9627, "loss": 1.5685, "learning_rate": 3.5157420985129696e-06, "epoch": 0.8799210553651189, "percentage": 87.99, "elapsed_time": "2 days, 18:47:39", "remaining_time": "9:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8472, "total_steps": 9627, "loss": 1.4964, "learning_rate": 3.5097342808392054e-06, "epoch": 0.8800249298846993, "percentage": 88.0, "elapsed_time": "2 days, 18:48:08", "remaining_time": "9:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8473, "total_steps": 9627, "loss": 1.4608, "learning_rate": 3.5037314140160926e-06, "epoch": 0.8801288044042797, "percentage": 88.01, "elapsed_time": "2 days, 18:48:38", "remaining_time": "9:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8474, "total_steps": 9627, "loss": 1.6019, "learning_rate": 3.4977334986829145e-06, "epoch": 0.8802326789238599, "percentage": 88.02, "elapsed_time": "2 days, 18:49:08", "remaining_time": "9:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8475, "total_steps": 9627, "loss": 1.7727, "learning_rate": 3.4917405354783772e-06, "epoch": 0.8803365534434403, "percentage": 88.03, "elapsed_time": "2 days, 18:49:38", "remaining_time": "9:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8476, "total_steps": 9627, "loss": 1.7575, "learning_rate": 3.4857525250406976e-06, "epoch": 0.8804404279630207, "percentage": 88.04, "elapsed_time": "2 days, 18:50:07", "remaining_time": "9:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8477, "total_steps": 9627, "loss": 1.6869, "learning_rate": 3.479769468007543e-06, "epoch": 0.8805443024826011, "percentage": 88.05, "elapsed_time": "2 days, 18:50:37", "remaining_time": "9:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8478, "total_steps": 9627, "loss": 1.446, "learning_rate": 3.4737913650160826e-06, "epoch": 0.8806481770021813, "percentage": 88.06, "elapsed_time": "2 days, 18:51:07", "remaining_time": "9:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8479, "total_steps": 9627, "loss": 1.5894, "learning_rate": 3.467818216702917e-06, "epoch": 0.8807520515217617, "percentage": 88.08, "elapsed_time": "2 days, 18:51:37", "remaining_time": "9:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8480, "total_steps": 9627, "loss": 1.5221, "learning_rate": 3.461850023704133e-06, "epoch": 0.8808559260413421, "percentage": 88.09, "elapsed_time": "2 days, 18:52:06", "remaining_time": "9:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8481, "total_steps": 9627, "loss": 1.7771, "learning_rate": 3.4558867866553324e-06, "epoch": 0.8809598005609224, "percentage": 88.1, "elapsed_time": "2 days, 18:52:36", "remaining_time": "9:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8482, "total_steps": 9627, "loss": 1.6525, "learning_rate": 3.4499285061915134e-06, "epoch": 0.8810636750805028, "percentage": 88.11, "elapsed_time": "2 days, 18:53:06", "remaining_time": "9:01:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8483, "total_steps": 9627, "loss": 1.808, "learning_rate": 3.4439751829472123e-06, "epoch": 0.8811675496000831, "percentage": 88.12, "elapsed_time": "2 days, 18:53:36", "remaining_time": "9:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8484, "total_steps": 9627, "loss": 1.4988, "learning_rate": 3.4380268175564e-06, "epoch": 0.8812714241196634, "percentage": 88.13, "elapsed_time": "2 days, 18:54:05", "remaining_time": "9:00:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8485, "total_steps": 9627, "loss": 1.7904, "learning_rate": 3.4320834106525367e-06, "epoch": 0.8813752986392438, "percentage": 88.14, "elapsed_time": "2 days, 18:54:35", "remaining_time": "9:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8486, "total_steps": 9627, "loss": 1.4656, "learning_rate": 3.4261449628685492e-06, "epoch": 0.8814791731588242, "percentage": 88.15, "elapsed_time": "2 days, 18:55:05", "remaining_time": "8:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8487, "total_steps": 9627, "loss": 1.6166, "learning_rate": 3.4202114748368264e-06, "epoch": 0.8815830476784045, "percentage": 88.16, "elapsed_time": "2 days, 18:55:35", "remaining_time": "8:59:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8488, "total_steps": 9627, "loss": 1.681, "learning_rate": 3.414282947189251e-06, "epoch": 0.8816869221979848, "percentage": 88.17, "elapsed_time": "2 days, 18:56:06", "remaining_time": "8:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8489, "total_steps": 9627, "loss": 1.6805, "learning_rate": 3.4083593805571523e-06, "epoch": 0.8817907967175652, "percentage": 88.18, "elapsed_time": "2 days, 18:56:35", "remaining_time": "8:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8490, "total_steps": 9627, "loss": 1.7227, "learning_rate": 3.402440775571364e-06, "epoch": 0.8818946712371455, "percentage": 88.19, "elapsed_time": "2 days, 18:57:05", "remaining_time": "8:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8491, "total_steps": 9627, "loss": 1.792, "learning_rate": 3.3965271328621374e-06, "epoch": 0.8819985457567259, "percentage": 88.2, "elapsed_time": "2 days, 18:57:34", "remaining_time": "8:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8492, "total_steps": 9627, "loss": 1.589, "learning_rate": 3.390618453059263e-06, "epoch": 0.8821024202763063, "percentage": 88.21, "elapsed_time": "2 days, 18:58:05", "remaining_time": "8:57:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8493, "total_steps": 9627, "loss": 1.6795, "learning_rate": 3.384714736791955e-06, "epoch": 0.8822062947958865, "percentage": 88.22, "elapsed_time": "2 days, 18:58:35", "remaining_time": "8:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8494, "total_steps": 9627, "loss": 1.6938, "learning_rate": 3.3788159846889157e-06, "epoch": 0.8823101693154669, "percentage": 88.23, "elapsed_time": "2 days, 18:59:04", "remaining_time": "8:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8495, "total_steps": 9627, "loss": 1.6643, "learning_rate": 3.3729221973783144e-06, "epoch": 0.8824140438350473, "percentage": 88.24, "elapsed_time": "2 days, 18:59:35", "remaining_time": "8:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8496, "total_steps": 9627, "loss": 1.8358, "learning_rate": 3.3670333754877937e-06, "epoch": 0.8825179183546276, "percentage": 88.25, "elapsed_time": "2 days, 19:00:05", "remaining_time": "8:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8497, "total_steps": 9627, "loss": 1.5936, "learning_rate": 3.3611495196444685e-06, "epoch": 0.8826217928742079, "percentage": 88.26, "elapsed_time": "2 days, 19:00:34", "remaining_time": "8:54:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8498, "total_steps": 9627, "loss": 1.6163, "learning_rate": 3.355270630474916e-06, "epoch": 0.8827256673937883, "percentage": 88.27, "elapsed_time": "2 days, 19:01:05", "remaining_time": "8:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8499, "total_steps": 9627, "loss": 1.5595, "learning_rate": 3.3493967086052126e-06, "epoch": 0.8828295419133686, "percentage": 88.28, "elapsed_time": "2 days, 19:01:35", "remaining_time": "8:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8500, "total_steps": 9627, "loss": 1.5006, "learning_rate": 3.343527754660858e-06, "epoch": 0.882933416432949, "percentage": 88.29, "elapsed_time": "2 days, 19:02:04", "remaining_time": "8:53:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8501, "total_steps": 9627, "loss": 1.6199, "learning_rate": 3.3376637692668632e-06, "epoch": 0.8830372909525294, "percentage": 88.3, "elapsed_time": "2 days, 19:02:34", "remaining_time": "8:52:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8502, "total_steps": 9627, "loss": 1.7884, "learning_rate": 3.3318047530477013e-06, "epoch": 0.8831411654721097, "percentage": 88.31, "elapsed_time": "2 days, 19:03:05", "remaining_time": "8:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8503, "total_steps": 9627, "loss": 1.4395, "learning_rate": 3.3259507066273064e-06, "epoch": 0.88324503999169, "percentage": 88.32, "elapsed_time": "2 days, 19:03:34", "remaining_time": "8:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8504, "total_steps": 9627, "loss": 1.7359, "learning_rate": 3.320101630629091e-06, "epoch": 0.8833489145112704, "percentage": 88.33, "elapsed_time": "2 days, 19:04:05", "remaining_time": "8:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8505, "total_steps": 9627, "loss": 1.6038, "learning_rate": 3.3142575256759346e-06, "epoch": 0.8834527890308508, "percentage": 88.35, "elapsed_time": "2 days, 19:04:34", "remaining_time": "8:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8506, "total_steps": 9627, "loss": 1.6193, "learning_rate": 3.3084183923901834e-06, "epoch": 0.883556663550431, "percentage": 88.36, "elapsed_time": "2 days, 19:05:04", "remaining_time": "8:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8507, "total_steps": 9627, "loss": 1.636, "learning_rate": 3.302584231393674e-06, "epoch": 0.8836605380700114, "percentage": 88.37, "elapsed_time": "2 days, 19:05:34", "remaining_time": "8:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8508, "total_steps": 9627, "loss": 1.6229, "learning_rate": 3.2967550433076754e-06, "epoch": 0.8837644125895918, "percentage": 88.38, "elapsed_time": "2 days, 19:06:04", "remaining_time": "8:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8509, "total_steps": 9627, "loss": 1.639, "learning_rate": 3.290930828752986e-06, "epoch": 0.8838682871091721, "percentage": 88.39, "elapsed_time": "2 days, 19:06:35", "remaining_time": "8:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8510, "total_steps": 9627, "loss": 1.6301, "learning_rate": 3.2851115883497986e-06, "epoch": 0.8839721616287525, "percentage": 88.4, "elapsed_time": "2 days, 19:07:04", "remaining_time": "8:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8511, "total_steps": 9627, "loss": 1.5388, "learning_rate": 3.27929732271785e-06, "epoch": 0.8840760361483329, "percentage": 88.41, "elapsed_time": "2 days, 19:07:35", "remaining_time": "8:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8512, "total_steps": 9627, "loss": 1.7176, "learning_rate": 3.2734880324762962e-06, "epoch": 0.8841799106679131, "percentage": 88.42, "elapsed_time": "2 days, 19:08:05", "remaining_time": "8:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8513, "total_steps": 9627, "loss": 1.8459, "learning_rate": 3.267683718243786e-06, "epoch": 0.8842837851874935, "percentage": 88.43, "elapsed_time": "2 days, 19:08:34", "remaining_time": "8:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8514, "total_steps": 9627, "loss": 1.7073, "learning_rate": 3.261884380638436e-06, "epoch": 0.8843876597070739, "percentage": 88.44, "elapsed_time": "2 days, 19:09:04", "remaining_time": "8:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8515, "total_steps": 9627, "loss": 1.7029, "learning_rate": 3.25609002027783e-06, "epoch": 0.8844915342266542, "percentage": 88.45, "elapsed_time": "2 days, 19:09:34", "remaining_time": "8:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8516, "total_steps": 9627, "loss": 1.5025, "learning_rate": 3.250300637779019e-06, "epoch": 0.8845954087462345, "percentage": 88.46, "elapsed_time": "2 days, 19:10:03", "remaining_time": "8:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8517, "total_steps": 9627, "loss": 1.8947, "learning_rate": 3.2445162337585154e-06, "epoch": 0.8846992832658149, "percentage": 88.47, "elapsed_time": "2 days, 19:10:34", "remaining_time": "8:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8518, "total_steps": 9627, "loss": 1.9812, "learning_rate": 3.238736808832349e-06, "epoch": 0.8848031577853952, "percentage": 88.48, "elapsed_time": "2 days, 19:11:04", "remaining_time": "8:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8519, "total_steps": 9627, "loss": 1.7276, "learning_rate": 3.2329623636159435e-06, "epoch": 0.8849070323049756, "percentage": 88.49, "elapsed_time": "2 days, 19:11:34", "remaining_time": "8:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8520, "total_steps": 9627, "loss": 1.6525, "learning_rate": 3.2271928987242518e-06, "epoch": 0.885010906824556, "percentage": 88.5, "elapsed_time": "2 days, 19:12:03", "remaining_time": "8:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8521, "total_steps": 9627, "loss": 1.7034, "learning_rate": 3.2214284147716823e-06, "epoch": 0.8851147813441362, "percentage": 88.51, "elapsed_time": "2 days, 19:12:33", "remaining_time": "8:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8522, "total_steps": 9627, "loss": 1.5724, "learning_rate": 3.215668912372094e-06, "epoch": 0.8852186558637166, "percentage": 88.52, "elapsed_time": "2 days, 19:13:03", "remaining_time": "8:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8523, "total_steps": 9627, "loss": 1.5867, "learning_rate": 3.209914392138835e-06, "epoch": 0.885322530383297, "percentage": 88.53, "elapsed_time": "2 days, 19:13:34", "remaining_time": "8:42:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8524, "total_steps": 9627, "loss": 1.6334, "learning_rate": 3.2041648546847215e-06, "epoch": 0.8854264049028773, "percentage": 88.54, "elapsed_time": "2 days, 19:14:03", "remaining_time": "8:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8525, "total_steps": 9627, "loss": 1.6318, "learning_rate": 3.198420300622024e-06, "epoch": 0.8855302794224577, "percentage": 88.55, "elapsed_time": "2 days, 19:14:33", "remaining_time": "8:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8526, "total_steps": 9627, "loss": 1.5733, "learning_rate": 3.192680730562492e-06, "epoch": 0.885634153942038, "percentage": 88.56, "elapsed_time": "2 days, 19:15:03", "remaining_time": "8:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8527, "total_steps": 9627, "loss": 1.7382, "learning_rate": 3.18694614511737e-06, "epoch": 0.8857380284616183, "percentage": 88.57, "elapsed_time": "2 days, 19:15:33", "remaining_time": "8:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8528, "total_steps": 9627, "loss": 1.7749, "learning_rate": 3.181216544897314e-06, "epoch": 0.8858419029811987, "percentage": 88.58, "elapsed_time": "2 days, 19:16:03", "remaining_time": "8:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8529, "total_steps": 9627, "loss": 1.8558, "learning_rate": 3.175491930512492e-06, "epoch": 0.8859457775007791, "percentage": 88.59, "elapsed_time": "2 days, 19:16:32", "remaining_time": "8:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8530, "total_steps": 9627, "loss": 1.5591, "learning_rate": 3.1697723025725378e-06, "epoch": 0.8860496520203595, "percentage": 88.6, "elapsed_time": "2 days, 19:17:03", "remaining_time": "8:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8531, "total_steps": 9627, "loss": 1.6387, "learning_rate": 3.164057661686548e-06, "epoch": 0.8861535265399397, "percentage": 88.62, "elapsed_time": "2 days, 19:17:32", "remaining_time": "8:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8532, "total_steps": 9627, "loss": 1.6326, "learning_rate": 3.15834800846308e-06, "epoch": 0.8862574010595201, "percentage": 88.63, "elapsed_time": "2 days, 19:18:02", "remaining_time": "8:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8533, "total_steps": 9627, "loss": 1.6648, "learning_rate": 3.15264334351017e-06, "epoch": 0.8863612755791005, "percentage": 88.64, "elapsed_time": "2 days, 19:18:31", "remaining_time": "8:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8534, "total_steps": 9627, "loss": 1.8897, "learning_rate": 3.146943667435326e-06, "epoch": 0.8864651500986808, "percentage": 88.65, "elapsed_time": "2 days, 19:19:01", "remaining_time": "8:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8535, "total_steps": 9627, "loss": 1.6006, "learning_rate": 3.141248980845507e-06, "epoch": 0.8865690246182611, "percentage": 88.66, "elapsed_time": "2 days, 19:19:31", "remaining_time": "8:36:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8536, "total_steps": 9627, "loss": 1.4317, "learning_rate": 3.135559284347156e-06, "epoch": 0.8866728991378415, "percentage": 88.67, "elapsed_time": "2 days, 19:20:01", "remaining_time": "8:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8537, "total_steps": 9627, "loss": 1.5809, "learning_rate": 3.1298745785461937e-06, "epoch": 0.8867767736574218, "percentage": 88.68, "elapsed_time": "2 days, 19:20:30", "remaining_time": "8:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8538, "total_steps": 9627, "loss": 1.6632, "learning_rate": 3.1241948640479803e-06, "epoch": 0.8868806481770022, "percentage": 88.69, "elapsed_time": "2 days, 19:21:00", "remaining_time": "8:35:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8539, "total_steps": 9627, "loss": 1.5574, "learning_rate": 3.1185201414573707e-06, "epoch": 0.8869845226965826, "percentage": 88.7, "elapsed_time": "2 days, 19:21:30", "remaining_time": "8:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8540, "total_steps": 9627, "loss": 1.6832, "learning_rate": 3.112850411378676e-06, "epoch": 0.8870883972161628, "percentage": 88.71, "elapsed_time": "2 days, 19:22:00", "remaining_time": "8:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8541, "total_steps": 9627, "loss": 1.6025, "learning_rate": 3.10718567441568e-06, "epoch": 0.8871922717357432, "percentage": 88.72, "elapsed_time": "2 days, 19:22:29", "remaining_time": "8:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8542, "total_steps": 9627, "loss": 1.6887, "learning_rate": 3.101525931171634e-06, "epoch": 0.8872961462553236, "percentage": 88.73, "elapsed_time": "2 days, 19:22:59", "remaining_time": "8:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8543, "total_steps": 9627, "loss": 1.4197, "learning_rate": 3.095871182249255e-06, "epoch": 0.8874000207749039, "percentage": 88.74, "elapsed_time": "2 days, 19:23:29", "remaining_time": "8:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8544, "total_steps": 9627, "loss": 1.655, "learning_rate": 3.0902214282507225e-06, "epoch": 0.8875038952944843, "percentage": 88.75, "elapsed_time": "2 days, 19:23:59", "remaining_time": "8:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8545, "total_steps": 9627, "loss": 1.6276, "learning_rate": 3.0845766697776945e-06, "epoch": 0.8876077698140646, "percentage": 88.76, "elapsed_time": "2 days, 19:24:28", "remaining_time": "8:32:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8546, "total_steps": 9627, "loss": 1.7068, "learning_rate": 3.078936907431312e-06, "epoch": 0.8877116443336449, "percentage": 88.77, "elapsed_time": "2 days, 19:24:59", "remaining_time": "8:31:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8547, "total_steps": 9627, "loss": 1.5961, "learning_rate": 3.0733021418121342e-06, "epoch": 0.8878155188532253, "percentage": 88.78, "elapsed_time": "2 days, 19:25:28", "remaining_time": "8:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8548, "total_steps": 9627, "loss": 1.735, "learning_rate": 3.0676723735202416e-06, "epoch": 0.8879193933728057, "percentage": 88.79, "elapsed_time": "2 days, 19:25:59", "remaining_time": "8:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8549, "total_steps": 9627, "loss": 1.7273, "learning_rate": 3.0620476031551604e-06, "epoch": 0.888023267892386, "percentage": 88.8, "elapsed_time": "2 days, 19:26:27", "remaining_time": "8:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8550, "total_steps": 9627, "loss": 1.6152, "learning_rate": 3.056427831315878e-06, "epoch": 0.8881271424119663, "percentage": 88.81, "elapsed_time": "2 days, 19:26:58", "remaining_time": "8:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8551, "total_steps": 9627, "loss": 1.6926, "learning_rate": 3.0508130586008545e-06, "epoch": 0.8882310169315467, "percentage": 88.82, "elapsed_time": "2 days, 19:27:27", "remaining_time": "8:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8552, "total_steps": 9627, "loss": 1.6707, "learning_rate": 3.0452032856080227e-06, "epoch": 0.888334891451127, "percentage": 88.83, "elapsed_time": "2 days, 19:27:58", "remaining_time": "8:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8553, "total_steps": 9627, "loss": 1.6203, "learning_rate": 3.039598512934783e-06, "epoch": 0.8884387659707074, "percentage": 88.84, "elapsed_time": "2 days, 19:28:28", "remaining_time": "8:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8554, "total_steps": 9627, "loss": 1.7286, "learning_rate": 3.0339987411779846e-06, "epoch": 0.8885426404902877, "percentage": 88.85, "elapsed_time": "2 days, 19:28:58", "remaining_time": "8:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8555, "total_steps": 9627, "loss": 1.5416, "learning_rate": 3.0284039709339795e-06, "epoch": 0.8886465150098681, "percentage": 88.86, "elapsed_time": "2 days, 19:29:27", "remaining_time": "8:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8556, "total_steps": 9627, "loss": 1.6695, "learning_rate": 3.0228142027985684e-06, "epoch": 0.8887503895294484, "percentage": 88.88, "elapsed_time": "2 days, 19:29:57", "remaining_time": "8:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8557, "total_steps": 9627, "loss": 1.5937, "learning_rate": 3.017229437366992e-06, "epoch": 0.8888542640490288, "percentage": 88.89, "elapsed_time": "2 days, 19:30:27", "remaining_time": "8:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8558, "total_steps": 9627, "loss": 1.6053, "learning_rate": 3.0116496752340127e-06, "epoch": 0.8889581385686092, "percentage": 88.9, "elapsed_time": "2 days, 19:30:56", "remaining_time": "8:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8559, "total_steps": 9627, "loss": 1.491, "learning_rate": 3.0060749169938174e-06, "epoch": 0.8890620130881894, "percentage": 88.91, "elapsed_time": "2 days, 19:31:26", "remaining_time": "8:25:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8560, "total_steps": 9627, "loss": 1.775, "learning_rate": 3.000505163240075e-06, "epoch": 0.8891658876077698, "percentage": 88.92, "elapsed_time": "2 days, 19:31:57", "remaining_time": "8:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8561, "total_steps": 9627, "loss": 1.5729, "learning_rate": 2.994940414565922e-06, "epoch": 0.8892697621273502, "percentage": 88.93, "elapsed_time": "2 days, 19:32:25", "remaining_time": "8:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8562, "total_steps": 9627, "loss": 1.5631, "learning_rate": 2.9893806715639626e-06, "epoch": 0.8893736366469305, "percentage": 88.94, "elapsed_time": "2 days, 19:32:56", "remaining_time": "8:24:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8563, "total_steps": 9627, "loss": 1.599, "learning_rate": 2.9838259348262675e-06, "epoch": 0.8894775111665109, "percentage": 88.95, "elapsed_time": "2 days, 19:33:25", "remaining_time": "8:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8564, "total_steps": 9627, "loss": 1.6522, "learning_rate": 2.978276204944358e-06, "epoch": 0.8895813856860912, "percentage": 88.96, "elapsed_time": "2 days, 19:33:56", "remaining_time": "8:23:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8565, "total_steps": 9627, "loss": 1.7648, "learning_rate": 2.9727314825092667e-06, "epoch": 0.8896852602056715, "percentage": 88.97, "elapsed_time": "2 days, 19:34:26", "remaining_time": "8:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8566, "total_steps": 9627, "loss": 1.6324, "learning_rate": 2.967191768111427e-06, "epoch": 0.8897891347252519, "percentage": 88.98, "elapsed_time": "2 days, 19:34:56", "remaining_time": "8:22:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8567, "total_steps": 9627, "loss": 1.8669, "learning_rate": 2.9616570623408057e-06, "epoch": 0.8898930092448323, "percentage": 88.99, "elapsed_time": "2 days, 19:35:26", "remaining_time": "8:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8568, "total_steps": 9627, "loss": 1.6186, "learning_rate": 2.956127365786793e-06, "epoch": 0.8899968837644125, "percentage": 89.0, "elapsed_time": "2 days, 19:35:55", "remaining_time": "8:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8569, "total_steps": 9627, "loss": 1.8238, "learning_rate": 2.950602679038261e-06, "epoch": 0.8901007582839929, "percentage": 89.01, "elapsed_time": "2 days, 19:36:26", "remaining_time": "8:20:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8570, "total_steps": 9627, "loss": 1.7467, "learning_rate": 2.9450830026835407e-06, "epoch": 0.8902046328035733, "percentage": 89.02, "elapsed_time": "2 days, 19:36:55", "remaining_time": "8:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8571, "total_steps": 9627, "loss": 1.931, "learning_rate": 2.939568337310439e-06, "epoch": 0.8903085073231536, "percentage": 89.03, "elapsed_time": "2 days, 19:37:25", "remaining_time": "8:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8572, "total_steps": 9627, "loss": 1.6322, "learning_rate": 2.9340586835062302e-06, "epoch": 0.890412381842734, "percentage": 89.04, "elapsed_time": "2 days, 19:37:55", "remaining_time": "8:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8573, "total_steps": 9627, "loss": 1.5128, "learning_rate": 2.9285540418576283e-06, "epoch": 0.8905162563623144, "percentage": 89.05, "elapsed_time": "2 days, 19:38:25", "remaining_time": "8:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8574, "total_steps": 9627, "loss": 1.5671, "learning_rate": 2.9230544129508655e-06, "epoch": 0.8906201308818946, "percentage": 89.06, "elapsed_time": "2 days, 19:38:54", "remaining_time": "8:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8575, "total_steps": 9627, "loss": 1.4673, "learning_rate": 2.9175597973715828e-06, "epoch": 0.890724005401475, "percentage": 89.07, "elapsed_time": "2 days, 19:39:24", "remaining_time": "8:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8576, "total_steps": 9627, "loss": 1.6937, "learning_rate": 2.9120701957049246e-06, "epoch": 0.8908278799210554, "percentage": 89.08, "elapsed_time": "2 days, 19:39:54", "remaining_time": "8:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8577, "total_steps": 9627, "loss": 1.5243, "learning_rate": 2.906585608535495e-06, "epoch": 0.8909317544406357, "percentage": 89.09, "elapsed_time": "2 days, 19:40:24", "remaining_time": "8:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8578, "total_steps": 9627, "loss": 1.5281, "learning_rate": 2.9011060364473595e-06, "epoch": 0.891035628960216, "percentage": 89.1, "elapsed_time": "2 days, 19:40:53", "remaining_time": "8:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8579, "total_steps": 9627, "loss": 1.7556, "learning_rate": 2.8956314800240415e-06, "epoch": 0.8911395034797964, "percentage": 89.11, "elapsed_time": "2 days, 19:41:24", "remaining_time": "8:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8580, "total_steps": 9627, "loss": 1.7168, "learning_rate": 2.8901619398485347e-06, "epoch": 0.8912433779993768, "percentage": 89.12, "elapsed_time": "2 days, 19:41:52", "remaining_time": "8:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8581, "total_steps": 9627, "loss": 1.5863, "learning_rate": 2.8846974165033235e-06, "epoch": 0.8913472525189571, "percentage": 89.13, "elapsed_time": "2 days, 19:42:23", "remaining_time": "8:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8582, "total_steps": 9627, "loss": 1.5794, "learning_rate": 2.8792379105703094e-06, "epoch": 0.8914511270385375, "percentage": 89.15, "elapsed_time": "2 days, 19:42:53", "remaining_time": "8:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8583, "total_steps": 9627, "loss": 1.7181, "learning_rate": 2.8737834226309156e-06, "epoch": 0.8915550015581178, "percentage": 89.16, "elapsed_time": "2 days, 19:43:22", "remaining_time": "8:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8584, "total_steps": 9627, "loss": 1.6535, "learning_rate": 2.868333953265989e-06, "epoch": 0.8916588760776981, "percentage": 89.17, "elapsed_time": "2 days, 19:43:53", "remaining_time": "8:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8585, "total_steps": 9627, "loss": 1.6133, "learning_rate": 2.8628895030558435e-06, "epoch": 0.8917627505972785, "percentage": 89.18, "elapsed_time": "2 days, 19:44:22", "remaining_time": "8:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8586, "total_steps": 9627, "loss": 1.7044, "learning_rate": 2.8574500725802865e-06, "epoch": 0.8918666251168589, "percentage": 89.19, "elapsed_time": "2 days, 19:44:53", "remaining_time": "8:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8587, "total_steps": 9627, "loss": 1.6096, "learning_rate": 2.8520156624185777e-06, "epoch": 0.8919704996364392, "percentage": 89.2, "elapsed_time": "2 days, 19:45:21", "remaining_time": "8:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8588, "total_steps": 9627, "loss": 1.7143, "learning_rate": 2.8465862731494264e-06, "epoch": 0.8920743741560195, "percentage": 89.21, "elapsed_time": "2 days, 19:45:53", "remaining_time": "8:11:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8589, "total_steps": 9627, "loss": 1.5406, "learning_rate": 2.841161905351031e-06, "epoch": 0.8921782486755999, "percentage": 89.22, "elapsed_time": "2 days, 19:46:23", "remaining_time": "8:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8590, "total_steps": 9627, "loss": 1.7877, "learning_rate": 2.8357425596010344e-06, "epoch": 0.8922821231951802, "percentage": 89.23, "elapsed_time": "2 days, 19:46:51", "remaining_time": "8:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8591, "total_steps": 9627, "loss": 2.0108, "learning_rate": 2.830328236476559e-06, "epoch": 0.8923859977147606, "percentage": 89.24, "elapsed_time": "2 days, 19:47:21", "remaining_time": "8:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8592, "total_steps": 9627, "loss": 1.731, "learning_rate": 2.8249189365541886e-06, "epoch": 0.892489872234341, "percentage": 89.25, "elapsed_time": "2 days, 19:47:50", "remaining_time": "8:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8593, "total_steps": 9627, "loss": 1.7513, "learning_rate": 2.819514660409983e-06, "epoch": 0.8925937467539212, "percentage": 89.26, "elapsed_time": "2 days, 19:48:20", "remaining_time": "8:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8594, "total_steps": 9627, "loss": 1.5909, "learning_rate": 2.814115408619428e-06, "epoch": 0.8926976212735016, "percentage": 89.27, "elapsed_time": "2 days, 19:48:50", "remaining_time": "8:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8595, "total_steps": 9627, "loss": 1.7004, "learning_rate": 2.808721181757523e-06, "epoch": 0.892801495793082, "percentage": 89.28, "elapsed_time": "2 days, 19:49:20", "remaining_time": "8:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8596, "total_steps": 9627, "loss": 1.6818, "learning_rate": 2.80333198039871e-06, "epoch": 0.8929053703126623, "percentage": 89.29, "elapsed_time": "2 days, 19:49:49", "remaining_time": "8:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8597, "total_steps": 9627, "loss": 1.7153, "learning_rate": 2.7979478051168906e-06, "epoch": 0.8930092448322426, "percentage": 89.3, "elapsed_time": "2 days, 19:50:19", "remaining_time": "8:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8598, "total_steps": 9627, "loss": 1.6648, "learning_rate": 2.7925686564854447e-06, "epoch": 0.893113119351823, "percentage": 89.31, "elapsed_time": "2 days, 19:50:50", "remaining_time": "8:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8599, "total_steps": 9627, "loss": 1.6177, "learning_rate": 2.7871945350771977e-06, "epoch": 0.8932169938714033, "percentage": 89.32, "elapsed_time": "2 days, 19:51:18", "remaining_time": "8:06:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8600, "total_steps": 9627, "loss": 1.6729, "learning_rate": 2.781825441464464e-06, "epoch": 0.8933208683909837, "percentage": 89.33, "elapsed_time": "2 days, 19:51:49", "remaining_time": "8:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8601, "total_steps": 9627, "loss": 1.7711, "learning_rate": 2.776461376218997e-06, "epoch": 0.8934247429105641, "percentage": 89.34, "elapsed_time": "2 days, 19:52:18", "remaining_time": "8:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8602, "total_steps": 9627, "loss": 1.532, "learning_rate": 2.7711023399120463e-06, "epoch": 0.8935286174301443, "percentage": 89.35, "elapsed_time": "2 days, 19:52:49", "remaining_time": "8:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8603, "total_steps": 9627, "loss": 1.7887, "learning_rate": 2.7657483331142875e-06, "epoch": 0.8936324919497247, "percentage": 89.36, "elapsed_time": "2 days, 19:53:19", "remaining_time": "8:04:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8604, "total_steps": 9627, "loss": 1.7112, "learning_rate": 2.760399356395893e-06, "epoch": 0.8937363664693051, "percentage": 89.37, "elapsed_time": "2 days, 19:53:49", "remaining_time": "8:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8605, "total_steps": 9627, "loss": 1.6769, "learning_rate": 2.7550554103264845e-06, "epoch": 0.8938402409888855, "percentage": 89.38, "elapsed_time": "2 days, 19:54:18", "remaining_time": "8:03:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8606, "total_steps": 9627, "loss": 1.595, "learning_rate": 2.749716495475152e-06, "epoch": 0.8939441155084658, "percentage": 89.39, "elapsed_time": "2 days, 19:54:47", "remaining_time": "8:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8607, "total_steps": 9627, "loss": 1.5847, "learning_rate": 2.7443826124104454e-06, "epoch": 0.8940479900280461, "percentage": 89.4, "elapsed_time": "2 days, 19:55:17", "remaining_time": "8:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8608, "total_steps": 9627, "loss": 1.4398, "learning_rate": 2.7390537617003777e-06, "epoch": 0.8941518645476265, "percentage": 89.42, "elapsed_time": "2 days, 19:55:47", "remaining_time": "8:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8609, "total_steps": 9627, "loss": 1.7582, "learning_rate": 2.73372994391245e-06, "epoch": 0.8942557390672068, "percentage": 89.43, "elapsed_time": "2 days, 19:56:16", "remaining_time": "8:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8610, "total_steps": 9627, "loss": 1.7001, "learning_rate": 2.72841115961357e-06, "epoch": 0.8943596135867872, "percentage": 89.44, "elapsed_time": "2 days, 19:56:47", "remaining_time": "8:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8611, "total_steps": 9627, "loss": 1.5964, "learning_rate": 2.7230974093701844e-06, "epoch": 0.8944634881063676, "percentage": 89.45, "elapsed_time": "2 days, 19:57:16", "remaining_time": "8:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8612, "total_steps": 9627, "loss": 1.7961, "learning_rate": 2.7177886937481524e-06, "epoch": 0.8945673626259478, "percentage": 89.46, "elapsed_time": "2 days, 19:57:45", "remaining_time": "8:00:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8613, "total_steps": 9627, "loss": 1.4809, "learning_rate": 2.7124850133127987e-06, "epoch": 0.8946712371455282, "percentage": 89.47, "elapsed_time": "2 days, 19:58:16", "remaining_time": "8:00:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8614, "total_steps": 9627, "loss": 1.556, "learning_rate": 2.707186368628939e-06, "epoch": 0.8947751116651086, "percentage": 89.48, "elapsed_time": "2 days, 19:58:44", "remaining_time": "7:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8615, "total_steps": 9627, "loss": 1.4624, "learning_rate": 2.7018927602608323e-06, "epoch": 0.8948789861846889, "percentage": 89.49, "elapsed_time": "2 days, 19:59:14", "remaining_time": "7:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8616, "total_steps": 9627, "loss": 1.8081, "learning_rate": 2.6966041887722117e-06, "epoch": 0.8949828607042692, "percentage": 89.5, "elapsed_time": "2 days, 19:59:44", "remaining_time": "7:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8617, "total_steps": 9627, "loss": 1.7128, "learning_rate": 2.6913206547262593e-06, "epoch": 0.8950867352238496, "percentage": 89.51, "elapsed_time": "2 days, 20:00:13", "remaining_time": "7:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8618, "total_steps": 9627, "loss": 1.7452, "learning_rate": 2.6860421586856368e-06, "epoch": 0.8951906097434299, "percentage": 89.52, "elapsed_time": "2 days, 20:00:42", "remaining_time": "7:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8619, "total_steps": 9627, "loss": 1.773, "learning_rate": 2.6807687012124605e-06, "epoch": 0.8952944842630103, "percentage": 89.53, "elapsed_time": "2 days, 20:01:13", "remaining_time": "7:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8620, "total_steps": 9627, "loss": 1.6954, "learning_rate": 2.6755002828683096e-06, "epoch": 0.8953983587825907, "percentage": 89.54, "elapsed_time": "2 days, 20:01:43", "remaining_time": "7:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8621, "total_steps": 9627, "loss": 1.7723, "learning_rate": 2.6702369042142463e-06, "epoch": 0.8955022333021709, "percentage": 89.55, "elapsed_time": "2 days, 20:02:12", "remaining_time": "7:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8622, "total_steps": 9627, "loss": 1.6812, "learning_rate": 2.6649785658107494e-06, "epoch": 0.8956061078217513, "percentage": 89.56, "elapsed_time": "2 days, 20:02:41", "remaining_time": "7:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8623, "total_steps": 9627, "loss": 1.772, "learning_rate": 2.6597252682178165e-06, "epoch": 0.8957099823413317, "percentage": 89.57, "elapsed_time": "2 days, 20:03:11", "remaining_time": "7:55:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8624, "total_steps": 9627, "loss": 1.6485, "learning_rate": 2.6544770119948714e-06, "epoch": 0.895813856860912, "percentage": 89.58, "elapsed_time": "2 days, 20:03:41", "remaining_time": "7:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8625, "total_steps": 9627, "loss": 1.7824, "learning_rate": 2.6492337977008173e-06, "epoch": 0.8959177313804924, "percentage": 89.59, "elapsed_time": "2 days, 20:04:11", "remaining_time": "7:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8626, "total_steps": 9627, "loss": 1.5354, "learning_rate": 2.6439956258940193e-06, "epoch": 0.8960216059000727, "percentage": 89.6, "elapsed_time": "2 days, 20:04:40", "remaining_time": "7:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8627, "total_steps": 9627, "loss": 1.6791, "learning_rate": 2.638762497132291e-06, "epoch": 0.896125480419653, "percentage": 89.61, "elapsed_time": "2 days, 20:05:09", "remaining_time": "7:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8628, "total_steps": 9627, "loss": 1.7615, "learning_rate": 2.633534411972921e-06, "epoch": 0.8962293549392334, "percentage": 89.62, "elapsed_time": "2 days, 20:05:40", "remaining_time": "7:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8629, "total_steps": 9627, "loss": 1.535, "learning_rate": 2.628311370972664e-06, "epoch": 0.8963332294588138, "percentage": 89.63, "elapsed_time": "2 days, 20:06:10", "remaining_time": "7:52:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8630, "total_steps": 9627, "loss": 1.6903, "learning_rate": 2.6230933746877406e-06, "epoch": 0.896437103978394, "percentage": 89.64, "elapsed_time": "2 days, 20:06:39", "remaining_time": "7:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8631, "total_steps": 9627, "loss": 1.5899, "learning_rate": 2.6178804236738073e-06, "epoch": 0.8965409784979744, "percentage": 89.65, "elapsed_time": "2 days, 20:07:08", "remaining_time": "7:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8632, "total_steps": 9627, "loss": 1.8366, "learning_rate": 2.61267251848602e-06, "epoch": 0.8966448530175548, "percentage": 89.66, "elapsed_time": "2 days, 20:07:38", "remaining_time": "7:51:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8633, "total_steps": 9627, "loss": 1.6235, "learning_rate": 2.6074696596789793e-06, "epoch": 0.8967487275371352, "percentage": 89.67, "elapsed_time": "2 days, 20:08:07", "remaining_time": "7:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8634, "total_steps": 9627, "loss": 1.5863, "learning_rate": 2.6022718478067363e-06, "epoch": 0.8968526020567155, "percentage": 89.69, "elapsed_time": "2 days, 20:08:37", "remaining_time": "7:50:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8635, "total_steps": 9627, "loss": 1.7443, "learning_rate": 2.597079083422832e-06, "epoch": 0.8969564765762958, "percentage": 89.7, "elapsed_time": "2 days, 20:09:07", "remaining_time": "7:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8636, "total_steps": 9627, "loss": 1.7862, "learning_rate": 2.5918913670802346e-06, "epoch": 0.8970603510958762, "percentage": 89.71, "elapsed_time": "2 days, 20:09:37", "remaining_time": "7:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8637, "total_steps": 9627, "loss": 1.7847, "learning_rate": 2.5867086993314305e-06, "epoch": 0.8971642256154565, "percentage": 89.72, "elapsed_time": "2 days, 20:10:06", "remaining_time": "7:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8638, "total_steps": 9627, "loss": 1.6616, "learning_rate": 2.5815310807282944e-06, "epoch": 0.8972681001350369, "percentage": 89.73, "elapsed_time": "2 days, 20:10:36", "remaining_time": "7:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8639, "total_steps": 9627, "loss": 1.8507, "learning_rate": 2.5763585118222246e-06, "epoch": 0.8973719746546173, "percentage": 89.74, "elapsed_time": "2 days, 20:11:06", "remaining_time": "7:47:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8640, "total_steps": 9627, "loss": 1.9273, "learning_rate": 2.5711909931640634e-06, "epoch": 0.8974758491741975, "percentage": 89.75, "elapsed_time": "2 days, 20:11:35", "remaining_time": "7:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8641, "total_steps": 9627, "loss": 1.6388, "learning_rate": 2.566028525304087e-06, "epoch": 0.8975797236937779, "percentage": 89.76, "elapsed_time": "2 days, 20:12:06", "remaining_time": "7:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8642, "total_steps": 9627, "loss": 1.7742, "learning_rate": 2.5608711087920844e-06, "epoch": 0.8976835982133583, "percentage": 89.77, "elapsed_time": "2 days, 20:12:35", "remaining_time": "7:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8643, "total_steps": 9627, "loss": 1.5785, "learning_rate": 2.5557187441772655e-06, "epoch": 0.8977874727329386, "percentage": 89.78, "elapsed_time": "2 days, 20:13:04", "remaining_time": "7:45:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8644, "total_steps": 9627, "loss": 1.6983, "learning_rate": 2.550571432008325e-06, "epoch": 0.897891347252519, "percentage": 89.79, "elapsed_time": "2 days, 20:13:34", "remaining_time": "7:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8645, "total_steps": 9627, "loss": 1.7185, "learning_rate": 2.5454291728334022e-06, "epoch": 0.8979952217720993, "percentage": 89.8, "elapsed_time": "2 days, 20:14:03", "remaining_time": "7:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8646, "total_steps": 9627, "loss": 1.4215, "learning_rate": 2.5402919672001147e-06, "epoch": 0.8980990962916796, "percentage": 89.81, "elapsed_time": "2 days, 20:14:34", "remaining_time": "7:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8647, "total_steps": 9627, "loss": 1.5594, "learning_rate": 2.5351598156555356e-06, "epoch": 0.89820297081126, "percentage": 89.82, "elapsed_time": "2 days, 20:15:04", "remaining_time": "7:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8648, "total_steps": 9627, "loss": 1.7134, "learning_rate": 2.5300327187461837e-06, "epoch": 0.8983068453308404, "percentage": 89.83, "elapsed_time": "2 days, 20:15:34", "remaining_time": "7:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8649, "total_steps": 9627, "loss": 1.5643, "learning_rate": 2.524910677018083e-06, "epoch": 0.8984107198504206, "percentage": 89.84, "elapsed_time": "2 days, 20:16:03", "remaining_time": "7:43:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8650, "total_steps": 9627, "loss": 1.6597, "learning_rate": 2.519793691016664e-06, "epoch": 0.898514594370001, "percentage": 89.85, "elapsed_time": "2 days, 20:16:33", "remaining_time": "7:42:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8651, "total_steps": 9627, "loss": 1.5878, "learning_rate": 2.5146817612868634e-06, "epoch": 0.8986184688895814, "percentage": 89.86, "elapsed_time": "2 days, 20:17:03", "remaining_time": "7:42:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8652, "total_steps": 9627, "loss": 1.6392, "learning_rate": 2.5095748883730562e-06, "epoch": 0.8987223434091617, "percentage": 89.87, "elapsed_time": "2 days, 20:17:32", "remaining_time": "7:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8653, "total_steps": 9627, "loss": 1.6582, "learning_rate": 2.50447307281908e-06, "epoch": 0.8988262179287421, "percentage": 89.88, "elapsed_time": "2 days, 20:18:02", "remaining_time": "7:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8654, "total_steps": 9627, "loss": 1.6875, "learning_rate": 2.4993763151682448e-06, "epoch": 0.8989300924483224, "percentage": 89.89, "elapsed_time": "2 days, 20:18:31", "remaining_time": "7:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8655, "total_steps": 9627, "loss": 1.6108, "learning_rate": 2.4942846159633104e-06, "epoch": 0.8990339669679027, "percentage": 89.9, "elapsed_time": "2 days, 20:19:00", "remaining_time": "7:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8656, "total_steps": 9627, "loss": 1.6022, "learning_rate": 2.4891979757465102e-06, "epoch": 0.8991378414874831, "percentage": 89.91, "elapsed_time": "2 days, 20:19:31", "remaining_time": "7:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8657, "total_steps": 9627, "loss": 1.6271, "learning_rate": 2.484116395059516e-06, "epoch": 0.8992417160070635, "percentage": 89.92, "elapsed_time": "2 days, 20:20:00", "remaining_time": "7:39:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8658, "total_steps": 9627, "loss": 1.4597, "learning_rate": 2.479039874443495e-06, "epoch": 0.8993455905266439, "percentage": 89.93, "elapsed_time": "2 days, 20:20:30", "remaining_time": "7:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8659, "total_steps": 9627, "loss": 1.5915, "learning_rate": 2.473968414439054e-06, "epoch": 0.8994494650462241, "percentage": 89.94, "elapsed_time": "2 days, 20:20:59", "remaining_time": "7:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8660, "total_steps": 9627, "loss": 1.7938, "learning_rate": 2.468902015586255e-06, "epoch": 0.8995533395658045, "percentage": 89.96, "elapsed_time": "2 days, 20:21:29", "remaining_time": "7:37:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8661, "total_steps": 9627, "loss": 1.5711, "learning_rate": 2.4638406784246337e-06, "epoch": 0.8996572140853849, "percentage": 89.97, "elapsed_time": "2 days, 20:21:59", "remaining_time": "7:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8662, "total_steps": 9627, "loss": 1.5101, "learning_rate": 2.458784403493186e-06, "epoch": 0.8997610886049652, "percentage": 89.98, "elapsed_time": "2 days, 20:22:29", "remaining_time": "7:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8663, "total_steps": 9627, "loss": 1.706, "learning_rate": 2.453733191330365e-06, "epoch": 0.8998649631245456, "percentage": 89.99, "elapsed_time": "2 days, 20:22:59", "remaining_time": "7:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8664, "total_steps": 9627, "loss": 1.8456, "learning_rate": 2.448687042474074e-06, "epoch": 0.8999688376441259, "percentage": 90.0, "elapsed_time": "2 days, 20:23:27", "remaining_time": "7:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8665, "total_steps": 9627, "loss": 1.6289, "learning_rate": 2.4436459574617155e-06, "epoch": 0.9000727121637062, "percentage": 90.01, "elapsed_time": "2 days, 20:23:58", "remaining_time": "7:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8666, "total_steps": 9627, "loss": 1.6296, "learning_rate": 2.4386099368300943e-06, "epoch": 0.9001765866832866, "percentage": 90.02, "elapsed_time": "2 days, 20:24:27", "remaining_time": "7:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8667, "total_steps": 9627, "loss": 1.7748, "learning_rate": 2.4335789811155253e-06, "epoch": 0.900280461202867, "percentage": 90.03, "elapsed_time": "2 days, 20:24:57", "remaining_time": "7:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8668, "total_steps": 9627, "loss": 1.6025, "learning_rate": 2.4285530908537747e-06, "epoch": 0.9003843357224472, "percentage": 90.04, "elapsed_time": "2 days, 20:25:27", "remaining_time": "7:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8669, "total_steps": 9627, "loss": 1.6433, "learning_rate": 2.423532266580031e-06, "epoch": 0.9004882102420276, "percentage": 90.05, "elapsed_time": "2 days, 20:25:57", "remaining_time": "7:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8670, "total_steps": 9627, "loss": 1.55, "learning_rate": 2.4185165088289996e-06, "epoch": 0.900592084761608, "percentage": 90.06, "elapsed_time": "2 days, 20:26:26", "remaining_time": "7:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8671, "total_steps": 9627, "loss": 1.8198, "learning_rate": 2.4135058181348036e-06, "epoch": 0.9006959592811883, "percentage": 90.07, "elapsed_time": "2 days, 20:26:57", "remaining_time": "7:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8672, "total_steps": 9627, "loss": 1.7265, "learning_rate": 2.4085001950310546e-06, "epoch": 0.9007998338007687, "percentage": 90.08, "elapsed_time": "2 days, 20:27:26", "remaining_time": "7:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8673, "total_steps": 9627, "loss": 1.5325, "learning_rate": 2.403499640050805e-06, "epoch": 0.900903708320349, "percentage": 90.09, "elapsed_time": "2 days, 20:27:56", "remaining_time": "7:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8674, "total_steps": 9627, "loss": 1.5629, "learning_rate": 2.3985041537265774e-06, "epoch": 0.9010075828399293, "percentage": 90.1, "elapsed_time": "2 days, 20:28:25", "remaining_time": "7:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8675, "total_steps": 9627, "loss": 1.6934, "learning_rate": 2.3935137365903526e-06, "epoch": 0.9011114573595097, "percentage": 90.11, "elapsed_time": "2 days, 20:28:55", "remaining_time": "7:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8676, "total_steps": 9627, "loss": 1.5736, "learning_rate": 2.3885283891735664e-06, "epoch": 0.9012153318790901, "percentage": 90.12, "elapsed_time": "2 days, 20:29:24", "remaining_time": "7:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8677, "total_steps": 9627, "loss": 1.6968, "learning_rate": 2.383548112007128e-06, "epoch": 0.9013192063986704, "percentage": 90.13, "elapsed_time": "2 days, 20:29:52", "remaining_time": "7:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8678, "total_steps": 9627, "loss": 1.6976, "learning_rate": 2.3785729056213845e-06, "epoch": 0.9014230809182507, "percentage": 90.14, "elapsed_time": "2 days, 20:30:24", "remaining_time": "7:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8679, "total_steps": 9627, "loss": 1.581, "learning_rate": 2.3736027705461737e-06, "epoch": 0.9015269554378311, "percentage": 90.15, "elapsed_time": "2 days, 20:30:52", "remaining_time": "7:29:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8680, "total_steps": 9627, "loss": 1.6556, "learning_rate": 2.368637707310767e-06, "epoch": 0.9016308299574114, "percentage": 90.16, "elapsed_time": "2 days, 20:31:23", "remaining_time": "7:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8681, "total_steps": 9627, "loss": 1.802, "learning_rate": 2.3636777164439016e-06, "epoch": 0.9017347044769918, "percentage": 90.17, "elapsed_time": "2 days, 20:31:52", "remaining_time": "7:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8682, "total_steps": 9627, "loss": 1.8442, "learning_rate": 2.3587227984737835e-06, "epoch": 0.9018385789965722, "percentage": 90.18, "elapsed_time": "2 days, 20:32:22", "remaining_time": "7:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8683, "total_steps": 9627, "loss": 1.5732, "learning_rate": 2.3537729539280684e-06, "epoch": 0.9019424535161525, "percentage": 90.19, "elapsed_time": "2 days, 20:32:52", "remaining_time": "7:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8684, "total_steps": 9627, "loss": 1.4718, "learning_rate": 2.3488281833338844e-06, "epoch": 0.9020463280357328, "percentage": 90.2, "elapsed_time": "2 days, 20:33:22", "remaining_time": "7:26:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8685, "total_steps": 9627, "loss": 1.5745, "learning_rate": 2.3438884872177992e-06, "epoch": 0.9021502025553132, "percentage": 90.22, "elapsed_time": "2 days, 20:33:51", "remaining_time": "7:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8686, "total_steps": 9627, "loss": 1.8402, "learning_rate": 2.338953866105864e-06, "epoch": 0.9022540770748936, "percentage": 90.23, "elapsed_time": "2 days, 20:34:22", "remaining_time": "7:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8687, "total_steps": 9627, "loss": 1.7328, "learning_rate": 2.3340243205235703e-06, "epoch": 0.9023579515944739, "percentage": 90.24, "elapsed_time": "2 days, 20:34:50", "remaining_time": "7:25:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8688, "total_steps": 9627, "loss": 1.7364, "learning_rate": 2.3290998509958752e-06, "epoch": 0.9024618261140542, "percentage": 90.25, "elapsed_time": "2 days, 20:35:20", "remaining_time": "7:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8689, "total_steps": 9627, "loss": 1.6693, "learning_rate": 2.324180458047198e-06, "epoch": 0.9025657006336346, "percentage": 90.26, "elapsed_time": "2 days, 20:35:49", "remaining_time": "7:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8690, "total_steps": 9627, "loss": 1.7195, "learning_rate": 2.3192661422014204e-06, "epoch": 0.9026695751532149, "percentage": 90.27, "elapsed_time": "2 days, 20:36:19", "remaining_time": "7:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8691, "total_steps": 9627, "loss": 1.5864, "learning_rate": 2.3143569039818737e-06, "epoch": 0.9027734496727953, "percentage": 90.28, "elapsed_time": "2 days, 20:36:49", "remaining_time": "7:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8692, "total_steps": 9627, "loss": 1.7092, "learning_rate": 2.3094527439113446e-06, "epoch": 0.9028773241923757, "percentage": 90.29, "elapsed_time": "2 days, 20:37:19", "remaining_time": "7:22:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8693, "total_steps": 9627, "loss": 1.5689, "learning_rate": 2.3045536625121155e-06, "epoch": 0.9029811987119559, "percentage": 90.3, "elapsed_time": "2 days, 20:37:48", "remaining_time": "7:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8694, "total_steps": 9627, "loss": 1.7061, "learning_rate": 2.2996596603058695e-06, "epoch": 0.9030850732315363, "percentage": 90.31, "elapsed_time": "2 days, 20:38:18", "remaining_time": "7:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8695, "total_steps": 9627, "loss": 1.6226, "learning_rate": 2.294770737813795e-06, "epoch": 0.9031889477511167, "percentage": 90.32, "elapsed_time": "2 days, 20:38:48", "remaining_time": "7:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8696, "total_steps": 9627, "loss": 1.5687, "learning_rate": 2.289886895556531e-06, "epoch": 0.903292822270697, "percentage": 90.33, "elapsed_time": "2 days, 20:39:18", "remaining_time": "7:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8697, "total_steps": 9627, "loss": 1.9438, "learning_rate": 2.285008134054145e-06, "epoch": 0.9033966967902773, "percentage": 90.34, "elapsed_time": "2 days, 20:39:47", "remaining_time": "7:20:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8698, "total_steps": 9627, "loss": 1.6155, "learning_rate": 2.2801344538262103e-06, "epoch": 0.9035005713098577, "percentage": 90.35, "elapsed_time": "2 days, 20:40:15", "remaining_time": "7:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8699, "total_steps": 9627, "loss": 1.669, "learning_rate": 2.2752658553917226e-06, "epoch": 0.903604445829438, "percentage": 90.36, "elapsed_time": "2 days, 20:40:46", "remaining_time": "7:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8700, "total_steps": 9627, "loss": 1.7943, "learning_rate": 2.270402339269162e-06, "epoch": 0.9037083203490184, "percentage": 90.37, "elapsed_time": "2 days, 20:41:16", "remaining_time": "7:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8701, "total_steps": 9627, "loss": 1.5809, "learning_rate": 2.2655439059764415e-06, "epoch": 0.9038121948685988, "percentage": 90.38, "elapsed_time": "2 days, 20:41:45", "remaining_time": "7:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8702, "total_steps": 9627, "loss": 1.5512, "learning_rate": 2.2606905560309534e-06, "epoch": 0.903916069388179, "percentage": 90.39, "elapsed_time": "2 days, 20:42:16", "remaining_time": "7:18:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8703, "total_steps": 9627, "loss": 1.5806, "learning_rate": 2.2558422899495392e-06, "epoch": 0.9040199439077594, "percentage": 90.4, "elapsed_time": "2 days, 20:42:45", "remaining_time": "7:17:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8704, "total_steps": 9627, "loss": 1.71, "learning_rate": 2.2509991082484914e-06, "epoch": 0.9041238184273398, "percentage": 90.41, "elapsed_time": "2 days, 20:43:15", "remaining_time": "7:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8705, "total_steps": 9627, "loss": 1.5765, "learning_rate": 2.2461610114436038e-06, "epoch": 0.9042276929469201, "percentage": 90.42, "elapsed_time": "2 days, 20:43:45", "remaining_time": "7:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8706, "total_steps": 9627, "loss": 1.4221, "learning_rate": 2.241328000050058e-06, "epoch": 0.9043315674665005, "percentage": 90.43, "elapsed_time": "2 days, 20:44:14", "remaining_time": "7:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8707, "total_steps": 9627, "loss": 1.6554, "learning_rate": 2.236500074582554e-06, "epoch": 0.9044354419860808, "percentage": 90.44, "elapsed_time": "2 days, 20:44:43", "remaining_time": "7:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8708, "total_steps": 9627, "loss": 1.4211, "learning_rate": 2.2316772355552185e-06, "epoch": 0.9045393165056611, "percentage": 90.45, "elapsed_time": "2 days, 20:45:14", "remaining_time": "7:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8709, "total_steps": 9627, "loss": 1.6462, "learning_rate": 2.226859483481658e-06, "epoch": 0.9046431910252415, "percentage": 90.46, "elapsed_time": "2 days, 20:45:43", "remaining_time": "7:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8710, "total_steps": 9627, "loss": 1.6724, "learning_rate": 2.222046818874912e-06, "epoch": 0.9047470655448219, "percentage": 90.47, "elapsed_time": "2 days, 20:46:12", "remaining_time": "7:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8711, "total_steps": 9627, "loss": 1.5371, "learning_rate": 2.217239242247493e-06, "epoch": 0.9048509400644023, "percentage": 90.49, "elapsed_time": "2 days, 20:46:41", "remaining_time": "7:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8712, "total_steps": 9627, "loss": 1.7528, "learning_rate": 2.2124367541113856e-06, "epoch": 0.9049548145839825, "percentage": 90.5, "elapsed_time": "2 days, 20:47:12", "remaining_time": "7:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8713, "total_steps": 9627, "loss": 1.5377, "learning_rate": 2.207639354977997e-06, "epoch": 0.9050586891035629, "percentage": 90.51, "elapsed_time": "2 days, 20:47:41", "remaining_time": "7:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8714, "total_steps": 9627, "loss": 1.798, "learning_rate": 2.2028470453582253e-06, "epoch": 0.9051625636231433, "percentage": 90.52, "elapsed_time": "2 days, 20:48:11", "remaining_time": "7:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8715, "total_steps": 9627, "loss": 1.6247, "learning_rate": 2.1980598257624165e-06, "epoch": 0.9052664381427236, "percentage": 90.53, "elapsed_time": "2 days, 20:48:41", "remaining_time": "7:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8716, "total_steps": 9627, "loss": 1.8091, "learning_rate": 2.193277696700363e-06, "epoch": 0.9053703126623039, "percentage": 90.54, "elapsed_time": "2 days, 20:49:09", "remaining_time": "7:11:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8717, "total_steps": 9627, "loss": 1.8274, "learning_rate": 2.188500658681325e-06, "epoch": 0.9054741871818843, "percentage": 90.55, "elapsed_time": "2 days, 20:49:40", "remaining_time": "7:11:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8718, "total_steps": 9627, "loss": 1.5299, "learning_rate": 2.183728712214028e-06, "epoch": 0.9055780617014646, "percentage": 90.56, "elapsed_time": "2 days, 20:50:09", "remaining_time": "7:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8719, "total_steps": 9627, "loss": 1.7601, "learning_rate": 2.1789618578066386e-06, "epoch": 0.905681936221045, "percentage": 90.57, "elapsed_time": "2 days, 20:50:40", "remaining_time": "7:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8720, "total_steps": 9627, "loss": 1.624, "learning_rate": 2.1742000959667885e-06, "epoch": 0.9057858107406254, "percentage": 90.58, "elapsed_time": "2 days, 20:51:08", "remaining_time": "7:09:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8721, "total_steps": 9627, "loss": 1.5616, "learning_rate": 2.169443427201584e-06, "epoch": 0.9058896852602056, "percentage": 90.59, "elapsed_time": "2 days, 20:51:39", "remaining_time": "7:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8722, "total_steps": 9627, "loss": 1.6354, "learning_rate": 2.164691852017553e-06, "epoch": 0.905993559779786, "percentage": 90.6, "elapsed_time": "2 days, 20:52:08", "remaining_time": "7:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8723, "total_steps": 9627, "loss": 1.7588, "learning_rate": 2.159945370920713e-06, "epoch": 0.9060974342993664, "percentage": 90.61, "elapsed_time": "2 days, 20:52:38", "remaining_time": "7:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8724, "total_steps": 9627, "loss": 1.6595, "learning_rate": 2.1552039844165316e-06, "epoch": 0.9062013088189467, "percentage": 90.62, "elapsed_time": "2 days, 20:53:07", "remaining_time": "7:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8725, "total_steps": 9627, "loss": 1.6695, "learning_rate": 2.1504676930099056e-06, "epoch": 0.906305183338527, "percentage": 90.63, "elapsed_time": "2 days, 20:53:37", "remaining_time": "7:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8726, "total_steps": 9627, "loss": 1.6587, "learning_rate": 2.145736497205242e-06, "epoch": 0.9064090578581074, "percentage": 90.64, "elapsed_time": "2 days, 20:54:06", "remaining_time": "7:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8727, "total_steps": 9627, "loss": 1.6881, "learning_rate": 2.14101039750636e-06, "epoch": 0.9065129323776877, "percentage": 90.65, "elapsed_time": "2 days, 20:54:37", "remaining_time": "7:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8728, "total_steps": 9627, "loss": 1.6157, "learning_rate": 2.1362893944165573e-06, "epoch": 0.9066168068972681, "percentage": 90.66, "elapsed_time": "2 days, 20:55:05", "remaining_time": "7:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8729, "total_steps": 9627, "loss": 1.6042, "learning_rate": 2.131573488438582e-06, "epoch": 0.9067206814168485, "percentage": 90.67, "elapsed_time": "2 days, 20:55:36", "remaining_time": "7:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8730, "total_steps": 9627, "loss": 1.738, "learning_rate": 2.1268626800746427e-06, "epoch": 0.9068245559364287, "percentage": 90.68, "elapsed_time": "2 days, 20:56:05", "remaining_time": "7:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8731, "total_steps": 9627, "loss": 1.662, "learning_rate": 2.1221569698264054e-06, "epoch": 0.9069284304560091, "percentage": 90.69, "elapsed_time": "2 days, 20:56:35", "remaining_time": "7:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8732, "total_steps": 9627, "loss": 1.6081, "learning_rate": 2.11745635819498e-06, "epoch": 0.9070323049755895, "percentage": 90.7, "elapsed_time": "2 days, 20:57:04", "remaining_time": "7:04:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8733, "total_steps": 9627, "loss": 1.6897, "learning_rate": 2.1127608456809667e-06, "epoch": 0.9071361794951698, "percentage": 90.71, "elapsed_time": "2 days, 20:57:35", "remaining_time": "7:03:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8734, "total_steps": 9627, "loss": 1.6987, "learning_rate": 2.108070432784376e-06, "epoch": 0.9072400540147502, "percentage": 90.72, "elapsed_time": "2 days, 20:58:05", "remaining_time": "7:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8735, "total_steps": 9627, "loss": 1.5307, "learning_rate": 2.1033851200047195e-06, "epoch": 0.9073439285343305, "percentage": 90.73, "elapsed_time": "2 days, 20:58:34", "remaining_time": "7:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8736, "total_steps": 9627, "loss": 1.5036, "learning_rate": 2.098704907840943e-06, "epoch": 0.9074478030539109, "percentage": 90.74, "elapsed_time": "2 days, 20:59:03", "remaining_time": "7:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8737, "total_steps": 9627, "loss": 1.691, "learning_rate": 2.094029796791441e-06, "epoch": 0.9075516775734912, "percentage": 90.76, "elapsed_time": "2 days, 20:59:33", "remaining_time": "7:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8738, "total_steps": 9627, "loss": 1.6238, "learning_rate": 2.0893597873540947e-06, "epoch": 0.9076555520930716, "percentage": 90.77, "elapsed_time": "2 days, 21:00:03", "remaining_time": "7:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8739, "total_steps": 9627, "loss": 1.765, "learning_rate": 2.0846948800262e-06, "epoch": 0.907759426612652, "percentage": 90.78, "elapsed_time": "2 days, 21:00:32", "remaining_time": "7:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8740, "total_steps": 9627, "loss": 1.785, "learning_rate": 2.080035075304565e-06, "epoch": 0.9078633011322322, "percentage": 90.79, "elapsed_time": "2 days, 21:01:02", "remaining_time": "7:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8741, "total_steps": 9627, "loss": 1.7357, "learning_rate": 2.0753803736853872e-06, "epoch": 0.9079671756518126, "percentage": 90.8, "elapsed_time": "2 days, 21:01:32", "remaining_time": "6:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8742, "total_steps": 9627, "loss": 1.5915, "learning_rate": 2.070730775664381e-06, "epoch": 0.908071050171393, "percentage": 90.81, "elapsed_time": "2 days, 21:02:01", "remaining_time": "6:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8743, "total_steps": 9627, "loss": 1.5252, "learning_rate": 2.0660862817366846e-06, "epoch": 0.9081749246909733, "percentage": 90.82, "elapsed_time": "2 days, 21:02:32", "remaining_time": "6:58:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8744, "total_steps": 9627, "loss": 1.6859, "learning_rate": 2.061446892396901e-06, "epoch": 0.9082787992105537, "percentage": 90.83, "elapsed_time": "2 days, 21:03:01", "remaining_time": "6:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8745, "total_steps": 9627, "loss": 1.635, "learning_rate": 2.0568126081390916e-06, "epoch": 0.908382673730134, "percentage": 90.84, "elapsed_time": "2 days, 21:03:30", "remaining_time": "6:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8746, "total_steps": 9627, "loss": 1.7292, "learning_rate": 2.052183429456761e-06, "epoch": 0.9084865482497143, "percentage": 90.85, "elapsed_time": "2 days, 21:03:59", "remaining_time": "6:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8747, "total_steps": 9627, "loss": 1.6206, "learning_rate": 2.047559356842893e-06, "epoch": 0.9085904227692947, "percentage": 90.86, "elapsed_time": "2 days, 21:04:28", "remaining_time": "6:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8748, "total_steps": 9627, "loss": 1.7271, "learning_rate": 2.042940390789899e-06, "epoch": 0.9086942972888751, "percentage": 90.87, "elapsed_time": "2 days, 21:04:59", "remaining_time": "6:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8749, "total_steps": 9627, "loss": 1.6506, "learning_rate": 2.0383265317896916e-06, "epoch": 0.9087981718084553, "percentage": 90.88, "elapsed_time": "2 days, 21:05:29", "remaining_time": "6:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8750, "total_steps": 9627, "loss": 1.6477, "learning_rate": 2.033717780333577e-06, "epoch": 0.9089020463280357, "percentage": 90.89, "elapsed_time": "2 days, 21:05:57", "remaining_time": "6:55:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8751, "total_steps": 9627, "loss": 1.6716, "learning_rate": 2.0291141369123746e-06, "epoch": 0.9090059208476161, "percentage": 90.9, "elapsed_time": "2 days, 21:06:26", "remaining_time": "6:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8752, "total_steps": 9627, "loss": 1.5676, "learning_rate": 2.0245156020163413e-06, "epoch": 0.9091097953671964, "percentage": 90.91, "elapsed_time": "2 days, 21:06:58", "remaining_time": "6:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8753, "total_steps": 9627, "loss": 1.7053, "learning_rate": 2.019922176135153e-06, "epoch": 0.9092136698867768, "percentage": 90.92, "elapsed_time": "2 days, 21:07:27", "remaining_time": "6:54:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8754, "total_steps": 9627, "loss": 1.7169, "learning_rate": 2.0153338597580006e-06, "epoch": 0.9093175444063571, "percentage": 90.93, "elapsed_time": "2 days, 21:07:56", "remaining_time": "6:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8755, "total_steps": 9627, "loss": 1.7221, "learning_rate": 2.0107506533735e-06, "epoch": 0.9094214189259374, "percentage": 90.94, "elapsed_time": "2 days, 21:08:26", "remaining_time": "6:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8756, "total_steps": 9627, "loss": 1.4159, "learning_rate": 2.0061725574697266e-06, "epoch": 0.9095252934455178, "percentage": 90.95, "elapsed_time": "2 days, 21:08:55", "remaining_time": "6:52:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8757, "total_steps": 9627, "loss": 1.5355, "learning_rate": 2.0015995725342073e-06, "epoch": 0.9096291679650982, "percentage": 90.96, "elapsed_time": "2 days, 21:09:26", "remaining_time": "6:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8758, "total_steps": 9627, "loss": 1.6739, "learning_rate": 1.9970316990539306e-06, "epoch": 0.9097330424846785, "percentage": 90.97, "elapsed_time": "2 days, 21:09:54", "remaining_time": "6:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8759, "total_steps": 9627, "loss": 1.6932, "learning_rate": 1.9924689375153406e-06, "epoch": 0.9098369170042588, "percentage": 90.98, "elapsed_time": "2 days, 21:10:25", "remaining_time": "6:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8760, "total_steps": 9627, "loss": 1.7716, "learning_rate": 1.9879112884043315e-06, "epoch": 0.9099407915238392, "percentage": 90.99, "elapsed_time": "2 days, 21:10:54", "remaining_time": "6:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8761, "total_steps": 9627, "loss": 1.7038, "learning_rate": 1.983358752206266e-06, "epoch": 0.9100446660434196, "percentage": 91.0, "elapsed_time": "2 days, 21:11:25", "remaining_time": "6:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8762, "total_steps": 9627, "loss": 1.5655, "learning_rate": 1.9788113294059498e-06, "epoch": 0.9101485405629999, "percentage": 91.01, "elapsed_time": "2 days, 21:11:54", "remaining_time": "6:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8763, "total_steps": 9627, "loss": 1.5848, "learning_rate": 1.974269020487646e-06, "epoch": 0.9102524150825803, "percentage": 91.03, "elapsed_time": "2 days, 21:12:24", "remaining_time": "6:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8764, "total_steps": 9627, "loss": 1.5146, "learning_rate": 1.969731825935073e-06, "epoch": 0.9103562896021606, "percentage": 91.04, "elapsed_time": "2 days, 21:12:54", "remaining_time": "6:48:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8765, "total_steps": 9627, "loss": 1.7126, "learning_rate": 1.9651997462314166e-06, "epoch": 0.9104601641217409, "percentage": 91.05, "elapsed_time": "2 days, 21:13:23", "remaining_time": "6:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8766, "total_steps": 9627, "loss": 1.8559, "learning_rate": 1.9606727818592963e-06, "epoch": 0.9105640386413213, "percentage": 91.06, "elapsed_time": "2 days, 21:13:53", "remaining_time": "6:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8767, "total_steps": 9627, "loss": 1.6292, "learning_rate": 1.9561509333008045e-06, "epoch": 0.9106679131609017, "percentage": 91.07, "elapsed_time": "2 days, 21:14:22", "remaining_time": "6:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8768, "total_steps": 9627, "loss": 1.7847, "learning_rate": 1.9516342010374888e-06, "epoch": 0.910771787680482, "percentage": 91.08, "elapsed_time": "2 days, 21:14:53", "remaining_time": "6:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8769, "total_steps": 9627, "loss": 1.6476, "learning_rate": 1.9471225855503262e-06, "epoch": 0.9108756622000623, "percentage": 91.09, "elapsed_time": "2 days, 21:15:22", "remaining_time": "6:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8770, "total_steps": 9627, "loss": 1.5905, "learning_rate": 1.9426160873197874e-06, "epoch": 0.9109795367196427, "percentage": 91.1, "elapsed_time": "2 days, 21:15:51", "remaining_time": "6:46:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8771, "total_steps": 9627, "loss": 1.7829, "learning_rate": 1.938114706825778e-06, "epoch": 0.911083411239223, "percentage": 91.11, "elapsed_time": "2 days, 21:16:22", "remaining_time": "6:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8772, "total_steps": 9627, "loss": 1.5937, "learning_rate": 1.9336184445476525e-06, "epoch": 0.9111872857588034, "percentage": 91.12, "elapsed_time": "2 days, 21:16:51", "remaining_time": "6:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8773, "total_steps": 9627, "loss": 1.7094, "learning_rate": 1.9291273009642287e-06, "epoch": 0.9112911602783837, "percentage": 91.13, "elapsed_time": "2 days, 21:17:21", "remaining_time": "6:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8774, "total_steps": 9627, "loss": 1.5736, "learning_rate": 1.924641276553779e-06, "epoch": 0.911395034797964, "percentage": 91.14, "elapsed_time": "2 days, 21:17:50", "remaining_time": "6:44:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8775, "total_steps": 9627, "loss": 1.3872, "learning_rate": 1.9201603717940385e-06, "epoch": 0.9114989093175444, "percentage": 91.15, "elapsed_time": "2 days, 21:18:21", "remaining_time": "6:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8776, "total_steps": 9627, "loss": 1.7079, "learning_rate": 1.9156845871621698e-06, "epoch": 0.9116027838371248, "percentage": 91.16, "elapsed_time": "2 days, 21:18:51", "remaining_time": "6:43:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8777, "total_steps": 9627, "loss": 1.564, "learning_rate": 1.91121392313483e-06, "epoch": 0.9117066583567051, "percentage": 91.17, "elapsed_time": "2 days, 21:19:20", "remaining_time": "6:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8778, "total_steps": 9627, "loss": 1.7931, "learning_rate": 1.9067483801881002e-06, "epoch": 0.9118105328762854, "percentage": 91.18, "elapsed_time": "2 days, 21:19:49", "remaining_time": "6:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8779, "total_steps": 9627, "loss": 1.6593, "learning_rate": 1.9022879587975162e-06, "epoch": 0.9119144073958658, "percentage": 91.19, "elapsed_time": "2 days, 21:20:20", "remaining_time": "6:41:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8780, "total_steps": 9627, "loss": 1.4404, "learning_rate": 1.8978326594381035e-06, "epoch": 0.9120182819154461, "percentage": 91.2, "elapsed_time": "2 days, 21:20:49", "remaining_time": "6:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8781, "total_steps": 9627, "loss": 1.5394, "learning_rate": 1.8933824825842828e-06, "epoch": 0.9121221564350265, "percentage": 91.21, "elapsed_time": "2 days, 21:21:18", "remaining_time": "6:40:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8782, "total_steps": 9627, "loss": 1.7135, "learning_rate": 1.8889374287099916e-06, "epoch": 0.9122260309546069, "percentage": 91.22, "elapsed_time": "2 days, 21:21:48", "remaining_time": "6:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8783, "total_steps": 9627, "loss": 1.4235, "learning_rate": 1.8844974982885843e-06, "epoch": 0.9123299054741871, "percentage": 91.23, "elapsed_time": "2 days, 21:22:19", "remaining_time": "6:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8784, "total_steps": 9627, "loss": 1.5576, "learning_rate": 1.8800626917928776e-06, "epoch": 0.9124337799937675, "percentage": 91.24, "elapsed_time": "2 days, 21:22:47", "remaining_time": "6:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8785, "total_steps": 9627, "loss": 1.6632, "learning_rate": 1.8756330096951435e-06, "epoch": 0.9125376545133479, "percentage": 91.25, "elapsed_time": "2 days, 21:23:17", "remaining_time": "6:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8786, "total_steps": 9627, "loss": 1.6348, "learning_rate": 1.8712084524671047e-06, "epoch": 0.9126415290329283, "percentage": 91.26, "elapsed_time": "2 days, 21:23:46", "remaining_time": "6:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8787, "total_steps": 9627, "loss": 1.5868, "learning_rate": 1.866789020579962e-06, "epoch": 0.9127454035525085, "percentage": 91.27, "elapsed_time": "2 days, 21:24:16", "remaining_time": "6:38:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8788, "total_steps": 9627, "loss": 1.6801, "learning_rate": 1.862374714504317e-06, "epoch": 0.9128492780720889, "percentage": 91.28, "elapsed_time": "2 days, 21:24:44", "remaining_time": "6:37:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8789, "total_steps": 9627, "loss": 1.5403, "learning_rate": 1.8579655347102875e-06, "epoch": 0.9129531525916693, "percentage": 91.3, "elapsed_time": "2 days, 21:25:13", "remaining_time": "6:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8790, "total_steps": 9627, "loss": 1.5541, "learning_rate": 1.853561481667404e-06, "epoch": 0.9130570271112496, "percentage": 91.31, "elapsed_time": "2 days, 21:25:43", "remaining_time": "6:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8791, "total_steps": 9627, "loss": 1.7474, "learning_rate": 1.8491625558446634e-06, "epoch": 0.91316090163083, "percentage": 91.32, "elapsed_time": "2 days, 21:26:13", "remaining_time": "6:36:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8792, "total_steps": 9627, "loss": 1.6448, "learning_rate": 1.8447687577105244e-06, "epoch": 0.9132647761504104, "percentage": 91.33, "elapsed_time": "2 days, 21:26:42", "remaining_time": "6:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8793, "total_steps": 9627, "loss": 1.6618, "learning_rate": 1.8403800877328847e-06, "epoch": 0.9133686506699906, "percentage": 91.34, "elapsed_time": "2 days, 21:27:12", "remaining_time": "6:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8794, "total_steps": 9627, "loss": 1.6608, "learning_rate": 1.835996546379104e-06, "epoch": 0.913472525189571, "percentage": 91.35, "elapsed_time": "2 days, 21:27:42", "remaining_time": "6:34:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8795, "total_steps": 9627, "loss": 1.7398, "learning_rate": 1.8316181341159977e-06, "epoch": 0.9135763997091514, "percentage": 91.36, "elapsed_time": "2 days, 21:28:10", "remaining_time": "6:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8796, "total_steps": 9627, "loss": 1.5286, "learning_rate": 1.8272448514098373e-06, "epoch": 0.9136802742287317, "percentage": 91.37, "elapsed_time": "2 days, 21:28:41", "remaining_time": "6:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8797, "total_steps": 9627, "loss": 1.613, "learning_rate": 1.8228766987263334e-06, "epoch": 0.913784148748312, "percentage": 91.38, "elapsed_time": "2 days, 21:29:09", "remaining_time": "6:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8798, "total_steps": 9627, "loss": 1.6326, "learning_rate": 1.8185136765306643e-06, "epoch": 0.9138880232678924, "percentage": 91.39, "elapsed_time": "2 days, 21:29:38", "remaining_time": "6:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8799, "total_steps": 9627, "loss": 1.4985, "learning_rate": 1.8141557852874634e-06, "epoch": 0.9139918977874727, "percentage": 91.4, "elapsed_time": "2 days, 21:30:08", "remaining_time": "6:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8800, "total_steps": 9627, "loss": 1.6341, "learning_rate": 1.8098030254608044e-06, "epoch": 0.9140957723070531, "percentage": 91.41, "elapsed_time": "2 days, 21:30:37", "remaining_time": "6:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8801, "total_steps": 9627, "loss": 1.8224, "learning_rate": 1.8054553975142273e-06, "epoch": 0.9141996468266335, "percentage": 91.42, "elapsed_time": "2 days, 21:31:07", "remaining_time": "6:31:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8802, "total_steps": 9627, "loss": 1.7055, "learning_rate": 1.8011129019107176e-06, "epoch": 0.9143035213462137, "percentage": 91.43, "elapsed_time": "2 days, 21:31:35", "remaining_time": "6:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8803, "total_steps": 9627, "loss": 1.828, "learning_rate": 1.7967755391127161e-06, "epoch": 0.9144073958657941, "percentage": 91.44, "elapsed_time": "2 days, 21:32:05", "remaining_time": "6:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8804, "total_steps": 9627, "loss": 1.6182, "learning_rate": 1.7924433095821203e-06, "epoch": 0.9145112703853745, "percentage": 91.45, "elapsed_time": "2 days, 21:32:33", "remaining_time": "6:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8805, "total_steps": 9627, "loss": 1.7746, "learning_rate": 1.788116213780283e-06, "epoch": 0.9146151449049548, "percentage": 91.46, "elapsed_time": "2 days, 21:33:04", "remaining_time": "6:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8806, "total_steps": 9627, "loss": 1.7353, "learning_rate": 1.783794252168003e-06, "epoch": 0.9147190194245352, "percentage": 91.47, "elapsed_time": "2 days, 21:33:32", "remaining_time": "6:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8807, "total_steps": 9627, "loss": 1.6535, "learning_rate": 1.7794774252055224e-06, "epoch": 0.9148228939441155, "percentage": 91.48, "elapsed_time": "2 days, 21:34:02", "remaining_time": "6:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8808, "total_steps": 9627, "loss": 1.6215, "learning_rate": 1.775165733352574e-06, "epoch": 0.9149267684636958, "percentage": 91.49, "elapsed_time": "2 days, 21:34:31", "remaining_time": "6:28:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8809, "total_steps": 9627, "loss": 1.6455, "learning_rate": 1.770859177068296e-06, "epoch": 0.9150306429832762, "percentage": 91.5, "elapsed_time": "2 days, 21:34:59", "remaining_time": "6:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8810, "total_steps": 9627, "loss": 1.6085, "learning_rate": 1.7665577568113212e-06, "epoch": 0.9151345175028566, "percentage": 91.51, "elapsed_time": "2 days, 21:35:28", "remaining_time": "6:27:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8811, "total_steps": 9627, "loss": 1.7182, "learning_rate": 1.7622614730397114e-06, "epoch": 0.9152383920224368, "percentage": 91.52, "elapsed_time": "2 days, 21:35:59", "remaining_time": "6:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8812, "total_steps": 9627, "loss": 1.5084, "learning_rate": 1.7579703262109837e-06, "epoch": 0.9153422665420172, "percentage": 91.53, "elapsed_time": "2 days, 21:36:26", "remaining_time": "6:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8813, "total_steps": 9627, "loss": 1.8689, "learning_rate": 1.7536843167821116e-06, "epoch": 0.9154461410615976, "percentage": 91.54, "elapsed_time": "2 days, 21:36:57", "remaining_time": "6:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8814, "total_steps": 9627, "loss": 1.5368, "learning_rate": 1.7494034452095242e-06, "epoch": 0.915550015581178, "percentage": 91.56, "elapsed_time": "2 days, 21:37:25", "remaining_time": "6:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8815, "total_steps": 9627, "loss": 1.806, "learning_rate": 1.7451277119491073e-06, "epoch": 0.9156538901007583, "percentage": 91.57, "elapsed_time": "2 days, 21:37:55", "remaining_time": "6:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8816, "total_steps": 9627, "loss": 1.6147, "learning_rate": 1.740857117456174e-06, "epoch": 0.9157577646203386, "percentage": 91.58, "elapsed_time": "2 days, 21:38:24", "remaining_time": "6:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8817, "total_steps": 9627, "loss": 1.5101, "learning_rate": 1.7365916621855327e-06, "epoch": 0.915861639139919, "percentage": 91.59, "elapsed_time": "2 days, 21:38:53", "remaining_time": "6:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8818, "total_steps": 9627, "loss": 1.6499, "learning_rate": 1.7323313465914093e-06, "epoch": 0.9159655136594993, "percentage": 91.6, "elapsed_time": "2 days, 21:39:22", "remaining_time": "6:23:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8819, "total_steps": 9627, "loss": 1.5388, "learning_rate": 1.7280761711274906e-06, "epoch": 0.9160693881790797, "percentage": 91.61, "elapsed_time": "2 days, 21:39:50", "remaining_time": "6:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8820, "total_steps": 9627, "loss": 1.5099, "learning_rate": 1.7238261362469254e-06, "epoch": 0.9161732626986601, "percentage": 91.62, "elapsed_time": "2 days, 21:40:19", "remaining_time": "6:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8821, "total_steps": 9627, "loss": 1.4882, "learning_rate": 1.7195812424023129e-06, "epoch": 0.9162771372182403, "percentage": 91.63, "elapsed_time": "2 days, 21:40:50", "remaining_time": "6:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8822, "total_steps": 9627, "loss": 1.6063, "learning_rate": 1.715341490045691e-06, "epoch": 0.9163810117378207, "percentage": 91.64, "elapsed_time": "2 days, 21:41:18", "remaining_time": "6:21:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8823, "total_steps": 9627, "loss": 1.7671, "learning_rate": 1.7111068796285657e-06, "epoch": 0.9164848862574011, "percentage": 91.65, "elapsed_time": "2 days, 21:41:48", "remaining_time": "6:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8824, "total_steps": 9627, "loss": 1.6152, "learning_rate": 1.7068774116018983e-06, "epoch": 0.9165887607769814, "percentage": 91.66, "elapsed_time": "2 days, 21:42:16", "remaining_time": "6:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8825, "total_steps": 9627, "loss": 1.5364, "learning_rate": 1.7026530864160728e-06, "epoch": 0.9166926352965618, "percentage": 91.67, "elapsed_time": "2 days, 21:42:46", "remaining_time": "6:20:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8826, "total_steps": 9627, "loss": 1.5236, "learning_rate": 1.698433904520963e-06, "epoch": 0.9167965098161421, "percentage": 91.68, "elapsed_time": "2 days, 21:43:15", "remaining_time": "6:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8827, "total_steps": 9627, "loss": 1.767, "learning_rate": 1.6942198663658815e-06, "epoch": 0.9169003843357224, "percentage": 91.69, "elapsed_time": "2 days, 21:43:43", "remaining_time": "6:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8828, "total_steps": 9627, "loss": 1.6415, "learning_rate": 1.6900109723995805e-06, "epoch": 0.9170042588553028, "percentage": 91.7, "elapsed_time": "2 days, 21:44:13", "remaining_time": "6:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8829, "total_steps": 9627, "loss": 1.6657, "learning_rate": 1.6858072230702792e-06, "epoch": 0.9171081333748832, "percentage": 91.71, "elapsed_time": "2 days, 21:44:41", "remaining_time": "6:18:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8830, "total_steps": 9627, "loss": 1.6511, "learning_rate": 1.6816086188256475e-06, "epoch": 0.9172120078944634, "percentage": 91.72, "elapsed_time": "2 days, 21:45:09", "remaining_time": "6:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8831, "total_steps": 9627, "loss": 1.5784, "learning_rate": 1.677415160112794e-06, "epoch": 0.9173158824140438, "percentage": 91.73, "elapsed_time": "2 days, 21:45:39", "remaining_time": "6:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8832, "total_steps": 9627, "loss": 1.6897, "learning_rate": 1.6732268473782953e-06, "epoch": 0.9174197569336242, "percentage": 91.74, "elapsed_time": "2 days, 21:46:08", "remaining_time": "6:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8833, "total_steps": 9627, "loss": 1.6477, "learning_rate": 1.6690436810681832e-06, "epoch": 0.9175236314532045, "percentage": 91.75, "elapsed_time": "2 days, 21:46:38", "remaining_time": "6:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8834, "total_steps": 9627, "loss": 1.6891, "learning_rate": 1.664865661627918e-06, "epoch": 0.9176275059727849, "percentage": 91.76, "elapsed_time": "2 days, 21:47:06", "remaining_time": "6:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8835, "total_steps": 9627, "loss": 1.5716, "learning_rate": 1.6606927895024217e-06, "epoch": 0.9177313804923652, "percentage": 91.77, "elapsed_time": "2 days, 21:47:35", "remaining_time": "6:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8836, "total_steps": 9627, "loss": 1.6978, "learning_rate": 1.6565250651360997e-06, "epoch": 0.9178352550119455, "percentage": 91.78, "elapsed_time": "2 days, 21:48:04", "remaining_time": "6:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8837, "total_steps": 9627, "loss": 1.7084, "learning_rate": 1.6523624889727474e-06, "epoch": 0.9179391295315259, "percentage": 91.79, "elapsed_time": "2 days, 21:48:33", "remaining_time": "6:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8838, "total_steps": 9627, "loss": 1.4483, "learning_rate": 1.6482050614556709e-06, "epoch": 0.9180430040511063, "percentage": 91.8, "elapsed_time": "2 days, 21:49:01", "remaining_time": "6:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8839, "total_steps": 9627, "loss": 1.7525, "learning_rate": 1.6440527830275997e-06, "epoch": 0.9181468785706867, "percentage": 91.81, "elapsed_time": "2 days, 21:49:31", "remaining_time": "6:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8840, "total_steps": 9627, "loss": 1.5032, "learning_rate": 1.6399056541307134e-06, "epoch": 0.9182507530902669, "percentage": 91.83, "elapsed_time": "2 days, 21:50:00", "remaining_time": "6:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8841, "total_steps": 9627, "loss": 1.6178, "learning_rate": 1.6357636752066529e-06, "epoch": 0.9183546276098473, "percentage": 91.84, "elapsed_time": "2 days, 21:50:29", "remaining_time": "6:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8842, "total_steps": 9627, "loss": 1.6032, "learning_rate": 1.6316268466965046e-06, "epoch": 0.9184585021294277, "percentage": 91.85, "elapsed_time": "2 days, 21:50:58", "remaining_time": "6:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8843, "total_steps": 9627, "loss": 1.7141, "learning_rate": 1.6274951690408158e-06, "epoch": 0.918562376649008, "percentage": 91.86, "elapsed_time": "2 days, 21:51:27", "remaining_time": "6:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8844, "total_steps": 9627, "loss": 1.6226, "learning_rate": 1.623368642679557e-06, "epoch": 0.9186662511685884, "percentage": 91.87, "elapsed_time": "2 days, 21:51:56", "remaining_time": "6:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8845, "total_steps": 9627, "loss": 1.9285, "learning_rate": 1.6192472680521987e-06, "epoch": 0.9187701256881687, "percentage": 91.88, "elapsed_time": "2 days, 21:52:24", "remaining_time": "6:10:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8846, "total_steps": 9627, "loss": 1.7397, "learning_rate": 1.6151310455976176e-06, "epoch": 0.918874000207749, "percentage": 91.89, "elapsed_time": "2 days, 21:52:54", "remaining_time": "6:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8847, "total_steps": 9627, "loss": 1.5453, "learning_rate": 1.6110199757541632e-06, "epoch": 0.9189778747273294, "percentage": 91.9, "elapsed_time": "2 days, 21:53:23", "remaining_time": "6:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8848, "total_steps": 9627, "loss": 1.6, "learning_rate": 1.6069140589596299e-06, "epoch": 0.9190817492469098, "percentage": 91.91, "elapsed_time": "2 days, 21:53:52", "remaining_time": "6:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8849, "total_steps": 9627, "loss": 1.6392, "learning_rate": 1.6028132956512732e-06, "epoch": 0.91918562376649, "percentage": 91.92, "elapsed_time": "2 days, 21:54:20", "remaining_time": "6:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8850, "total_steps": 9627, "loss": 1.6164, "learning_rate": 1.5987176862657882e-06, "epoch": 0.9192894982860704, "percentage": 91.93, "elapsed_time": "2 days, 21:54:49", "remaining_time": "6:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8851, "total_steps": 9627, "loss": 1.5529, "learning_rate": 1.5946272312393206e-06, "epoch": 0.9193933728056508, "percentage": 91.94, "elapsed_time": "2 days, 21:55:19", "remaining_time": "6:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8852, "total_steps": 9627, "loss": 1.7714, "learning_rate": 1.5905419310074831e-06, "epoch": 0.9194972473252311, "percentage": 91.95, "elapsed_time": "2 days, 21:55:47", "remaining_time": "6:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8853, "total_steps": 9627, "loss": 1.703, "learning_rate": 1.586461786005311e-06, "epoch": 0.9196011218448115, "percentage": 91.96, "elapsed_time": "2 days, 21:56:17", "remaining_time": "6:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8854, "total_steps": 9627, "loss": 1.6907, "learning_rate": 1.5823867966673288e-06, "epoch": 0.9197049963643918, "percentage": 91.97, "elapsed_time": "2 days, 21:56:45", "remaining_time": "6:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8855, "total_steps": 9627, "loss": 1.7441, "learning_rate": 1.5783169634274787e-06, "epoch": 0.9198088708839721, "percentage": 91.98, "elapsed_time": "2 days, 21:57:14", "remaining_time": "6:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8856, "total_steps": 9627, "loss": 1.5403, "learning_rate": 1.574252286719169e-06, "epoch": 0.9199127454035525, "percentage": 91.99, "elapsed_time": "2 days, 21:57:43", "remaining_time": "6:05:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8857, "total_steps": 9627, "loss": 1.4616, "learning_rate": 1.5701927669752537e-06, "epoch": 0.9200166199231329, "percentage": 92.0, "elapsed_time": "2 days, 21:58:13", "remaining_time": "6:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8858, "total_steps": 9627, "loss": 1.6938, "learning_rate": 1.566138404628037e-06, "epoch": 0.9201204944427132, "percentage": 92.01, "elapsed_time": "2 days, 21:58:41", "remaining_time": "6:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8859, "total_steps": 9627, "loss": 1.5245, "learning_rate": 1.5620892001092902e-06, "epoch": 0.9202243689622935, "percentage": 92.02, "elapsed_time": "2 days, 21:59:10", "remaining_time": "6:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8860, "total_steps": 9627, "loss": 1.6801, "learning_rate": 1.5580451538502016e-06, "epoch": 0.9203282434818739, "percentage": 92.03, "elapsed_time": "2 days, 21:59:39", "remaining_time": "6:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8861, "total_steps": 9627, "loss": 1.8436, "learning_rate": 1.5540062662814603e-06, "epoch": 0.9204321180014542, "percentage": 92.04, "elapsed_time": "2 days, 22:00:07", "remaining_time": "6:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8862, "total_steps": 9627, "loss": 1.6583, "learning_rate": 1.5499725378331441e-06, "epoch": 0.9205359925210346, "percentage": 92.05, "elapsed_time": "2 days, 22:00:37", "remaining_time": "6:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8863, "total_steps": 9627, "loss": 1.6852, "learning_rate": 1.5459439689348266e-06, "epoch": 0.920639867040615, "percentage": 92.06, "elapsed_time": "2 days, 22:01:06", "remaining_time": "6:02:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8864, "total_steps": 9627, "loss": 1.6821, "learning_rate": 1.5419205600155306e-06, "epoch": 0.9207437415601953, "percentage": 92.07, "elapsed_time": "2 days, 22:01:35", "remaining_time": "6:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8865, "total_steps": 9627, "loss": 1.8725, "learning_rate": 1.5379023115037027e-06, "epoch": 0.9208476160797756, "percentage": 92.08, "elapsed_time": "2 days, 22:02:04", "remaining_time": "6:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8866, "total_steps": 9627, "loss": 1.6768, "learning_rate": 1.5338892238272562e-06, "epoch": 0.920951490599356, "percentage": 92.1, "elapsed_time": "2 days, 22:02:32", "remaining_time": "6:00:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8867, "total_steps": 9627, "loss": 1.7364, "learning_rate": 1.5298812974135602e-06, "epoch": 0.9210553651189364, "percentage": 92.11, "elapsed_time": "2 days, 22:03:02", "remaining_time": "6:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8868, "total_steps": 9627, "loss": 1.7075, "learning_rate": 1.5258785326894286e-06, "epoch": 0.9211592396385166, "percentage": 92.12, "elapsed_time": "2 days, 22:03:31", "remaining_time": "5:59:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8869, "total_steps": 9627, "loss": 1.7723, "learning_rate": 1.5218809300811155e-06, "epoch": 0.921263114158097, "percentage": 92.13, "elapsed_time": "2 days, 22:03:58", "remaining_time": "5:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8870, "total_steps": 9627, "loss": 1.6459, "learning_rate": 1.5178884900143353e-06, "epoch": 0.9213669886776774, "percentage": 92.14, "elapsed_time": "2 days, 22:04:29", "remaining_time": "5:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8871, "total_steps": 9627, "loss": 1.5313, "learning_rate": 1.5139012129142704e-06, "epoch": 0.9214708631972577, "percentage": 92.15, "elapsed_time": "2 days, 22:04:57", "remaining_time": "5:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8872, "total_steps": 9627, "loss": 1.7129, "learning_rate": 1.5099190992055034e-06, "epoch": 0.9215747377168381, "percentage": 92.16, "elapsed_time": "2 days, 22:05:27", "remaining_time": "5:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8873, "total_steps": 9627, "loss": 1.4032, "learning_rate": 1.505942149312123e-06, "epoch": 0.9216786122364184, "percentage": 92.17, "elapsed_time": "2 days, 22:05:55", "remaining_time": "5:57:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8874, "total_steps": 9627, "loss": 1.6315, "learning_rate": 1.5019703636576344e-06, "epoch": 0.9217824867559987, "percentage": 92.18, "elapsed_time": "2 days, 22:06:25", "remaining_time": "5:56:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8875, "total_steps": 9627, "loss": 1.6485, "learning_rate": 1.498003742665005e-06, "epoch": 0.9218863612755791, "percentage": 92.19, "elapsed_time": "2 days, 22:06:54", "remaining_time": "5:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8876, "total_steps": 9627, "loss": 1.671, "learning_rate": 1.4940422867566472e-06, "epoch": 0.9219902357951595, "percentage": 92.2, "elapsed_time": "2 days, 22:07:22", "remaining_time": "5:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8877, "total_steps": 9627, "loss": 1.581, "learning_rate": 1.4900859963544233e-06, "epoch": 0.9220941103147398, "percentage": 92.21, "elapsed_time": "2 days, 22:07:52", "remaining_time": "5:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8878, "total_steps": 9627, "loss": 1.7884, "learning_rate": 1.486134871879652e-06, "epoch": 0.9221979848343201, "percentage": 92.22, "elapsed_time": "2 days, 22:08:20", "remaining_time": "5:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8879, "total_steps": 9627, "loss": 1.7156, "learning_rate": 1.4821889137530852e-06, "epoch": 0.9223018593539005, "percentage": 92.23, "elapsed_time": "2 days, 22:08:50", "remaining_time": "5:54:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8880, "total_steps": 9627, "loss": 1.8423, "learning_rate": 1.4782481223949596e-06, "epoch": 0.9224057338734808, "percentage": 92.24, "elapsed_time": "2 days, 22:09:19", "remaining_time": "5:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8881, "total_steps": 9627, "loss": 1.5655, "learning_rate": 1.4743124982249112e-06, "epoch": 0.9225096083930612, "percentage": 92.25, "elapsed_time": "2 days, 22:09:47", "remaining_time": "5:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8882, "total_steps": 9627, "loss": 1.6241, "learning_rate": 1.4703820416620718e-06, "epoch": 0.9226134829126416, "percentage": 92.26, "elapsed_time": "2 days, 22:10:17", "remaining_time": "5:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8883, "total_steps": 9627, "loss": 1.5582, "learning_rate": 1.4664567531250007e-06, "epoch": 0.9227173574322218, "percentage": 92.27, "elapsed_time": "2 days, 22:10:46", "remaining_time": "5:52:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8884, "total_steps": 9627, "loss": 1.6288, "learning_rate": 1.462536633031708e-06, "epoch": 0.9228212319518022, "percentage": 92.28, "elapsed_time": "2 days, 22:11:15", "remaining_time": "5:52:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8885, "total_steps": 9627, "loss": 1.6538, "learning_rate": 1.4586216817996602e-06, "epoch": 0.9229251064713826, "percentage": 92.29, "elapsed_time": "2 days, 22:11:43", "remaining_time": "5:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8886, "total_steps": 9627, "loss": 1.8293, "learning_rate": 1.454711899845762e-06, "epoch": 0.9230289809909629, "percentage": 92.3, "elapsed_time": "2 days, 22:12:13", "remaining_time": "5:51:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8887, "total_steps": 9627, "loss": 1.8293, "learning_rate": 1.450807287586381e-06, "epoch": 0.9231328555105432, "percentage": 92.31, "elapsed_time": "2 days, 22:12:42", "remaining_time": "5:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8888, "total_steps": 9627, "loss": 1.6358, "learning_rate": 1.4469078454373174e-06, "epoch": 0.9232367300301236, "percentage": 92.32, "elapsed_time": "2 days, 22:13:10", "remaining_time": "5:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8889, "total_steps": 9627, "loss": 1.824, "learning_rate": 1.4430135738138561e-06, "epoch": 0.9233406045497039, "percentage": 92.33, "elapsed_time": "2 days, 22:13:40", "remaining_time": "5:49:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8890, "total_steps": 9627, "loss": 1.6387, "learning_rate": 1.4391244731306763e-06, "epoch": 0.9234444790692843, "percentage": 92.34, "elapsed_time": "2 days, 22:14:08", "remaining_time": "5:49:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8891, "total_steps": 9627, "loss": 1.7798, "learning_rate": 1.4352405438019522e-06, "epoch": 0.9235483535888647, "percentage": 92.35, "elapsed_time": "2 days, 22:14:37", "remaining_time": "5:48:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8892, "total_steps": 9627, "loss": 1.8333, "learning_rate": 1.431361786241292e-06, "epoch": 0.923652228108445, "percentage": 92.37, "elapsed_time": "2 days, 22:15:07", "remaining_time": "5:48:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8893, "total_steps": 9627, "loss": 1.6033, "learning_rate": 1.427488200861754e-06, "epoch": 0.9237561026280253, "percentage": 92.38, "elapsed_time": "2 days, 22:15:35", "remaining_time": "5:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8894, "total_steps": 9627, "loss": 1.5394, "learning_rate": 1.4236197880758416e-06, "epoch": 0.9238599771476057, "percentage": 92.39, "elapsed_time": "2 days, 22:16:04", "remaining_time": "5:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8895, "total_steps": 9627, "loss": 1.8753, "learning_rate": 1.4197565482955144e-06, "epoch": 0.9239638516671861, "percentage": 92.4, "elapsed_time": "2 days, 22:16:34", "remaining_time": "5:46:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8896, "total_steps": 9627, "loss": 1.5401, "learning_rate": 1.4158984819321707e-06, "epoch": 0.9240677261867664, "percentage": 92.41, "elapsed_time": "2 days, 22:17:02", "remaining_time": "5:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8897, "total_steps": 9627, "loss": 1.755, "learning_rate": 1.4120455893966711e-06, "epoch": 0.9241716007063467, "percentage": 92.42, "elapsed_time": "2 days, 22:17:31", "remaining_time": "5:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8898, "total_steps": 9627, "loss": 1.7385, "learning_rate": 1.4081978710993092e-06, "epoch": 0.9242754752259271, "percentage": 92.43, "elapsed_time": "2 days, 22:18:00", "remaining_time": "5:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8899, "total_steps": 9627, "loss": 1.6438, "learning_rate": 1.404355327449852e-06, "epoch": 0.9243793497455074, "percentage": 92.44, "elapsed_time": "2 days, 22:18:28", "remaining_time": "5:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8900, "total_steps": 9627, "loss": 1.3095, "learning_rate": 1.4005179588574835e-06, "epoch": 0.9244832242650878, "percentage": 92.45, "elapsed_time": "2 days, 22:18:58", "remaining_time": "5:44:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8901, "total_steps": 9627, "loss": 1.6767, "learning_rate": 1.3966857657308652e-06, "epoch": 0.9245870987846682, "percentage": 92.46, "elapsed_time": "2 days, 22:19:27", "remaining_time": "5:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8902, "total_steps": 9627, "loss": 1.5915, "learning_rate": 1.392858748478093e-06, "epoch": 0.9246909733042484, "percentage": 92.47, "elapsed_time": "2 days, 22:19:55", "remaining_time": "5:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8903, "total_steps": 9627, "loss": 1.6812, "learning_rate": 1.3890369075067134e-06, "epoch": 0.9247948478238288, "percentage": 92.48, "elapsed_time": "2 days, 22:20:25", "remaining_time": "5:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8904, "total_steps": 9627, "loss": 1.6996, "learning_rate": 1.3852202432237227e-06, "epoch": 0.9248987223434092, "percentage": 92.49, "elapsed_time": "2 days, 22:20:54", "remaining_time": "5:42:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8905, "total_steps": 9627, "loss": 1.5893, "learning_rate": 1.3814087560355682e-06, "epoch": 0.9250025968629895, "percentage": 92.5, "elapsed_time": "2 days, 22:21:22", "remaining_time": "5:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8906, "total_steps": 9627, "loss": 1.7249, "learning_rate": 1.377602446348142e-06, "epoch": 0.9251064713825699, "percentage": 92.51, "elapsed_time": "2 days, 22:21:52", "remaining_time": "5:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8907, "total_steps": 9627, "loss": 1.5488, "learning_rate": 1.3738013145667804e-06, "epoch": 0.9252103459021502, "percentage": 92.52, "elapsed_time": "2 days, 22:22:21", "remaining_time": "5:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8908, "total_steps": 9627, "loss": 1.5541, "learning_rate": 1.3700053610962882e-06, "epoch": 0.9253142204217305, "percentage": 92.53, "elapsed_time": "2 days, 22:22:50", "remaining_time": "5:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8909, "total_steps": 9627, "loss": 1.7434, "learning_rate": 1.366214586340886e-06, "epoch": 0.9254180949413109, "percentage": 92.54, "elapsed_time": "2 days, 22:23:19", "remaining_time": "5:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8910, "total_steps": 9627, "loss": 1.7068, "learning_rate": 1.3624289907042787e-06, "epoch": 0.9255219694608913, "percentage": 92.55, "elapsed_time": "2 days, 22:23:47", "remaining_time": "5:39:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8911, "total_steps": 9627, "loss": 1.7564, "learning_rate": 1.3586485745895993e-06, "epoch": 0.9256258439804715, "percentage": 92.56, "elapsed_time": "2 days, 22:24:16", "remaining_time": "5:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8912, "total_steps": 9627, "loss": 1.6685, "learning_rate": 1.354873338399426e-06, "epoch": 0.9257297185000519, "percentage": 92.57, "elapsed_time": "2 days, 22:24:46", "remaining_time": "5:38:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8913, "total_steps": 9627, "loss": 1.4694, "learning_rate": 1.3511032825357982e-06, "epoch": 0.9258335930196323, "percentage": 92.58, "elapsed_time": "2 days, 22:25:15", "remaining_time": "5:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8914, "total_steps": 9627, "loss": 1.5793, "learning_rate": 1.3473384074001893e-06, "epoch": 0.9259374675392126, "percentage": 92.59, "elapsed_time": "2 days, 22:25:44", "remaining_time": "5:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8915, "total_steps": 9627, "loss": 1.8184, "learning_rate": 1.3435787133935397e-06, "epoch": 0.926041342058793, "percentage": 92.6, "elapsed_time": "2 days, 22:26:13", "remaining_time": "5:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8916, "total_steps": 9627, "loss": 1.795, "learning_rate": 1.3398242009162177e-06, "epoch": 0.9261452165783733, "percentage": 92.61, "elapsed_time": "2 days, 22:26:42", "remaining_time": "5:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8917, "total_steps": 9627, "loss": 1.6734, "learning_rate": 1.3360748703680537e-06, "epoch": 0.9262490910979537, "percentage": 92.62, "elapsed_time": "2 days, 22:27:11", "remaining_time": "5:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8918, "total_steps": 9627, "loss": 1.5626, "learning_rate": 1.3323307221483339e-06, "epoch": 0.926352965617534, "percentage": 92.64, "elapsed_time": "2 days, 22:27:40", "remaining_time": "5:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8919, "total_steps": 9627, "loss": 1.6638, "learning_rate": 1.328591756655756e-06, "epoch": 0.9264568401371144, "percentage": 92.65, "elapsed_time": "2 days, 22:28:10", "remaining_time": "5:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8920, "total_steps": 9627, "loss": 1.552, "learning_rate": 1.3248579742885126e-06, "epoch": 0.9265607146566948, "percentage": 92.66, "elapsed_time": "2 days, 22:28:39", "remaining_time": "5:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8921, "total_steps": 9627, "loss": 1.6251, "learning_rate": 1.3211293754442134e-06, "epoch": 0.926664589176275, "percentage": 92.67, "elapsed_time": "2 days, 22:29:08", "remaining_time": "5:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8922, "total_steps": 9627, "loss": 1.6939, "learning_rate": 1.317405960519924e-06, "epoch": 0.9267684636958554, "percentage": 92.68, "elapsed_time": "2 days, 22:29:38", "remaining_time": "5:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8923, "total_steps": 9627, "loss": 1.6519, "learning_rate": 1.3136877299121608e-06, "epoch": 0.9268723382154358, "percentage": 92.69, "elapsed_time": "2 days, 22:30:06", "remaining_time": "5:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8924, "total_steps": 9627, "loss": 1.5427, "learning_rate": 1.3099746840168903e-06, "epoch": 0.9269762127350161, "percentage": 92.7, "elapsed_time": "2 days, 22:30:34", "remaining_time": "5:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8925, "total_steps": 9627, "loss": 1.5207, "learning_rate": 1.3062668232295128e-06, "epoch": 0.9270800872545965, "percentage": 92.71, "elapsed_time": "2 days, 22:31:03", "remaining_time": "5:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8926, "total_steps": 9627, "loss": 1.8273, "learning_rate": 1.3025641479448958e-06, "epoch": 0.9271839617741768, "percentage": 92.72, "elapsed_time": "2 days, 22:31:32", "remaining_time": "5:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8927, "total_steps": 9627, "loss": 1.4928, "learning_rate": 1.2988666585573461e-06, "epoch": 0.9272878362937571, "percentage": 92.73, "elapsed_time": "2 days, 22:32:01", "remaining_time": "5:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8928, "total_steps": 9627, "loss": 1.6839, "learning_rate": 1.2951743554606044e-06, "epoch": 0.9273917108133375, "percentage": 92.74, "elapsed_time": "2 days, 22:32:31", "remaining_time": "5:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8929, "total_steps": 9627, "loss": 1.7069, "learning_rate": 1.2914872390478894e-06, "epoch": 0.9274955853329179, "percentage": 92.75, "elapsed_time": "2 days, 22:33:00", "remaining_time": "5:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8930, "total_steps": 9627, "loss": 1.6181, "learning_rate": 1.2878053097118425e-06, "epoch": 0.9275994598524981, "percentage": 92.76, "elapsed_time": "2 days, 22:33:29", "remaining_time": "5:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8931, "total_steps": 9627, "loss": 1.599, "learning_rate": 1.2841285678445614e-06, "epoch": 0.9277033343720785, "percentage": 92.77, "elapsed_time": "2 days, 22:33:58", "remaining_time": "5:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8932, "total_steps": 9627, "loss": 1.6496, "learning_rate": 1.2804570138375827e-06, "epoch": 0.9278072088916589, "percentage": 92.78, "elapsed_time": "2 days, 22:34:27", "remaining_time": "5:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8933, "total_steps": 9627, "loss": 1.7878, "learning_rate": 1.2767906480819104e-06, "epoch": 0.9279110834112392, "percentage": 92.79, "elapsed_time": "2 days, 22:34:57", "remaining_time": "5:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8934, "total_steps": 9627, "loss": 1.6478, "learning_rate": 1.273129470967982e-06, "epoch": 0.9280149579308196, "percentage": 92.8, "elapsed_time": "2 days, 22:35:25", "remaining_time": "5:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8935, "total_steps": 9627, "loss": 1.6999, "learning_rate": 1.2694734828856691e-06, "epoch": 0.9281188324503999, "percentage": 92.81, "elapsed_time": "2 days, 22:35:55", "remaining_time": "5:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8936, "total_steps": 9627, "loss": 1.5892, "learning_rate": 1.265822684224327e-06, "epoch": 0.9282227069699802, "percentage": 92.82, "elapsed_time": "2 days, 22:36:25", "remaining_time": "5:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8937, "total_steps": 9627, "loss": 1.661, "learning_rate": 1.2621770753727224e-06, "epoch": 0.9283265814895606, "percentage": 92.83, "elapsed_time": "2 days, 22:36:53", "remaining_time": "5:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8938, "total_steps": 9627, "loss": 1.7309, "learning_rate": 1.2585366567190949e-06, "epoch": 0.928430456009141, "percentage": 92.84, "elapsed_time": "2 days, 22:37:23", "remaining_time": "5:26:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8939, "total_steps": 9627, "loss": 1.5562, "learning_rate": 1.2549014286511118e-06, "epoch": 0.9285343305287213, "percentage": 92.85, "elapsed_time": "2 days, 22:37:52", "remaining_time": "5:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8940, "total_steps": 9627, "loss": 1.5712, "learning_rate": 1.2512713915559027e-06, "epoch": 0.9286382050483016, "percentage": 92.86, "elapsed_time": "2 days, 22:38:20", "remaining_time": "5:25:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8941, "total_steps": 9627, "loss": 1.6381, "learning_rate": 1.247646545820036e-06, "epoch": 0.928742079567882, "percentage": 92.87, "elapsed_time": "2 days, 22:38:49", "remaining_time": "5:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8942, "total_steps": 9627, "loss": 1.71, "learning_rate": 1.2440268918295194e-06, "epoch": 0.9288459540874624, "percentage": 92.88, "elapsed_time": "2 days, 22:39:19", "remaining_time": "5:24:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8943, "total_steps": 9627, "loss": 1.7413, "learning_rate": 1.240412429969845e-06, "epoch": 0.9289498286070427, "percentage": 92.89, "elapsed_time": "2 days, 22:39:48", "remaining_time": "5:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8944, "total_steps": 9627, "loss": 1.8444, "learning_rate": 1.2368031606258934e-06, "epoch": 0.929053703126623, "percentage": 92.91, "elapsed_time": "2 days, 22:40:18", "remaining_time": "5:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8945, "total_steps": 9627, "loss": 1.8187, "learning_rate": 1.2331990841820407e-06, "epoch": 0.9291575776462034, "percentage": 92.92, "elapsed_time": "2 days, 22:40:46", "remaining_time": "5:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8946, "total_steps": 9627, "loss": 1.6616, "learning_rate": 1.2296002010220964e-06, "epoch": 0.9292614521657837, "percentage": 92.93, "elapsed_time": "2 days, 22:41:16", "remaining_time": "5:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8947, "total_steps": 9627, "loss": 1.6949, "learning_rate": 1.2260065115292984e-06, "epoch": 0.9293653266853641, "percentage": 92.94, "elapsed_time": "2 days, 22:41:44", "remaining_time": "5:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8948, "total_steps": 9627, "loss": 1.535, "learning_rate": 1.2224180160863574e-06, "epoch": 0.9294692012049445, "percentage": 92.95, "elapsed_time": "2 days, 22:42:14", "remaining_time": "5:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8949, "total_steps": 9627, "loss": 1.7167, "learning_rate": 1.2188347150754231e-06, "epoch": 0.9295730757245247, "percentage": 92.96, "elapsed_time": "2 days, 22:42:42", "remaining_time": "5:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8950, "total_steps": 9627, "loss": 1.5799, "learning_rate": 1.2152566088780792e-06, "epoch": 0.9296769502441051, "percentage": 92.97, "elapsed_time": "2 days, 22:43:13", "remaining_time": "5:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8951, "total_steps": 9627, "loss": 1.603, "learning_rate": 1.2116836978753709e-06, "epoch": 0.9297808247636855, "percentage": 92.98, "elapsed_time": "2 days, 22:43:41", "remaining_time": "5:20:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8952, "total_steps": 9627, "loss": 1.5984, "learning_rate": 1.2081159824477883e-06, "epoch": 0.9298846992832658, "percentage": 92.99, "elapsed_time": "2 days, 22:44:10", "remaining_time": "5:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8953, "total_steps": 9627, "loss": 1.6496, "learning_rate": 1.2045534629752609e-06, "epoch": 0.9299885738028462, "percentage": 93.0, "elapsed_time": "2 days, 22:44:39", "remaining_time": "5:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8954, "total_steps": 9627, "loss": 1.4944, "learning_rate": 1.2009961398371628e-06, "epoch": 0.9300924483224265, "percentage": 93.01, "elapsed_time": "2 days, 22:45:08", "remaining_time": "5:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8955, "total_steps": 9627, "loss": 1.5212, "learning_rate": 1.197444013412341e-06, "epoch": 0.9301963228420068, "percentage": 93.02, "elapsed_time": "2 days, 22:45:37", "remaining_time": "5:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8956, "total_steps": 9627, "loss": 1.6037, "learning_rate": 1.1938970840790486e-06, "epoch": 0.9303001973615872, "percentage": 93.03, "elapsed_time": "2 days, 22:46:05", "remaining_time": "5:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8957, "total_steps": 9627, "loss": 1.7366, "learning_rate": 1.1903553522150169e-06, "epoch": 0.9304040718811676, "percentage": 93.04, "elapsed_time": "2 days, 22:46:36", "remaining_time": "5:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8958, "total_steps": 9627, "loss": 1.5468, "learning_rate": 1.186818818197416e-06, "epoch": 0.9305079464007479, "percentage": 93.05, "elapsed_time": "2 days, 22:47:04", "remaining_time": "5:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8959, "total_steps": 9627, "loss": 1.5958, "learning_rate": 1.1832874824028451e-06, "epoch": 0.9306118209203282, "percentage": 93.06, "elapsed_time": "2 days, 22:47:34", "remaining_time": "5:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8960, "total_steps": 9627, "loss": 1.5762, "learning_rate": 1.1797613452073808e-06, "epoch": 0.9307156954399086, "percentage": 93.07, "elapsed_time": "2 days, 22:48:03", "remaining_time": "5:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8961, "total_steps": 9627, "loss": 1.6074, "learning_rate": 1.1762404069865174e-06, "epoch": 0.9308195699594889, "percentage": 93.08, "elapsed_time": "2 days, 22:48:33", "remaining_time": "5:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8962, "total_steps": 9627, "loss": 1.7324, "learning_rate": 1.1727246681152049e-06, "epoch": 0.9309234444790693, "percentage": 93.09, "elapsed_time": "2 days, 22:49:02", "remaining_time": "5:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8963, "total_steps": 9627, "loss": 1.6437, "learning_rate": 1.1692141289678492e-06, "epoch": 0.9310273189986497, "percentage": 93.1, "elapsed_time": "2 days, 22:49:31", "remaining_time": "5:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8964, "total_steps": 9627, "loss": 1.5817, "learning_rate": 1.1657087899183016e-06, "epoch": 0.9311311935182299, "percentage": 93.11, "elapsed_time": "2 days, 22:50:00", "remaining_time": "5:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8965, "total_steps": 9627, "loss": 1.7894, "learning_rate": 1.162208651339841e-06, "epoch": 0.9312350680378103, "percentage": 93.12, "elapsed_time": "2 days, 22:50:29", "remaining_time": "5:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8966, "total_steps": 9627, "loss": 1.5805, "learning_rate": 1.1587137136052083e-06, "epoch": 0.9313389425573907, "percentage": 93.13, "elapsed_time": "2 days, 22:50:59", "remaining_time": "5:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8967, "total_steps": 9627, "loss": 1.6191, "learning_rate": 1.1552239770865892e-06, "epoch": 0.931442817076971, "percentage": 93.14, "elapsed_time": "2 days, 22:51:27", "remaining_time": "5:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8968, "total_steps": 9627, "loss": 1.7234, "learning_rate": 1.1517394421556138e-06, "epoch": 0.9315466915965513, "percentage": 93.15, "elapsed_time": "2 days, 22:51:57", "remaining_time": "5:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8969, "total_steps": 9627, "loss": 1.6766, "learning_rate": 1.1482601091833578e-06, "epoch": 0.9316505661161317, "percentage": 93.17, "elapsed_time": "2 days, 22:52:25", "remaining_time": "5:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8970, "total_steps": 9627, "loss": 1.7669, "learning_rate": 1.1447859785403359e-06, "epoch": 0.9317544406357121, "percentage": 93.18, "elapsed_time": "2 days, 22:52:56", "remaining_time": "5:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8971, "total_steps": 9627, "loss": 1.7189, "learning_rate": 1.1413170505965354e-06, "epoch": 0.9318583151552924, "percentage": 93.19, "elapsed_time": "2 days, 22:53:24", "remaining_time": "5:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8972, "total_steps": 9627, "loss": 1.8092, "learning_rate": 1.1378533257213387e-06, "epoch": 0.9319621896748728, "percentage": 93.2, "elapsed_time": "2 days, 22:53:54", "remaining_time": "5:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8973, "total_steps": 9627, "loss": 1.8075, "learning_rate": 1.134394804283634e-06, "epoch": 0.9320660641944531, "percentage": 93.21, "elapsed_time": "2 days, 22:54:23", "remaining_time": "5:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8974, "total_steps": 9627, "loss": 1.7678, "learning_rate": 1.1309414866517209e-06, "epoch": 0.9321699387140334, "percentage": 93.22, "elapsed_time": "2 days, 22:54:52", "remaining_time": "5:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8975, "total_steps": 9627, "loss": 1.6321, "learning_rate": 1.127493373193339e-06, "epoch": 0.9322738132336138, "percentage": 93.23, "elapsed_time": "2 days, 22:55:22", "remaining_time": "5:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8976, "total_steps": 9627, "loss": 1.7411, "learning_rate": 1.1240504642756945e-06, "epoch": 0.9323776877531942, "percentage": 93.24, "elapsed_time": "2 days, 22:55:51", "remaining_time": "5:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8977, "total_steps": 9627, "loss": 1.9319, "learning_rate": 1.1206127602654271e-06, "epoch": 0.9324815622727745, "percentage": 93.25, "elapsed_time": "2 days, 22:56:21", "remaining_time": "5:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8978, "total_steps": 9627, "loss": 1.6936, "learning_rate": 1.1171802615286275e-06, "epoch": 0.9325854367923548, "percentage": 93.26, "elapsed_time": "2 days, 22:56:50", "remaining_time": "5:07:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8979, "total_steps": 9627, "loss": 1.7217, "learning_rate": 1.1137529684308311e-06, "epoch": 0.9326893113119352, "percentage": 93.27, "elapsed_time": "2 days, 22:57:18", "remaining_time": "5:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8980, "total_steps": 9627, "loss": 1.6731, "learning_rate": 1.110330881337013e-06, "epoch": 0.9327931858315155, "percentage": 93.28, "elapsed_time": "2 days, 22:57:47", "remaining_time": "5:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8981, "total_steps": 9627, "loss": 1.5772, "learning_rate": 1.106914000611603e-06, "epoch": 0.9328970603510959, "percentage": 93.29, "elapsed_time": "2 days, 22:58:17", "remaining_time": "5:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8982, "total_steps": 9627, "loss": 1.6541, "learning_rate": 1.1035023266184663e-06, "epoch": 0.9330009348706763, "percentage": 93.3, "elapsed_time": "2 days, 22:58:47", "remaining_time": "5:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8983, "total_steps": 9627, "loss": 1.6717, "learning_rate": 1.1000958597209343e-06, "epoch": 0.9331048093902565, "percentage": 93.31, "elapsed_time": "2 days, 22:59:15", "remaining_time": "5:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8984, "total_steps": 9627, "loss": 1.8383, "learning_rate": 1.0966946002817557e-06, "epoch": 0.9332086839098369, "percentage": 93.32, "elapsed_time": "2 days, 22:59:46", "remaining_time": "5:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8985, "total_steps": 9627, "loss": 1.6386, "learning_rate": 1.0932985486631408e-06, "epoch": 0.9333125584294173, "percentage": 93.33, "elapsed_time": "2 days, 23:00:14", "remaining_time": "5:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8986, "total_steps": 9627, "loss": 1.6147, "learning_rate": 1.0899077052267393e-06, "epoch": 0.9334164329489976, "percentage": 93.34, "elapsed_time": "2 days, 23:00:44", "remaining_time": "5:03:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8987, "total_steps": 9627, "loss": 1.6074, "learning_rate": 1.086522070333662e-06, "epoch": 0.933520307468578, "percentage": 93.35, "elapsed_time": "2 days, 23:01:13", "remaining_time": "5:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8988, "total_steps": 9627, "loss": 1.7838, "learning_rate": 1.0831416443444376e-06, "epoch": 0.9336241819881583, "percentage": 93.36, "elapsed_time": "2 days, 23:01:42", "remaining_time": "5:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8989, "total_steps": 9627, "loss": 1.5811, "learning_rate": 1.0797664276190666e-06, "epoch": 0.9337280565077386, "percentage": 93.37, "elapsed_time": "2 days, 23:02:11", "remaining_time": "5:02:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8990, "total_steps": 9627, "loss": 1.7476, "learning_rate": 1.0763964205169786e-06, "epoch": 0.933831931027319, "percentage": 93.38, "elapsed_time": "2 days, 23:02:40", "remaining_time": "5:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8991, "total_steps": 9627, "loss": 1.7751, "learning_rate": 1.0730316233970473e-06, "epoch": 0.9339358055468994, "percentage": 93.39, "elapsed_time": "2 days, 23:03:10", "remaining_time": "5:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8992, "total_steps": 9627, "loss": 1.5934, "learning_rate": 1.0696720366176138e-06, "epoch": 0.9340396800664796, "percentage": 93.4, "elapsed_time": "2 days, 23:03:39", "remaining_time": "5:01:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8993, "total_steps": 9627, "loss": 1.7941, "learning_rate": 1.0663176605364255e-06, "epoch": 0.93414355458606, "percentage": 93.41, "elapsed_time": "2 days, 23:04:08", "remaining_time": "5:00:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8994, "total_steps": 9627, "loss": 1.4659, "learning_rate": 1.0629684955107132e-06, "epoch": 0.9342474291056404, "percentage": 93.42, "elapsed_time": "2 days, 23:04:39", "remaining_time": "5:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8995, "total_steps": 9627, "loss": 1.5177, "learning_rate": 1.0596245418971307e-06, "epoch": 0.9343513036252208, "percentage": 93.44, "elapsed_time": "2 days, 23:05:07", "remaining_time": "4:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8996, "total_steps": 9627, "loss": 1.774, "learning_rate": 1.0562858000517928e-06, "epoch": 0.9344551781448011, "percentage": 93.45, "elapsed_time": "2 days, 23:05:37", "remaining_time": "4:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8997, "total_steps": 9627, "loss": 1.578, "learning_rate": 1.0529522703302319e-06, "epoch": 0.9345590526643814, "percentage": 93.46, "elapsed_time": "2 days, 23:06:06", "remaining_time": "4:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8998, "total_steps": 9627, "loss": 1.6469, "learning_rate": 1.049623953087453e-06, "epoch": 0.9346629271839618, "percentage": 93.47, "elapsed_time": "2 days, 23:06:34", "remaining_time": "4:58:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8999, "total_steps": 9627, "loss": 1.5999, "learning_rate": 1.0463008486779058e-06, "epoch": 0.9347668017035421, "percentage": 93.48, "elapsed_time": "2 days, 23:07:03", "remaining_time": "4:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9000, "total_steps": 9627, "loss": 1.5968, "learning_rate": 1.0429829574554574e-06, "epoch": 0.9348706762231225, "percentage": 93.49, "elapsed_time": "2 days, 23:07:32", "remaining_time": "4:57:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9001, "total_steps": 9627, "loss": 1.5762, "learning_rate": 1.0396702797734415e-06, "epoch": 0.9349745507427029, "percentage": 93.5, "elapsed_time": "2 days, 23:08:02", "remaining_time": "4:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9002, "total_steps": 9627, "loss": 1.4743, "learning_rate": 1.0363628159846483e-06, "epoch": 0.9350784252622831, "percentage": 93.51, "elapsed_time": "2 days, 23:08:32", "remaining_time": "4:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9003, "total_steps": 9627, "loss": 1.6244, "learning_rate": 1.0330605664412684e-06, "epoch": 0.9351822997818635, "percentage": 93.52, "elapsed_time": "2 days, 23:09:01", "remaining_time": "4:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9004, "total_steps": 9627, "loss": 1.8127, "learning_rate": 1.0297635314949872e-06, "epoch": 0.9352861743014439, "percentage": 93.53, "elapsed_time": "2 days, 23:09:31", "remaining_time": "4:55:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9005, "total_steps": 9627, "loss": 1.5446, "learning_rate": 1.0264717114969125e-06, "epoch": 0.9353900488210242, "percentage": 93.54, "elapsed_time": "2 days, 23:10:00", "remaining_time": "4:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9006, "total_steps": 9627, "loss": 1.7789, "learning_rate": 1.023185106797586e-06, "epoch": 0.9354939233406045, "percentage": 93.55, "elapsed_time": "2 days, 23:10:29", "remaining_time": "4:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9007, "total_steps": 9627, "loss": 1.7449, "learning_rate": 1.0199037177470172e-06, "epoch": 0.9355977978601849, "percentage": 93.56, "elapsed_time": "2 days, 23:10:59", "remaining_time": "4:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9008, "total_steps": 9627, "loss": 1.7044, "learning_rate": 1.0166275446946372e-06, "epoch": 0.9357016723797652, "percentage": 93.57, "elapsed_time": "2 days, 23:11:28", "remaining_time": "4:53:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9009, "total_steps": 9627, "loss": 1.7159, "learning_rate": 1.0133565879893447e-06, "epoch": 0.9358055468993456, "percentage": 93.58, "elapsed_time": "2 days, 23:11:57", "remaining_time": "4:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9010, "total_steps": 9627, "loss": 1.5209, "learning_rate": 1.0100908479794558e-06, "epoch": 0.935909421418926, "percentage": 93.59, "elapsed_time": "2 days, 23:12:26", "remaining_time": "4:52:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9011, "total_steps": 9627, "loss": 1.7395, "learning_rate": 1.0068303250127697e-06, "epoch": 0.9360132959385062, "percentage": 93.6, "elapsed_time": "2 days, 23:12:56", "remaining_time": "4:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9012, "total_steps": 9627, "loss": 1.6103, "learning_rate": 1.0035750194364758e-06, "epoch": 0.9361171704580866, "percentage": 93.61, "elapsed_time": "2 days, 23:13:25", "remaining_time": "4:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9013, "total_steps": 9627, "loss": 1.7848, "learning_rate": 1.0003249315972684e-06, "epoch": 0.936221044977667, "percentage": 93.62, "elapsed_time": "2 days, 23:13:55", "remaining_time": "4:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9014, "total_steps": 9627, "loss": 1.7764, "learning_rate": 9.97080061841238e-07, "epoch": 0.9363249194972473, "percentage": 93.63, "elapsed_time": "2 days, 23:14:25", "remaining_time": "4:50:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9015, "total_steps": 9627, "loss": 1.6056, "learning_rate": 9.938404105139465e-07, "epoch": 0.9364287940168277, "percentage": 93.64, "elapsed_time": "2 days, 23:14:54", "remaining_time": "4:50:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9016, "total_steps": 9627, "loss": 1.5732, "learning_rate": 9.906059779603849e-07, "epoch": 0.936532668536408, "percentage": 93.65, "elapsed_time": "2 days, 23:15:22", "remaining_time": "4:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9017, "total_steps": 9627, "loss": 1.8166, "learning_rate": 9.873767645250055e-07, "epoch": 0.9366365430559883, "percentage": 93.66, "elapsed_time": "2 days, 23:15:52", "remaining_time": "4:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9018, "total_steps": 9627, "loss": 1.6245, "learning_rate": 9.84152770551683e-07, "epoch": 0.9367404175755687, "percentage": 93.67, "elapsed_time": "2 days, 23:16:21", "remaining_time": "4:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9019, "total_steps": 9627, "loss": 1.6387, "learning_rate": 9.809339963837426e-07, "epoch": 0.9368442920951491, "percentage": 93.68, "elapsed_time": "2 days, 23:16:51", "remaining_time": "4:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9020, "total_steps": 9627, "loss": 1.3704, "learning_rate": 9.77720442363983e-07, "epoch": 0.9369481666147295, "percentage": 93.69, "elapsed_time": "2 days, 23:17:21", "remaining_time": "4:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9021, "total_steps": 9627, "loss": 1.7435, "learning_rate": 9.745121088346021e-07, "epoch": 0.9370520411343097, "percentage": 93.71, "elapsed_time": "2 days, 23:17:50", "remaining_time": "4:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9022, "total_steps": 9627, "loss": 1.8335, "learning_rate": 9.713089961372657e-07, "epoch": 0.9371559156538901, "percentage": 93.72, "elapsed_time": "2 days, 23:18:19", "remaining_time": "4:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9023, "total_steps": 9627, "loss": 1.6002, "learning_rate": 9.681111046130843e-07, "epoch": 0.9372597901734705, "percentage": 93.73, "elapsed_time": "2 days, 23:18:49", "remaining_time": "4:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9024, "total_steps": 9627, "loss": 1.7331, "learning_rate": 9.64918434602613e-07, "epoch": 0.9373636646930508, "percentage": 93.74, "elapsed_time": "2 days, 23:19:19", "remaining_time": "4:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9025, "total_steps": 9627, "loss": 1.7173, "learning_rate": 9.617309864458358e-07, "epoch": 0.9374675392126312, "percentage": 93.75, "elapsed_time": "2 days, 23:19:48", "remaining_time": "4:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9026, "total_steps": 9627, "loss": 1.5642, "learning_rate": 9.585487604821863e-07, "epoch": 0.9375714137322115, "percentage": 93.76, "elapsed_time": "2 days, 23:20:16", "remaining_time": "4:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9027, "total_steps": 9627, "loss": 1.6186, "learning_rate": 9.553717570505716e-07, "epoch": 0.9376752882517918, "percentage": 93.77, "elapsed_time": "2 days, 23:20:45", "remaining_time": "4:44:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9028, "total_steps": 9627, "loss": 1.5881, "learning_rate": 9.521999764892875e-07, "epoch": 0.9377791627713722, "percentage": 93.78, "elapsed_time": "2 days, 23:21:15", "remaining_time": "4:44:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9029, "total_steps": 9627, "loss": 1.5853, "learning_rate": 9.49033419136125e-07, "epoch": 0.9378830372909526, "percentage": 93.79, "elapsed_time": "2 days, 23:21:45", "remaining_time": "4:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9030, "total_steps": 9627, "loss": 1.5876, "learning_rate": 9.458720853282977e-07, "epoch": 0.9379869118105328, "percentage": 93.8, "elapsed_time": "2 days, 23:22:14", "remaining_time": "4:43:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9031, "total_steps": 9627, "loss": 1.694, "learning_rate": 9.427159754024473e-07, "epoch": 0.9380907863301132, "percentage": 93.81, "elapsed_time": "2 days, 23:22:43", "remaining_time": "4:42:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9032, "total_steps": 9627, "loss": 1.686, "learning_rate": 9.395650896946884e-07, "epoch": 0.9381946608496936, "percentage": 93.82, "elapsed_time": "2 days, 23:23:13", "remaining_time": "4:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9033, "total_steps": 9627, "loss": 1.6361, "learning_rate": 9.364194285405581e-07, "epoch": 0.9382985353692739, "percentage": 93.83, "elapsed_time": "2 days, 23:23:42", "remaining_time": "4:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9034, "total_steps": 9627, "loss": 1.5855, "learning_rate": 9.332789922750495e-07, "epoch": 0.9384024098888543, "percentage": 93.84, "elapsed_time": "2 days, 23:24:11", "remaining_time": "4:41:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9035, "total_steps": 9627, "loss": 1.6175, "learning_rate": 9.301437812325952e-07, "epoch": 0.9385062844084346, "percentage": 93.85, "elapsed_time": "2 days, 23:24:41", "remaining_time": "4:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9036, "total_steps": 9627, "loss": 1.6779, "learning_rate": 9.27013795747067e-07, "epoch": 0.9386101589280149, "percentage": 93.86, "elapsed_time": "2 days, 23:25:11", "remaining_time": "4:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9037, "total_steps": 9627, "loss": 1.7196, "learning_rate": 9.238890361517815e-07, "epoch": 0.9387140334475953, "percentage": 93.87, "elapsed_time": "2 days, 23:25:40", "remaining_time": "4:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9038, "total_steps": 9627, "loss": 1.5481, "learning_rate": 9.20769502779506e-07, "epoch": 0.9388179079671757, "percentage": 93.88, "elapsed_time": "2 days, 23:26:10", "remaining_time": "4:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9039, "total_steps": 9627, "loss": 1.5561, "learning_rate": 9.176551959624524e-07, "epoch": 0.938921782486756, "percentage": 93.89, "elapsed_time": "2 days, 23:26:40", "remaining_time": "4:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9040, "total_steps": 9627, "loss": 1.6116, "learning_rate": 9.145461160322555e-07, "epoch": 0.9390256570063363, "percentage": 93.9, "elapsed_time": "2 days, 23:27:08", "remaining_time": "4:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9041, "total_steps": 9627, "loss": 1.5454, "learning_rate": 9.114422633200226e-07, "epoch": 0.9391295315259167, "percentage": 93.91, "elapsed_time": "2 days, 23:27:38", "remaining_time": "4:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9042, "total_steps": 9627, "loss": 1.6116, "learning_rate": 9.083436381562838e-07, "epoch": 0.939233406045497, "percentage": 93.92, "elapsed_time": "2 days, 23:28:08", "remaining_time": "4:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9043, "total_steps": 9627, "loss": 1.7028, "learning_rate": 9.05250240871014e-07, "epoch": 0.9393372805650774, "percentage": 93.93, "elapsed_time": "2 days, 23:28:37", "remaining_time": "4:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9044, "total_steps": 9627, "loss": 1.7121, "learning_rate": 9.021620717936385e-07, "epoch": 0.9394411550846578, "percentage": 93.94, "elapsed_time": "2 days, 23:29:08", "remaining_time": "4:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9045, "total_steps": 9627, "loss": 1.6753, "learning_rate": 8.990791312530222e-07, "epoch": 0.9395450296042381, "percentage": 93.95, "elapsed_time": "2 days, 23:29:36", "remaining_time": "4:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9046, "total_steps": 9627, "loss": 1.7523, "learning_rate": 8.960014195774857e-07, "epoch": 0.9396489041238184, "percentage": 93.96, "elapsed_time": "2 days, 23:30:06", "remaining_time": "4:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9047, "total_steps": 9627, "loss": 1.5365, "learning_rate": 8.929289370947669e-07, "epoch": 0.9397527786433988, "percentage": 93.98, "elapsed_time": "2 days, 23:30:35", "remaining_time": "4:35:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9048, "total_steps": 9627, "loss": 1.7463, "learning_rate": 8.89861684132065e-07, "epoch": 0.9398566531629792, "percentage": 93.99, "elapsed_time": "2 days, 23:31:05", "remaining_time": "4:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9049, "total_steps": 9627, "loss": 1.6094, "learning_rate": 8.867996610160246e-07, "epoch": 0.9399605276825594, "percentage": 94.0, "elapsed_time": "2 days, 23:31:35", "remaining_time": "4:34:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9050, "total_steps": 9627, "loss": 1.7627, "learning_rate": 8.837428680727178e-07, "epoch": 0.9400644022021398, "percentage": 94.01, "elapsed_time": "2 days, 23:32:04", "remaining_time": "4:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9051, "total_steps": 9627, "loss": 1.7939, "learning_rate": 8.806913056276788e-07, "epoch": 0.9401682767217202, "percentage": 94.02, "elapsed_time": "2 days, 23:32:34", "remaining_time": "4:33:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9052, "total_steps": 9627, "loss": 1.7245, "learning_rate": 8.776449740058645e-07, "epoch": 0.9402721512413005, "percentage": 94.03, "elapsed_time": "2 days, 23:33:03", "remaining_time": "4:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9053, "total_steps": 9627, "loss": 1.5208, "learning_rate": 8.746038735316931e-07, "epoch": 0.9403760257608809, "percentage": 94.04, "elapsed_time": "2 days, 23:33:32", "remaining_time": "4:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9054, "total_steps": 9627, "loss": 1.8578, "learning_rate": 8.715680045290165e-07, "epoch": 0.9404799002804612, "percentage": 94.05, "elapsed_time": "2 days, 23:34:01", "remaining_time": "4:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9055, "total_steps": 9627, "loss": 1.6814, "learning_rate": 8.685373673211372e-07, "epoch": 0.9405837748000415, "percentage": 94.06, "elapsed_time": "2 days, 23:34:32", "remaining_time": "4:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9056, "total_steps": 9627, "loss": 1.327, "learning_rate": 8.655119622307806e-07, "epoch": 0.9406876493196219, "percentage": 94.07, "elapsed_time": "2 days, 23:35:01", "remaining_time": "4:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9057, "total_steps": 9627, "loss": 1.6839, "learning_rate": 8.624917895801388e-07, "epoch": 0.9407915238392023, "percentage": 94.08, "elapsed_time": "2 days, 23:35:31", "remaining_time": "4:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9058, "total_steps": 9627, "loss": 1.5596, "learning_rate": 8.594768496908378e-07, "epoch": 0.9408953983587826, "percentage": 94.09, "elapsed_time": "2 days, 23:36:00", "remaining_time": "4:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9059, "total_steps": 9627, "loss": 1.5437, "learning_rate": 8.564671428839321e-07, "epoch": 0.9409992728783629, "percentage": 94.1, "elapsed_time": "2 days, 23:36:30", "remaining_time": "4:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9060, "total_steps": 9627, "loss": 1.5591, "learning_rate": 8.534626694799485e-07, "epoch": 0.9411031473979433, "percentage": 94.11, "elapsed_time": "2 days, 23:37:00", "remaining_time": "4:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9061, "total_steps": 9627, "loss": 1.7288, "learning_rate": 8.504634297988312e-07, "epoch": 0.9412070219175236, "percentage": 94.12, "elapsed_time": "2 days, 23:37:30", "remaining_time": "4:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9062, "total_steps": 9627, "loss": 1.5736, "learning_rate": 8.4746942415998e-07, "epoch": 0.941310896437104, "percentage": 94.13, "elapsed_time": "2 days, 23:37:58", "remaining_time": "4:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9063, "total_steps": 9627, "loss": 1.5708, "learning_rate": 8.444806528822291e-07, "epoch": 0.9414147709566844, "percentage": 94.14, "elapsed_time": "2 days, 23:38:28", "remaining_time": "4:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9064, "total_steps": 9627, "loss": 1.6112, "learning_rate": 8.41497116283857e-07, "epoch": 0.9415186454762646, "percentage": 94.15, "elapsed_time": "2 days, 23:38:59", "remaining_time": "4:27:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9065, "total_steps": 9627, "loss": 1.6238, "learning_rate": 8.385188146825984e-07, "epoch": 0.941622519995845, "percentage": 94.16, "elapsed_time": "2 days, 23:39:28", "remaining_time": "4:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9066, "total_steps": 9627, "loss": 1.8539, "learning_rate": 8.355457483955998e-07, "epoch": 0.9417263945154254, "percentage": 94.17, "elapsed_time": "2 days, 23:39:58", "remaining_time": "4:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9067, "total_steps": 9627, "loss": 1.709, "learning_rate": 8.325779177394965e-07, "epoch": 0.9418302690350057, "percentage": 94.18, "elapsed_time": "2 days, 23:40:27", "remaining_time": "4:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9068, "total_steps": 9627, "loss": 1.8527, "learning_rate": 8.296153230303139e-07, "epoch": 0.941934143554586, "percentage": 94.19, "elapsed_time": "2 days, 23:40:57", "remaining_time": "4:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9069, "total_steps": 9627, "loss": 1.4964, "learning_rate": 8.266579645835548e-07, "epoch": 0.9420380180741664, "percentage": 94.2, "elapsed_time": "2 days, 23:41:27", "remaining_time": "4:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9070, "total_steps": 9627, "loss": 1.5452, "learning_rate": 8.237058427141619e-07, "epoch": 0.9421418925937467, "percentage": 94.21, "elapsed_time": "2 days, 23:41:57", "remaining_time": "4:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9071, "total_steps": 9627, "loss": 1.6578, "learning_rate": 8.20758957736506e-07, "epoch": 0.9422457671133271, "percentage": 94.22, "elapsed_time": "2 days, 23:42:26", "remaining_time": "4:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9072, "total_steps": 9627, "loss": 1.4836, "learning_rate": 8.178173099644082e-07, "epoch": 0.9423496416329075, "percentage": 94.23, "elapsed_time": "2 days, 23:42:57", "remaining_time": "4:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9073, "total_steps": 9627, "loss": 1.4885, "learning_rate": 8.148808997111234e-07, "epoch": 0.9424535161524878, "percentage": 94.25, "elapsed_time": "2 days, 23:43:26", "remaining_time": "4:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9074, "total_steps": 9627, "loss": 1.4961, "learning_rate": 8.119497272893739e-07, "epoch": 0.9425573906720681, "percentage": 94.26, "elapsed_time": "2 days, 23:43:56", "remaining_time": "4:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9075, "total_steps": 9627, "loss": 1.7644, "learning_rate": 8.090237930112932e-07, "epoch": 0.9426612651916485, "percentage": 94.27, "elapsed_time": "2 days, 23:44:25", "remaining_time": "4:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9076, "total_steps": 9627, "loss": 1.7283, "learning_rate": 8.061030971884709e-07, "epoch": 0.9427651397112289, "percentage": 94.28, "elapsed_time": "2 days, 23:44:55", "remaining_time": "4:21:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9077, "total_steps": 9627, "loss": 1.7438, "learning_rate": 8.031876401319471e-07, "epoch": 0.9428690142308092, "percentage": 94.29, "elapsed_time": "2 days, 23:45:24", "remaining_time": "4:20:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9078, "total_steps": 9627, "loss": 1.5288, "learning_rate": 8.002774221521903e-07, "epoch": 0.9429728887503895, "percentage": 94.3, "elapsed_time": "2 days, 23:45:55", "remaining_time": "4:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9079, "total_steps": 9627, "loss": 1.8106, "learning_rate": 7.973724435591135e-07, "epoch": 0.9430767632699699, "percentage": 94.31, "elapsed_time": "2 days, 23:46:25", "remaining_time": "4:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9080, "total_steps": 9627, "loss": 1.7294, "learning_rate": 7.944727046620748e-07, "epoch": 0.9431806377895502, "percentage": 94.32, "elapsed_time": "2 days, 23:46:55", "remaining_time": "4:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9081, "total_steps": 9627, "loss": 1.6364, "learning_rate": 7.915782057698772e-07, "epoch": 0.9432845123091306, "percentage": 94.33, "elapsed_time": "2 days, 23:47:24", "remaining_time": "4:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9082, "total_steps": 9627, "loss": 1.7965, "learning_rate": 7.886889471907521e-07, "epoch": 0.943388386828711, "percentage": 94.34, "elapsed_time": "2 days, 23:47:54", "remaining_time": "4:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9083, "total_steps": 9627, "loss": 1.6954, "learning_rate": 7.858049292324032e-07, "epoch": 0.9434922613482912, "percentage": 94.35, "elapsed_time": "2 days, 23:48:24", "remaining_time": "4:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9084, "total_steps": 9627, "loss": 1.5585, "learning_rate": 7.829261522019349e-07, "epoch": 0.9435961358678716, "percentage": 94.36, "elapsed_time": "2 days, 23:48:53", "remaining_time": "4:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9085, "total_steps": 9627, "loss": 1.6892, "learning_rate": 7.800526164059296e-07, "epoch": 0.943700010387452, "percentage": 94.37, "elapsed_time": "2 days, 23:49:24", "remaining_time": "4:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9086, "total_steps": 9627, "loss": 1.816, "learning_rate": 7.771843221503927e-07, "epoch": 0.9438038849070323, "percentage": 94.38, "elapsed_time": "2 days, 23:49:52", "remaining_time": "4:16:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9087, "total_steps": 9627, "loss": 1.5559, "learning_rate": 7.743212697407631e-07, "epoch": 0.9439077594266126, "percentage": 94.39, "elapsed_time": "2 days, 23:50:23", "remaining_time": "4:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9088, "total_steps": 9627, "loss": 1.7509, "learning_rate": 7.71463459481947e-07, "epoch": 0.944011633946193, "percentage": 94.4, "elapsed_time": "2 days, 23:50:52", "remaining_time": "4:15:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9089, "total_steps": 9627, "loss": 1.4442, "learning_rate": 7.686108916782786e-07, "epoch": 0.9441155084657733, "percentage": 94.41, "elapsed_time": "2 days, 23:51:22", "remaining_time": "4:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9090, "total_steps": 9627, "loss": 1.5161, "learning_rate": 7.657635666335316e-07, "epoch": 0.9442193829853537, "percentage": 94.42, "elapsed_time": "2 days, 23:51:52", "remaining_time": "4:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9091, "total_steps": 9627, "loss": 1.7279, "learning_rate": 7.629214846509191e-07, "epoch": 0.9443232575049341, "percentage": 94.43, "elapsed_time": "2 days, 23:52:22", "remaining_time": "4:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9092, "total_steps": 9627, "loss": 1.6004, "learning_rate": 7.600846460331046e-07, "epoch": 0.9444271320245143, "percentage": 94.44, "elapsed_time": "2 days, 23:52:52", "remaining_time": "4:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9093, "total_steps": 9627, "loss": 1.6926, "learning_rate": 7.572530510821907e-07, "epoch": 0.9445310065440947, "percentage": 94.45, "elapsed_time": "2 days, 23:53:22", "remaining_time": "4:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9094, "total_steps": 9627, "loss": 1.6929, "learning_rate": 7.544267000997141e-07, "epoch": 0.9446348810636751, "percentage": 94.46, "elapsed_time": "2 days, 23:53:52", "remaining_time": "4:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9095, "total_steps": 9627, "loss": 1.6725, "learning_rate": 7.516055933866728e-07, "epoch": 0.9447387555832554, "percentage": 94.47, "elapsed_time": "2 days, 23:54:21", "remaining_time": "4:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9096, "total_steps": 9627, "loss": 1.76, "learning_rate": 7.487897312434711e-07, "epoch": 0.9448426301028358, "percentage": 94.48, "elapsed_time": "2 days, 23:54:51", "remaining_time": "4:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9097, "total_steps": 9627, "loss": 1.6635, "learning_rate": 7.459791139699968e-07, "epoch": 0.9449465046224161, "percentage": 94.49, "elapsed_time": "2 days, 23:55:21", "remaining_time": "4:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9098, "total_steps": 9627, "loss": 1.7047, "learning_rate": 7.431737418655494e-07, "epoch": 0.9450503791419965, "percentage": 94.51, "elapsed_time": "2 days, 23:55:51", "remaining_time": "4:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9099, "total_steps": 9627, "loss": 1.4739, "learning_rate": 7.403736152288842e-07, "epoch": 0.9451542536615768, "percentage": 94.52, "elapsed_time": "2 days, 23:56:21", "remaining_time": "4:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9100, "total_steps": 9627, "loss": 1.8124, "learning_rate": 7.375787343581852e-07, "epoch": 0.9452581281811572, "percentage": 94.53, "elapsed_time": "2 days, 23:56:50", "remaining_time": "4:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9101, "total_steps": 9627, "loss": 1.7298, "learning_rate": 7.347890995510864e-07, "epoch": 0.9453620027007376, "percentage": 94.54, "elapsed_time": "2 days, 23:57:21", "remaining_time": "4:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9102, "total_steps": 9627, "loss": 1.6317, "learning_rate": 7.320047111046724e-07, "epoch": 0.9454658772203178, "percentage": 94.55, "elapsed_time": "2 days, 23:57:51", "remaining_time": "4:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9103, "total_steps": 9627, "loss": 1.6771, "learning_rate": 7.292255693154449e-07, "epoch": 0.9455697517398982, "percentage": 94.56, "elapsed_time": "2 days, 23:58:19", "remaining_time": "4:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9104, "total_steps": 9627, "loss": 1.6163, "learning_rate": 7.264516744793671e-07, "epoch": 0.9456736262594786, "percentage": 94.57, "elapsed_time": "2 days, 23:58:50", "remaining_time": "4:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9105, "total_steps": 9627, "loss": 1.6949, "learning_rate": 7.236830268918415e-07, "epoch": 0.9457775007790589, "percentage": 94.58, "elapsed_time": "2 days, 23:59:19", "remaining_time": "4:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9106, "total_steps": 9627, "loss": 1.5172, "learning_rate": 7.209196268477047e-07, "epoch": 0.9458813752986392, "percentage": 94.59, "elapsed_time": "2 days, 23:59:49", "remaining_time": "4:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9107, "total_steps": 9627, "loss": 1.5826, "learning_rate": 7.181614746412324e-07, "epoch": 0.9459852498182196, "percentage": 94.6, "elapsed_time": "3 days, 0:00:20", "remaining_time": "4:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9108, "total_steps": 9627, "loss": 1.8974, "learning_rate": 7.154085705661506e-07, "epoch": 0.9460891243377999, "percentage": 94.61, "elapsed_time": "3 days, 0:00:49", "remaining_time": "4:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9109, "total_steps": 9627, "loss": 1.7432, "learning_rate": 7.126609149156249e-07, "epoch": 0.9461929988573803, "percentage": 94.62, "elapsed_time": "3 days, 0:01:19", "remaining_time": "4:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9110, "total_steps": 9627, "loss": 1.614, "learning_rate": 7.09918507982249e-07, "epoch": 0.9462968733769607, "percentage": 94.63, "elapsed_time": "3 days, 0:01:48", "remaining_time": "4:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9111, "total_steps": 9627, "loss": 1.6488, "learning_rate": 7.071813500580837e-07, "epoch": 0.9464007478965409, "percentage": 94.64, "elapsed_time": "3 days, 0:02:18", "remaining_time": "4:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9112, "total_steps": 9627, "loss": 1.5024, "learning_rate": 7.044494414346015e-07, "epoch": 0.9465046224161213, "percentage": 94.65, "elapsed_time": "3 days, 0:02:49", "remaining_time": "4:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9113, "total_steps": 9627, "loss": 1.6628, "learning_rate": 7.017227824027305e-07, "epoch": 0.9466084969357017, "percentage": 94.66, "elapsed_time": "3 days, 0:03:17", "remaining_time": "4:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9114, "total_steps": 9627, "loss": 1.6693, "learning_rate": 6.990013732528444e-07, "epoch": 0.946712371455282, "percentage": 94.67, "elapsed_time": "3 days, 0:03:48", "remaining_time": "4:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9115, "total_steps": 9627, "loss": 1.5755, "learning_rate": 6.9628521427475e-07, "epoch": 0.9468162459748624, "percentage": 94.68, "elapsed_time": "3 days, 0:04:18", "remaining_time": "4:02:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9116, "total_steps": 9627, "loss": 1.6624, "learning_rate": 6.935743057576938e-07, "epoch": 0.9469201204944427, "percentage": 94.69, "elapsed_time": "3 days, 0:04:48", "remaining_time": "4:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9117, "total_steps": 9627, "loss": 1.6738, "learning_rate": 6.908686479903725e-07, "epoch": 0.947023995014023, "percentage": 94.7, "elapsed_time": "3 days, 0:05:17", "remaining_time": "4:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9118, "total_steps": 9627, "loss": 1.7311, "learning_rate": 6.881682412609114e-07, "epoch": 0.9471278695336034, "percentage": 94.71, "elapsed_time": "3 days, 0:05:48", "remaining_time": "4:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9119, "total_steps": 9627, "loss": 1.7126, "learning_rate": 6.854730858568914e-07, "epoch": 0.9472317440531838, "percentage": 94.72, "elapsed_time": "3 days, 0:06:17", "remaining_time": "4:01:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9120, "total_steps": 9627, "loss": 1.7939, "learning_rate": 6.827831820653163e-07, "epoch": 0.947335618572764, "percentage": 94.73, "elapsed_time": "3 days, 0:06:47", "remaining_time": "4:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9121, "total_steps": 9627, "loss": 1.6198, "learning_rate": 6.800985301726404e-07, "epoch": 0.9474394930923444, "percentage": 94.74, "elapsed_time": "3 days, 0:07:16", "remaining_time": "4:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9122, "total_steps": 9627, "loss": 1.73, "learning_rate": 6.77419130464757e-07, "epoch": 0.9475433676119248, "percentage": 94.75, "elapsed_time": "3 days, 0:07:47", "remaining_time": "3:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9123, "total_steps": 9627, "loss": 1.6677, "learning_rate": 6.747449832270158e-07, "epoch": 0.9476472421315052, "percentage": 94.76, "elapsed_time": "3 days, 0:08:16", "remaining_time": "3:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9124, "total_steps": 9627, "loss": 1.8017, "learning_rate": 6.720760887441779e-07, "epoch": 0.9477511166510855, "percentage": 94.78, "elapsed_time": "3 days, 0:08:47", "remaining_time": "3:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9125, "total_steps": 9627, "loss": 1.6173, "learning_rate": 6.694124473004604e-07, "epoch": 0.9478549911706659, "percentage": 94.79, "elapsed_time": "3 days, 0:09:15", "remaining_time": "3:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9126, "total_steps": 9627, "loss": 1.5386, "learning_rate": 6.667540591795307e-07, "epoch": 0.9479588656902462, "percentage": 94.8, "elapsed_time": "3 days, 0:09:46", "remaining_time": "3:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9127, "total_steps": 9627, "loss": 1.652, "learning_rate": 6.641009246644736e-07, "epoch": 0.9480627402098265, "percentage": 94.81, "elapsed_time": "3 days, 0:10:16", "remaining_time": "3:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9128, "total_steps": 9627, "loss": 1.6695, "learning_rate": 6.614530440378352e-07, "epoch": 0.9481666147294069, "percentage": 94.82, "elapsed_time": "3 days, 0:10:47", "remaining_time": "3:56:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9129, "total_steps": 9627, "loss": 1.4878, "learning_rate": 6.588104175815901e-07, "epoch": 0.9482704892489873, "percentage": 94.83, "elapsed_time": "3 days, 0:11:17", "remaining_time": "3:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9130, "total_steps": 9627, "loss": 1.6489, "learning_rate": 6.561730455771686e-07, "epoch": 0.9483743637685675, "percentage": 94.84, "elapsed_time": "3 days, 0:11:47", "remaining_time": "3:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9131, "total_steps": 9627, "loss": 1.6737, "learning_rate": 6.535409283054073e-07, "epoch": 0.9484782382881479, "percentage": 94.85, "elapsed_time": "3 days, 0:12:16", "remaining_time": "3:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9132, "total_steps": 9627, "loss": 1.6735, "learning_rate": 6.509140660466318e-07, "epoch": 0.9485821128077283, "percentage": 94.86, "elapsed_time": "3 days, 0:12:46", "remaining_time": "3:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9133, "total_steps": 9627, "loss": 1.6911, "learning_rate": 6.482924590805627e-07, "epoch": 0.9486859873273086, "percentage": 94.87, "elapsed_time": "3 days, 0:13:17", "remaining_time": "3:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9134, "total_steps": 9627, "loss": 1.5338, "learning_rate": 6.456761076863937e-07, "epoch": 0.948789861846889, "percentage": 94.88, "elapsed_time": "3 days, 0:13:46", "remaining_time": "3:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9135, "total_steps": 9627, "loss": 1.5234, "learning_rate": 6.430650121427406e-07, "epoch": 0.9488937363664693, "percentage": 94.89, "elapsed_time": "3 days, 0:14:17", "remaining_time": "3:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9136, "total_steps": 9627, "loss": 1.7075, "learning_rate": 6.404591727276588e-07, "epoch": 0.9489976108860496, "percentage": 94.9, "elapsed_time": "3 days, 0:14:46", "remaining_time": "3:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9137, "total_steps": 9627, "loss": 1.6455, "learning_rate": 6.378585897186651e-07, "epoch": 0.94910148540563, "percentage": 94.91, "elapsed_time": "3 days, 0:15:17", "remaining_time": "3:52:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9138, "total_steps": 9627, "loss": 1.5482, "learning_rate": 6.352632633926825e-07, "epoch": 0.9492053599252104, "percentage": 94.92, "elapsed_time": "3 days, 0:15:47", "remaining_time": "3:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9139, "total_steps": 9627, "loss": 1.7572, "learning_rate": 6.326731940261122e-07, "epoch": 0.9493092344447907, "percentage": 94.93, "elapsed_time": "3 days, 0:16:17", "remaining_time": "3:51:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9140, "total_steps": 9627, "loss": 1.6723, "learning_rate": 6.300883818947611e-07, "epoch": 0.949413108964371, "percentage": 94.94, "elapsed_time": "3 days, 0:16:46", "remaining_time": "3:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9141, "total_steps": 9627, "loss": 1.7014, "learning_rate": 6.275088272738927e-07, "epoch": 0.9495169834839514, "percentage": 94.95, "elapsed_time": "3 days, 0:17:17", "remaining_time": "3:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9142, "total_steps": 9627, "loss": 1.6569, "learning_rate": 6.249345304382259e-07, "epoch": 0.9496208580035317, "percentage": 94.96, "elapsed_time": "3 days, 0:17:46", "remaining_time": "3:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9143, "total_steps": 9627, "loss": 1.6363, "learning_rate": 6.223654916618804e-07, "epoch": 0.9497247325231121, "percentage": 94.97, "elapsed_time": "3 days, 0:18:17", "remaining_time": "3:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9144, "total_steps": 9627, "loss": 1.5838, "learning_rate": 6.19801711218454e-07, "epoch": 0.9498286070426925, "percentage": 94.98, "elapsed_time": "3 days, 0:18:47", "remaining_time": "3:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9145, "total_steps": 9627, "loss": 1.4252, "learning_rate": 6.172431893809616e-07, "epoch": 0.9499324815622727, "percentage": 94.99, "elapsed_time": "3 days, 0:19:16", "remaining_time": "3:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9146, "total_steps": 9627, "loss": 1.5948, "learning_rate": 6.146899264218742e-07, "epoch": 0.9500363560818531, "percentage": 95.0, "elapsed_time": "3 days, 0:19:47", "remaining_time": "3:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9147, "total_steps": 9627, "loss": 1.5962, "learning_rate": 6.121419226130909e-07, "epoch": 0.9501402306014335, "percentage": 95.01, "elapsed_time": "3 days, 0:20:17", "remaining_time": "3:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9148, "total_steps": 9627, "loss": 1.6758, "learning_rate": 6.095991782259447e-07, "epoch": 0.9502441051210138, "percentage": 95.02, "elapsed_time": "3 days, 0:20:47", "remaining_time": "3:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9149, "total_steps": 9627, "loss": 1.4357, "learning_rate": 6.070616935312357e-07, "epoch": 0.9503479796405941, "percentage": 95.03, "elapsed_time": "3 days, 0:21:17", "remaining_time": "3:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9150, "total_steps": 9627, "loss": 1.8251, "learning_rate": 6.045294687991643e-07, "epoch": 0.9504518541601745, "percentage": 95.05, "elapsed_time": "3 days, 0:21:48", "remaining_time": "3:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9151, "total_steps": 9627, "loss": 1.8014, "learning_rate": 6.020025042994148e-07, "epoch": 0.9505557286797549, "percentage": 95.06, "elapsed_time": "3 days, 0:22:18", "remaining_time": "3:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9152, "total_steps": 9627, "loss": 1.5917, "learning_rate": 5.994808003010777e-07, "epoch": 0.9506596031993352, "percentage": 95.07, "elapsed_time": "3 days, 0:22:47", "remaining_time": "3:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9153, "total_steps": 9627, "loss": 1.5155, "learning_rate": 5.969643570726935e-07, "epoch": 0.9507634777189156, "percentage": 95.08, "elapsed_time": "3 days, 0:23:18", "remaining_time": "3:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9154, "total_steps": 9627, "loss": 1.489, "learning_rate": 5.944531748822535e-07, "epoch": 0.9508673522384959, "percentage": 95.09, "elapsed_time": "3 days, 0:23:47", "remaining_time": "3:44:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9155, "total_steps": 9627, "loss": 1.4501, "learning_rate": 5.91947253997166e-07, "epoch": 0.9509712267580762, "percentage": 95.1, "elapsed_time": "3 days, 0:24:17", "remaining_time": "3:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9156, "total_steps": 9627, "loss": 1.5144, "learning_rate": 5.894465946843008e-07, "epoch": 0.9510751012776566, "percentage": 95.11, "elapsed_time": "3 days, 0:24:46", "remaining_time": "3:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9157, "total_steps": 9627, "loss": 1.6731, "learning_rate": 5.869511972099506e-07, "epoch": 0.951178975797237, "percentage": 95.12, "elapsed_time": "3 days, 0:25:18", "remaining_time": "3:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9158, "total_steps": 9627, "loss": 1.7321, "learning_rate": 5.844610618398693e-07, "epoch": 0.9512828503168173, "percentage": 95.13, "elapsed_time": "3 days, 0:25:47", "remaining_time": "3:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9159, "total_steps": 9627, "loss": 1.7712, "learning_rate": 5.819761888392228e-07, "epoch": 0.9513867248363976, "percentage": 95.14, "elapsed_time": "3 days, 0:26:18", "remaining_time": "3:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9160, "total_steps": 9627, "loss": 1.7595, "learning_rate": 5.794965784726436e-07, "epoch": 0.951490599355978, "percentage": 95.15, "elapsed_time": "3 days, 0:26:47", "remaining_time": "3:41:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9161, "total_steps": 9627, "loss": 1.7085, "learning_rate": 5.770222310041817e-07, "epoch": 0.9515944738755583, "percentage": 95.16, "elapsed_time": "3 days, 0:27:17", "remaining_time": "3:41:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9162, "total_steps": 9627, "loss": 1.7196, "learning_rate": 5.745531466973375e-07, "epoch": 0.9516983483951387, "percentage": 95.17, "elapsed_time": "3 days, 0:27:47", "remaining_time": "3:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9163, "total_steps": 9627, "loss": 1.7608, "learning_rate": 5.720893258150451e-07, "epoch": 0.951802222914719, "percentage": 95.18, "elapsed_time": "3 days, 0:28:17", "remaining_time": "3:40:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9164, "total_steps": 9627, "loss": 1.6069, "learning_rate": 5.696307686196944e-07, "epoch": 0.9519060974342993, "percentage": 95.19, "elapsed_time": "3 days, 0:28:46", "remaining_time": "3:39:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9165, "total_steps": 9627, "loss": 1.5777, "learning_rate": 5.67177475373093e-07, "epoch": 0.9520099719538797, "percentage": 95.2, "elapsed_time": "3 days, 0:29:16", "remaining_time": "3:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9166, "total_steps": 9627, "loss": 1.8119, "learning_rate": 5.647294463364927e-07, "epoch": 0.9521138464734601, "percentage": 95.21, "elapsed_time": "3 days, 0:29:46", "remaining_time": "3:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9167, "total_steps": 9627, "loss": 1.5702, "learning_rate": 5.622866817706074e-07, "epoch": 0.9522177209930404, "percentage": 95.22, "elapsed_time": "3 days, 0:30:15", "remaining_time": "3:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9168, "total_steps": 9627, "loss": 1.679, "learning_rate": 5.598491819355567e-07, "epoch": 0.9523215955126207, "percentage": 95.23, "elapsed_time": "3 days, 0:30:45", "remaining_time": "3:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9169, "total_steps": 9627, "loss": 1.6981, "learning_rate": 5.574169470909163e-07, "epoch": 0.9524254700322011, "percentage": 95.24, "elapsed_time": "3 days, 0:31:15", "remaining_time": "3:37:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9170, "total_steps": 9627, "loss": 1.5524, "learning_rate": 5.549899774957123e-07, "epoch": 0.9525293445517814, "percentage": 95.25, "elapsed_time": "3 days, 0:31:46", "remaining_time": "3:36:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9171, "total_steps": 9627, "loss": 1.7129, "learning_rate": 5.52568273408377e-07, "epoch": 0.9526332190713618, "percentage": 95.26, "elapsed_time": "3 days, 0:32:16", "remaining_time": "3:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9172, "total_steps": 9627, "loss": 1.5757, "learning_rate": 5.501518350868262e-07, "epoch": 0.9527370935909422, "percentage": 95.27, "elapsed_time": "3 days, 0:32:46", "remaining_time": "3:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9173, "total_steps": 9627, "loss": 1.6487, "learning_rate": 5.477406627883763e-07, "epoch": 0.9528409681105224, "percentage": 95.28, "elapsed_time": "3 days, 0:33:15", "remaining_time": "3:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9174, "total_steps": 9627, "loss": 1.7217, "learning_rate": 5.453347567698108e-07, "epoch": 0.9529448426301028, "percentage": 95.29, "elapsed_time": "3 days, 0:33:45", "remaining_time": "3:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9175, "total_steps": 9627, "loss": 1.644, "learning_rate": 5.429341172873248e-07, "epoch": 0.9530487171496832, "percentage": 95.3, "elapsed_time": "3 days, 0:34:15", "remaining_time": "3:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9176, "total_steps": 9627, "loss": 1.5666, "learning_rate": 5.405387445965748e-07, "epoch": 0.9531525916692636, "percentage": 95.32, "elapsed_time": "3 days, 0:34:45", "remaining_time": "3:34:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9177, "total_steps": 9627, "loss": 1.5313, "learning_rate": 5.381486389526569e-07, "epoch": 0.9532564661888439, "percentage": 95.33, "elapsed_time": "3 days, 0:35:15", "remaining_time": "3:33:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9178, "total_steps": 9627, "loss": 1.6146, "learning_rate": 5.35763800610084e-07, "epoch": 0.9533603407084242, "percentage": 95.34, "elapsed_time": "3 days, 0:35:45", "remaining_time": "3:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9179, "total_steps": 9627, "loss": 1.7637, "learning_rate": 5.333842298228364e-07, "epoch": 0.9534642152280046, "percentage": 95.35, "elapsed_time": "3 days, 0:36:15", "remaining_time": "3:32:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9180, "total_steps": 9627, "loss": 1.7589, "learning_rate": 5.310099268443114e-07, "epoch": 0.9535680897475849, "percentage": 95.36, "elapsed_time": "3 days, 0:36:45", "remaining_time": "3:32:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9181, "total_steps": 9627, "loss": 1.7186, "learning_rate": 5.286408919273567e-07, "epoch": 0.9536719642671653, "percentage": 95.37, "elapsed_time": "3 days, 0:37:15", "remaining_time": "3:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9182, "total_steps": 9627, "loss": 1.698, "learning_rate": 5.262771253242593e-07, "epoch": 0.9537758387867457, "percentage": 95.38, "elapsed_time": "3 days, 0:37:45", "remaining_time": "3:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9183, "total_steps": 9627, "loss": 1.4785, "learning_rate": 5.239186272867347e-07, "epoch": 0.9538797133063259, "percentage": 95.39, "elapsed_time": "3 days, 0:38:15", "remaining_time": "3:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9184, "total_steps": 9627, "loss": 1.7033, "learning_rate": 5.215653980659485e-07, "epoch": 0.9539835878259063, "percentage": 95.4, "elapsed_time": "3 days, 0:38:45", "remaining_time": "3:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9185, "total_steps": 9627, "loss": 1.6292, "learning_rate": 5.192174379124948e-07, "epoch": 0.9540874623454867, "percentage": 95.41, "elapsed_time": "3 days, 0:39:14", "remaining_time": "3:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9186, "total_steps": 9627, "loss": 1.5956, "learning_rate": 5.16874747076429e-07, "epoch": 0.954191336865067, "percentage": 95.42, "elapsed_time": "3 days, 0:39:44", "remaining_time": "3:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9187, "total_steps": 9627, "loss": 1.7799, "learning_rate": 5.145373258072129e-07, "epoch": 0.9542952113846473, "percentage": 95.43, "elapsed_time": "3 days, 0:40:14", "remaining_time": "3:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9188, "total_steps": 9627, "loss": 1.7143, "learning_rate": 5.122051743537692e-07, "epoch": 0.9543990859042277, "percentage": 95.44, "elapsed_time": "3 days, 0:40:44", "remaining_time": "3:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9189, "total_steps": 9627, "loss": 1.5772, "learning_rate": 5.098782929644607e-07, "epoch": 0.954502960423808, "percentage": 95.45, "elapsed_time": "3 days, 0:41:14", "remaining_time": "3:27:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9190, "total_steps": 9627, "loss": 1.7397, "learning_rate": 5.075566818870725e-07, "epoch": 0.9546068349433884, "percentage": 95.46, "elapsed_time": "3 days, 0:41:45", "remaining_time": "3:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9191, "total_steps": 9627, "loss": 1.6717, "learning_rate": 5.0524034136884e-07, "epoch": 0.9547107094629688, "percentage": 95.47, "elapsed_time": "3 days, 0:42:15", "remaining_time": "3:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9192, "total_steps": 9627, "loss": 1.6091, "learning_rate": 5.029292716564382e-07, "epoch": 0.954814583982549, "percentage": 95.48, "elapsed_time": "3 days, 0:42:44", "remaining_time": "3:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9193, "total_steps": 9627, "loss": 1.6914, "learning_rate": 5.006234729959813e-07, "epoch": 0.9549184585021294, "percentage": 95.49, "elapsed_time": "3 days, 0:43:14", "remaining_time": "3:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9194, "total_steps": 9627, "loss": 1.5895, "learning_rate": 4.983229456330063e-07, "epoch": 0.9550223330217098, "percentage": 95.5, "elapsed_time": "3 days, 0:43:44", "remaining_time": "3:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9195, "total_steps": 9627, "loss": 1.7004, "learning_rate": 4.960276898125227e-07, "epoch": 0.9551262075412901, "percentage": 95.51, "elapsed_time": "3 days, 0:44:14", "remaining_time": "3:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9196, "total_steps": 9627, "loss": 1.684, "learning_rate": 4.93737705778935e-07, "epoch": 0.9552300820608705, "percentage": 95.52, "elapsed_time": "3 days, 0:44:45", "remaining_time": "3:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9197, "total_steps": 9627, "loss": 1.8311, "learning_rate": 4.914529937761147e-07, "epoch": 0.9553339565804508, "percentage": 95.53, "elapsed_time": "3 days, 0:45:14", "remaining_time": "3:24:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9198, "total_steps": 9627, "loss": 1.5433, "learning_rate": 4.891735540473785e-07, "epoch": 0.9554378311000311, "percentage": 95.54, "elapsed_time": "3 days, 0:45:45", "remaining_time": "3:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9199, "total_steps": 9627, "loss": 1.6219, "learning_rate": 4.868993868354544e-07, "epoch": 0.9555417056196115, "percentage": 95.55, "elapsed_time": "3 days, 0:46:15", "remaining_time": "3:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9200, "total_steps": 9627, "loss": 1.6918, "learning_rate": 4.846304923825263e-07, "epoch": 0.9556455801391919, "percentage": 95.56, "elapsed_time": "3 days, 0:46:45", "remaining_time": "3:22:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9201, "total_steps": 9627, "loss": 1.5888, "learning_rate": 4.823668709302176e-07, "epoch": 0.9557494546587723, "percentage": 95.57, "elapsed_time": "3 days, 0:47:15", "remaining_time": "3:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9202, "total_steps": 9627, "loss": 1.6003, "learning_rate": 4.801085227195856e-07, "epoch": 0.9558533291783525, "percentage": 95.59, "elapsed_time": "3 days, 0:47:45", "remaining_time": "3:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9203, "total_steps": 9627, "loss": 1.6384, "learning_rate": 4.778554479911268e-07, "epoch": 0.9559572036979329, "percentage": 95.6, "elapsed_time": "3 days, 0:48:16", "remaining_time": "3:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9204, "total_steps": 9627, "loss": 1.6106, "learning_rate": 4.7560764698477146e-07, "epoch": 0.9560610782175133, "percentage": 95.61, "elapsed_time": "3 days, 0:48:45", "remaining_time": "3:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9205, "total_steps": 9627, "loss": 1.6064, "learning_rate": 4.7336511993990586e-07, "epoch": 0.9561649527370936, "percentage": 95.62, "elapsed_time": "3 days, 0:49:16", "remaining_time": "3:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9206, "total_steps": 9627, "loss": 1.8089, "learning_rate": 4.711278670953223e-07, "epoch": 0.956268827256674, "percentage": 95.63, "elapsed_time": "3 days, 0:49:46", "remaining_time": "3:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9207, "total_steps": 9627, "loss": 1.5888, "learning_rate": 4.688958886892858e-07, "epoch": 0.9563727017762543, "percentage": 95.64, "elapsed_time": "3 days, 0:50:15", "remaining_time": "3:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9208, "total_steps": 9627, "loss": 1.8167, "learning_rate": 4.666691849594784e-07, "epoch": 0.9564765762958346, "percentage": 95.65, "elapsed_time": "3 days, 0:50:45", "remaining_time": "3:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9209, "total_steps": 9627, "loss": 1.6155, "learning_rate": 4.6444775614302714e-07, "epoch": 0.956580450815415, "percentage": 95.66, "elapsed_time": "3 days, 0:51:16", "remaining_time": "3:18:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9210, "total_steps": 9627, "loss": 1.5941, "learning_rate": 4.6223160247650386e-07, "epoch": 0.9566843253349954, "percentage": 95.67, "elapsed_time": "3 days, 0:51:47", "remaining_time": "3:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9211, "total_steps": 9627, "loss": 1.5724, "learning_rate": 4.600207241958976e-07, "epoch": 0.9567881998545756, "percentage": 95.68, "elapsed_time": "3 days, 0:52:17", "remaining_time": "3:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9212, "total_steps": 9627, "loss": 1.6075, "learning_rate": 4.5781512153665884e-07, "epoch": 0.956892074374156, "percentage": 95.69, "elapsed_time": "3 days, 0:52:47", "remaining_time": "3:16:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9213, "total_steps": 9627, "loss": 1.7026, "learning_rate": 4.5561479473366644e-07, "epoch": 0.9569959488937364, "percentage": 95.7, "elapsed_time": "3 days, 0:53:18", "remaining_time": "3:16:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9214, "total_steps": 9627, "loss": 1.5035, "learning_rate": 4.53419744021244e-07, "epoch": 0.9570998234133167, "percentage": 95.71, "elapsed_time": "3 days, 0:53:48", "remaining_time": "3:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9215, "total_steps": 9627, "loss": 1.6648, "learning_rate": 4.5122996963313234e-07, "epoch": 0.9572036979328971, "percentage": 95.72, "elapsed_time": "3 days, 0:54:18", "remaining_time": "3:15:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9216, "total_steps": 9627, "loss": 1.5704, "learning_rate": 4.4904547180253386e-07, "epoch": 0.9573075724524774, "percentage": 95.73, "elapsed_time": "3 days, 0:54:48", "remaining_time": "3:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9217, "total_steps": 9627, "loss": 1.5082, "learning_rate": 4.468662507620847e-07, "epoch": 0.9574114469720577, "percentage": 95.74, "elapsed_time": "3 days, 0:55:18", "remaining_time": "3:14:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9218, "total_steps": 9627, "loss": 1.5791, "learning_rate": 4.446923067438491e-07, "epoch": 0.9575153214916381, "percentage": 95.75, "elapsed_time": "3 days, 0:55:50", "remaining_time": "3:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9219, "total_steps": 9627, "loss": 1.6155, "learning_rate": 4.425236399793364e-07, "epoch": 0.9576191960112185, "percentage": 95.76, "elapsed_time": "3 days, 0:56:20", "remaining_time": "3:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9220, "total_steps": 9627, "loss": 1.7276, "learning_rate": 4.403602506994897e-07, "epoch": 0.9577230705307987, "percentage": 95.77, "elapsed_time": "3 days, 0:56:49", "remaining_time": "3:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9221, "total_steps": 9627, "loss": 1.6508, "learning_rate": 4.382021391346969e-07, "epoch": 0.9578269450503791, "percentage": 95.78, "elapsed_time": "3 days, 0:57:20", "remaining_time": "3:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9222, "total_steps": 9627, "loss": 1.5887, "learning_rate": 4.360493055147796e-07, "epoch": 0.9579308195699595, "percentage": 95.79, "elapsed_time": "3 days, 0:57:50", "remaining_time": "3:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9223, "total_steps": 9627, "loss": 1.4538, "learning_rate": 4.339017500690046e-07, "epoch": 0.9580346940895398, "percentage": 95.8, "elapsed_time": "3 days, 0:58:21", "remaining_time": "3:11:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9224, "total_steps": 9627, "loss": 1.6011, "learning_rate": 4.3175947302605547e-07, "epoch": 0.9581385686091202, "percentage": 95.81, "elapsed_time": "3 days, 0:58:52", "remaining_time": "3:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9225, "total_steps": 9627, "loss": 1.6147, "learning_rate": 4.296224746140776e-07, "epoch": 0.9582424431287005, "percentage": 95.82, "elapsed_time": "3 days, 0:59:22", "remaining_time": "3:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9226, "total_steps": 9627, "loss": 1.6448, "learning_rate": 4.2749075506063883e-07, "epoch": 0.9583463176482809, "percentage": 95.83, "elapsed_time": "3 days, 0:59:53", "remaining_time": "3:10:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9227, "total_steps": 9627, "loss": 1.663, "learning_rate": 4.253643145927577e-07, "epoch": 0.9584501921678612, "percentage": 95.85, "elapsed_time": "3 days, 1:00:24", "remaining_time": "3:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9228, "total_steps": 9627, "loss": 1.4755, "learning_rate": 4.232431534368808e-07, "epoch": 0.9585540666874416, "percentage": 95.86, "elapsed_time": "3 days, 1:00:54", "remaining_time": "3:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9229, "total_steps": 9627, "loss": 1.6507, "learning_rate": 4.211272718188941e-07, "epoch": 0.958657941207022, "percentage": 95.87, "elapsed_time": "3 days, 1:01:25", "remaining_time": "3:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9230, "total_steps": 9627, "loss": 1.7877, "learning_rate": 4.190166699641229e-07, "epoch": 0.9587618157266022, "percentage": 95.88, "elapsed_time": "3 days, 1:01:56", "remaining_time": "3:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9231, "total_steps": 9627, "loss": 1.5952, "learning_rate": 4.169113480973319e-07, "epoch": 0.9588656902461826, "percentage": 95.89, "elapsed_time": "3 days, 1:02:26", "remaining_time": "3:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9232, "total_steps": 9627, "loss": 1.6713, "learning_rate": 4.148113064427139e-07, "epoch": 0.958969564765763, "percentage": 95.9, "elapsed_time": "3 days, 1:02:58", "remaining_time": "3:07:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9233, "total_steps": 9627, "loss": 1.728, "learning_rate": 4.127165452239179e-07, "epoch": 0.9590734392853433, "percentage": 95.91, "elapsed_time": "3 days, 1:03:28", "remaining_time": "3:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9234, "total_steps": 9627, "loss": 1.7331, "learning_rate": 4.106270646640098e-07, "epoch": 0.9591773138049237, "percentage": 95.92, "elapsed_time": "3 days, 1:03:59", "remaining_time": "3:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9235, "total_steps": 9627, "loss": 1.7273, "learning_rate": 4.085428649855061e-07, "epoch": 0.959281188324504, "percentage": 95.93, "elapsed_time": "3 days, 1:04:31", "remaining_time": "3:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9236, "total_steps": 9627, "loss": 1.6779, "learning_rate": 4.0646394641036255e-07, "epoch": 0.9593850628440843, "percentage": 95.94, "elapsed_time": "3 days, 1:05:00", "remaining_time": "3:05:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9237, "total_steps": 9627, "loss": 1.8105, "learning_rate": 4.043903091599632e-07, "epoch": 0.9594889373636647, "percentage": 95.95, "elapsed_time": "3 days, 1:05:32", "remaining_time": "3:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9238, "total_steps": 9627, "loss": 1.619, "learning_rate": 4.02321953455137e-07, "epoch": 0.9595928118832451, "percentage": 95.96, "elapsed_time": "3 days, 1:06:02", "remaining_time": "3:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9239, "total_steps": 9627, "loss": 1.5693, "learning_rate": 4.002588795161466e-07, "epoch": 0.9596966864028253, "percentage": 95.97, "elapsed_time": "3 days, 1:06:35", "remaining_time": "3:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9240, "total_steps": 9627, "loss": 1.8386, "learning_rate": 3.9820108756268846e-07, "epoch": 0.9598005609224057, "percentage": 95.98, "elapsed_time": "3 days, 1:07:04", "remaining_time": "3:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9241, "total_steps": 9627, "loss": 1.5334, "learning_rate": 3.9614857781390955e-07, "epoch": 0.9599044354419861, "percentage": 95.99, "elapsed_time": "3 days, 1:07:37", "remaining_time": "3:03:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9242, "total_steps": 9627, "loss": 1.7032, "learning_rate": 3.941013504883795e-07, "epoch": 0.9600083099615664, "percentage": 96.0, "elapsed_time": "3 days, 1:08:07", "remaining_time": "3:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9243, "total_steps": 9627, "loss": 1.741, "learning_rate": 3.920594058041183e-07, "epoch": 0.9601121844811468, "percentage": 96.01, "elapsed_time": "3 days, 1:08:37", "remaining_time": "3:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9244, "total_steps": 9627, "loss": 1.8403, "learning_rate": 3.9002274397856863e-07, "epoch": 0.9602160590007272, "percentage": 96.02, "elapsed_time": "3 days, 1:09:09", "remaining_time": "3:01:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9245, "total_steps": 9627, "loss": 1.6718, "learning_rate": 3.8799136522862933e-07, "epoch": 0.9603199335203074, "percentage": 96.03, "elapsed_time": "3 days, 1:09:40", "remaining_time": "3:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9246, "total_steps": 9627, "loss": 1.5569, "learning_rate": 3.859652697706162e-07, "epoch": 0.9604238080398878, "percentage": 96.04, "elapsed_time": "3 days, 1:10:11", "remaining_time": "3:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9247, "total_steps": 9627, "loss": 1.5302, "learning_rate": 3.8394445782030107e-07, "epoch": 0.9605276825594682, "percentage": 96.05, "elapsed_time": "3 days, 1:10:41", "remaining_time": "3:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9248, "total_steps": 9627, "loss": 1.6514, "learning_rate": 3.819289295928785e-07, "epoch": 0.9606315570790485, "percentage": 96.06, "elapsed_time": "3 days, 1:11:14", "remaining_time": "2:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9249, "total_steps": 9627, "loss": 1.5298, "learning_rate": 3.7991868530299345e-07, "epoch": 0.9607354315986288, "percentage": 96.07, "elapsed_time": "3 days, 1:11:44", "remaining_time": "2:59:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9250, "total_steps": 9627, "loss": 1.7081, "learning_rate": 3.7791372516470803e-07, "epoch": 0.9608393061182092, "percentage": 96.08, "elapsed_time": "3 days, 1:12:15", "remaining_time": "2:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9251, "total_steps": 9627, "loss": 1.7594, "learning_rate": 3.759140493915514e-07, "epoch": 0.9609431806377895, "percentage": 96.09, "elapsed_time": "3 days, 1:12:46", "remaining_time": "2:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9252, "total_steps": 9627, "loss": 1.5333, "learning_rate": 3.7391965819646435e-07, "epoch": 0.9610470551573699, "percentage": 96.1, "elapsed_time": "3 days, 1:13:18", "remaining_time": "2:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9253, "total_steps": 9627, "loss": 1.5122, "learning_rate": 3.7193055179183256e-07, "epoch": 0.9611509296769503, "percentage": 96.12, "elapsed_time": "3 days, 1:13:48", "remaining_time": "2:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9254, "total_steps": 9627, "loss": 1.7078, "learning_rate": 3.6994673038948655e-07, "epoch": 0.9612548041965306, "percentage": 96.13, "elapsed_time": "3 days, 1:14:20", "remaining_time": "2:57:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9255, "total_steps": 9627, "loss": 1.5883, "learning_rate": 3.679681942006852e-07, "epoch": 0.9613586787161109, "percentage": 96.14, "elapsed_time": "3 days, 1:14:49", "remaining_time": "2:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9256, "total_steps": 9627, "loss": 1.6098, "learning_rate": 3.6599494343612095e-07, "epoch": 0.9614625532356913, "percentage": 96.15, "elapsed_time": "3 days, 1:15:20", "remaining_time": "2:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9257, "total_steps": 9627, "loss": 1.6603, "learning_rate": 3.6402697830594243e-07, "epoch": 0.9615664277552717, "percentage": 96.16, "elapsed_time": "3 days, 1:15:52", "remaining_time": "2:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9258, "total_steps": 9627, "loss": 1.493, "learning_rate": 3.6206429901970985e-07, "epoch": 0.961670302274852, "percentage": 96.17, "elapsed_time": "3 days, 1:16:24", "remaining_time": "2:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9259, "total_steps": 9627, "loss": 1.5743, "learning_rate": 3.6010690578643924e-07, "epoch": 0.9617741767944323, "percentage": 96.18, "elapsed_time": "3 days, 1:16:54", "remaining_time": "2:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9260, "total_steps": 9627, "loss": 1.4523, "learning_rate": 3.58154798814575e-07, "epoch": 0.9618780513140127, "percentage": 96.19, "elapsed_time": "3 days, 1:17:25", "remaining_time": "2:54:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9261, "total_steps": 9627, "loss": 1.6645, "learning_rate": 3.56207978312012e-07, "epoch": 0.961981925833593, "percentage": 96.2, "elapsed_time": "3 days, 1:17:58", "remaining_time": "2:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9262, "total_steps": 9627, "loss": 1.5695, "learning_rate": 3.542664444860566e-07, "epoch": 0.9620858003531734, "percentage": 96.21, "elapsed_time": "3 days, 1:18:28", "remaining_time": "2:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9263, "total_steps": 9627, "loss": 1.5907, "learning_rate": 3.5233019754347117e-07, "epoch": 0.9621896748727538, "percentage": 96.22, "elapsed_time": "3 days, 1:18:59", "remaining_time": "2:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9264, "total_steps": 9627, "loss": 1.7391, "learning_rate": 3.503992376904575e-07, "epoch": 0.962293549392334, "percentage": 96.23, "elapsed_time": "3 days, 1:19:29", "remaining_time": "2:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9265, "total_steps": 9627, "loss": 1.6637, "learning_rate": 3.4847356513263986e-07, "epoch": 0.9623974239119144, "percentage": 96.24, "elapsed_time": "3 days, 1:20:00", "remaining_time": "2:51:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9266, "total_steps": 9627, "loss": 1.5119, "learning_rate": 3.4655318007509316e-07, "epoch": 0.9625012984314948, "percentage": 96.25, "elapsed_time": "3 days, 1:20:32", "remaining_time": "2:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9267, "total_steps": 9627, "loss": 1.5577, "learning_rate": 3.4463808272232055e-07, "epoch": 0.9626051729510751, "percentage": 96.26, "elapsed_time": "3 days, 1:21:02", "remaining_time": "2:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9268, "total_steps": 9627, "loss": 1.6157, "learning_rate": 3.427282732782644e-07, "epoch": 0.9627090474706554, "percentage": 96.27, "elapsed_time": "3 days, 1:21:34", "remaining_time": "2:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9269, "total_steps": 9627, "loss": 1.5988, "learning_rate": 3.4082375194630643e-07, "epoch": 0.9628129219902358, "percentage": 96.28, "elapsed_time": "3 days, 1:22:05", "remaining_time": "2:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9270, "total_steps": 9627, "loss": 1.5232, "learning_rate": 3.3892451892926227e-07, "epoch": 0.9629167965098161, "percentage": 96.29, "elapsed_time": "3 days, 1:22:36", "remaining_time": "2:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9271, "total_steps": 9627, "loss": 1.7633, "learning_rate": 3.370305744293867e-07, "epoch": 0.9630206710293965, "percentage": 96.3, "elapsed_time": "3 days, 1:23:09", "remaining_time": "2:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9272, "total_steps": 9627, "loss": 1.7437, "learning_rate": 3.351419186483684e-07, "epoch": 0.9631245455489769, "percentage": 96.31, "elapsed_time": "3 days, 1:23:38", "remaining_time": "2:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9273, "total_steps": 9627, "loss": 1.6749, "learning_rate": 3.3325855178733543e-07, "epoch": 0.9632284200685571, "percentage": 96.32, "elapsed_time": "3 days, 1:24:10", "remaining_time": "2:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9274, "total_steps": 9627, "loss": 1.7485, "learning_rate": 3.3138047404684957e-07, "epoch": 0.9633322945881375, "percentage": 96.33, "elapsed_time": "3 days, 1:24:41", "remaining_time": "2:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9275, "total_steps": 9627, "loss": 1.6725, "learning_rate": 3.295076856269119e-07, "epoch": 0.9634361691077179, "percentage": 96.34, "elapsed_time": "3 days, 1:25:11", "remaining_time": "2:47:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9276, "total_steps": 9627, "loss": 1.6062, "learning_rate": 3.2764018672696293e-07, "epoch": 0.9635400436272982, "percentage": 96.35, "elapsed_time": "3 days, 1:25:42", "remaining_time": "2:46:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9277, "total_steps": 9627, "loss": 1.7222, "learning_rate": 3.257779775458769e-07, "epoch": 0.9636439181468786, "percentage": 96.36, "elapsed_time": "3 days, 1:26:13", "remaining_time": "2:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9278, "total_steps": 9627, "loss": 1.7827, "learning_rate": 3.239210582819563e-07, "epoch": 0.9637477926664589, "percentage": 96.37, "elapsed_time": "3 days, 1:26:44", "remaining_time": "2:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9279, "total_steps": 9627, "loss": 1.7343, "learning_rate": 3.220694291329596e-07, "epoch": 0.9638516671860393, "percentage": 96.39, "elapsed_time": "3 days, 1:27:17", "remaining_time": "2:45:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9280, "total_steps": 9627, "loss": 1.3551, "learning_rate": 3.202230902960679e-07, "epoch": 0.9639555417056196, "percentage": 96.4, "elapsed_time": "3 days, 1:27:47", "remaining_time": "2:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9281, "total_steps": 9627, "loss": 1.5912, "learning_rate": 3.1838204196789625e-07, "epoch": 0.9640594162252, "percentage": 96.41, "elapsed_time": "3 days, 1:28:18", "remaining_time": "2:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9282, "total_steps": 9627, "loss": 1.6366, "learning_rate": 3.1654628434450437e-07, "epoch": 0.9641632907447804, "percentage": 96.42, "elapsed_time": "3 days, 1:28:49", "remaining_time": "2:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9283, "total_steps": 9627, "loss": 1.5546, "learning_rate": 3.147158176213916e-07, "epoch": 0.9642671652643606, "percentage": 96.43, "elapsed_time": "3 days, 1:29:21", "remaining_time": "2:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9284, "total_steps": 9627, "loss": 1.6533, "learning_rate": 3.1289064199347964e-07, "epoch": 0.964371039783941, "percentage": 96.44, "elapsed_time": "3 days, 1:29:53", "remaining_time": "2:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9285, "total_steps": 9627, "loss": 1.7311, "learning_rate": 3.110707576551408e-07, "epoch": 0.9644749143035214, "percentage": 96.45, "elapsed_time": "3 days, 1:30:23", "remaining_time": "2:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9286, "total_steps": 9627, "loss": 1.534, "learning_rate": 3.092561648001813e-07, "epoch": 0.9645787888231017, "percentage": 96.46, "elapsed_time": "3 days, 1:30:55", "remaining_time": "2:41:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9287, "total_steps": 9627, "loss": 1.6231, "learning_rate": 3.074468636218353e-07, "epoch": 0.964682663342682, "percentage": 96.47, "elapsed_time": "3 days, 1:31:26", "remaining_time": "2:41:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9288, "total_steps": 9627, "loss": 1.6062, "learning_rate": 3.056428543127765e-07, "epoch": 0.9647865378622624, "percentage": 96.48, "elapsed_time": "3 days, 1:31:58", "remaining_time": "2:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9289, "total_steps": 9627, "loss": 1.6621, "learning_rate": 3.038441370651346e-07, "epoch": 0.9648904123818427, "percentage": 96.49, "elapsed_time": "3 days, 1:32:29", "remaining_time": "2:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9290, "total_steps": 9627, "loss": 1.8125, "learning_rate": 3.020507120704341e-07, "epoch": 0.9649942869014231, "percentage": 96.5, "elapsed_time": "3 days, 1:33:00", "remaining_time": "2:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9291, "total_steps": 9627, "loss": 1.6262, "learning_rate": 3.002625795196834e-07, "epoch": 0.9650981614210035, "percentage": 96.51, "elapsed_time": "3 days, 1:33:32", "remaining_time": "2:39:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9292, "total_steps": 9627, "loss": 1.6016, "learning_rate": 2.9847973960329124e-07, "epoch": 0.9652020359405837, "percentage": 96.52, "elapsed_time": "3 days, 1:34:02", "remaining_time": "2:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9293, "total_steps": 9627, "loss": 1.9229, "learning_rate": 2.967021925111224e-07, "epoch": 0.9653059104601641, "percentage": 96.53, "elapsed_time": "3 days, 1:34:35", "remaining_time": "2:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9294, "total_steps": 9627, "loss": 1.5661, "learning_rate": 2.949299384324644e-07, "epoch": 0.9654097849797445, "percentage": 96.54, "elapsed_time": "3 days, 1:35:05", "remaining_time": "2:38:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9295, "total_steps": 9627, "loss": 1.542, "learning_rate": 2.931629775560607e-07, "epoch": 0.9655136594993248, "percentage": 96.55, "elapsed_time": "3 days, 1:35:38", "remaining_time": "2:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9296, "total_steps": 9627, "loss": 1.4694, "learning_rate": 2.914013100700663e-07, "epoch": 0.9656175340189052, "percentage": 96.56, "elapsed_time": "3 days, 1:36:10", "remaining_time": "2:37:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9297, "total_steps": 9627, "loss": 1.7179, "learning_rate": 2.896449361620923e-07, "epoch": 0.9657214085384855, "percentage": 96.57, "elapsed_time": "3 days, 1:36:40", "remaining_time": "2:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9298, "total_steps": 9627, "loss": 1.6341, "learning_rate": 2.8789385601917797e-07, "epoch": 0.9658252830580658, "percentage": 96.58, "elapsed_time": "3 days, 1:37:11", "remaining_time": "2:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9299, "total_steps": 9627, "loss": 1.8256, "learning_rate": 2.861480698277963e-07, "epoch": 0.9659291575776462, "percentage": 96.59, "elapsed_time": "3 days, 1:37:43", "remaining_time": "2:35:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9300, "total_steps": 9627, "loss": 1.8018, "learning_rate": 2.844075777738597e-07, "epoch": 0.9660330320972266, "percentage": 96.6, "elapsed_time": "3 days, 1:38:15", "remaining_time": "2:35:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9301, "total_steps": 9627, "loss": 1.6079, "learning_rate": 2.8267238004272554e-07, "epoch": 0.9661369066168068, "percentage": 96.61, "elapsed_time": "3 days, 1:38:46", "remaining_time": "2:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9302, "total_steps": 9627, "loss": 1.7133, "learning_rate": 2.8094247681916817e-07, "epoch": 0.9662407811363872, "percentage": 96.62, "elapsed_time": "3 days, 1:39:18", "remaining_time": "2:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9303, "total_steps": 9627, "loss": 1.6657, "learning_rate": 2.79217868287418e-07, "epoch": 0.9663446556559676, "percentage": 96.63, "elapsed_time": "3 days, 1:39:50", "remaining_time": "2:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9304, "total_steps": 9627, "loss": 1.6412, "learning_rate": 2.7749855463112265e-07, "epoch": 0.966448530175548, "percentage": 96.64, "elapsed_time": "3 days, 1:40:20", "remaining_time": "2:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9305, "total_steps": 9627, "loss": 1.6247, "learning_rate": 2.757845360333855e-07, "epoch": 0.9665524046951283, "percentage": 96.66, "elapsed_time": "3 days, 1:40:52", "remaining_time": "2:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9306, "total_steps": 9627, "loss": 1.6921, "learning_rate": 2.740758126767273e-07, "epoch": 0.9666562792147086, "percentage": 96.67, "elapsed_time": "3 days, 1:41:24", "remaining_time": "2:32:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9307, "total_steps": 9627, "loss": 1.9038, "learning_rate": 2.723723847431192e-07, "epoch": 0.966760153734289, "percentage": 96.68, "elapsed_time": "3 days, 1:41:56", "remaining_time": "2:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9308, "total_steps": 9627, "loss": 1.6905, "learning_rate": 2.7067425241396606e-07, "epoch": 0.9668640282538693, "percentage": 96.69, "elapsed_time": "3 days, 1:42:27", "remaining_time": "2:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9309, "total_steps": 9627, "loss": 1.5855, "learning_rate": 2.689814158700954e-07, "epoch": 0.9669679027734497, "percentage": 96.7, "elapsed_time": "3 days, 1:42:58", "remaining_time": "2:31:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9310, "total_steps": 9627, "loss": 1.5288, "learning_rate": 2.672938752917908e-07, "epoch": 0.9670717772930301, "percentage": 96.71, "elapsed_time": "3 days, 1:43:30", "remaining_time": "2:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9311, "total_steps": 9627, "loss": 1.6313, "learning_rate": 2.6561163085875863e-07, "epoch": 0.9671756518126103, "percentage": 96.72, "elapsed_time": "3 days, 1:44:02", "remaining_time": "2:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9312, "total_steps": 9627, "loss": 1.6358, "learning_rate": 2.6393468275014434e-07, "epoch": 0.9672795263321907, "percentage": 96.73, "elapsed_time": "3 days, 1:44:33", "remaining_time": "2:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9313, "total_steps": 9627, "loss": 1.8352, "learning_rate": 2.6226303114452733e-07, "epoch": 0.9673834008517711, "percentage": 96.74, "elapsed_time": "3 days, 1:45:05", "remaining_time": "2:29:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9314, "total_steps": 9627, "loss": 1.7763, "learning_rate": 2.605966762199319e-07, "epoch": 0.9674872753713514, "percentage": 96.75, "elapsed_time": "3 days, 1:45:36", "remaining_time": "2:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9315, "total_steps": 9627, "loss": 1.6718, "learning_rate": 2.58935618153805e-07, "epoch": 0.9675911498909318, "percentage": 96.76, "elapsed_time": "3 days, 1:46:08", "remaining_time": "2:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9316, "total_steps": 9627, "loss": 1.7835, "learning_rate": 2.5727985712303836e-07, "epoch": 0.9676950244105121, "percentage": 96.77, "elapsed_time": "3 days, 1:46:40", "remaining_time": "2:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9317, "total_steps": 9627, "loss": 1.7533, "learning_rate": 2.5562939330396327e-07, "epoch": 0.9677988989300924, "percentage": 96.78, "elapsed_time": "3 days, 1:47:11", "remaining_time": "2:27:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9318, "total_steps": 9627, "loss": 1.5438, "learning_rate": 2.539842268723336e-07, "epoch": 0.9679027734496728, "percentage": 96.79, "elapsed_time": "3 days, 1:47:43", "remaining_time": "2:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9319, "total_steps": 9627, "loss": 1.6705, "learning_rate": 2.5234435800335354e-07, "epoch": 0.9680066479692532, "percentage": 96.8, "elapsed_time": "3 days, 1:48:14", "remaining_time": "2:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9320, "total_steps": 9627, "loss": 1.7153, "learning_rate": 2.507097868716501e-07, "epoch": 0.9681105224888334, "percentage": 96.81, "elapsed_time": "3 days, 1:48:46", "remaining_time": "2:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9321, "total_steps": 9627, "loss": 1.716, "learning_rate": 2.4908051365129524e-07, "epoch": 0.9682143970084138, "percentage": 96.82, "elapsed_time": "3 days, 1:49:17", "remaining_time": "2:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9322, "total_steps": 9627, "loss": 1.6264, "learning_rate": 2.4745653851579453e-07, "epoch": 0.9683182715279942, "percentage": 96.83, "elapsed_time": "3 days, 1:49:50", "remaining_time": "2:24:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9323, "total_steps": 9627, "loss": 1.8135, "learning_rate": 2.458378616380874e-07, "epoch": 0.9684221460475745, "percentage": 96.84, "elapsed_time": "3 days, 1:50:20", "remaining_time": "2:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9324, "total_steps": 9627, "loss": 1.8665, "learning_rate": 2.442244831905471e-07, "epoch": 0.9685260205671549, "percentage": 96.85, "elapsed_time": "3 days, 1:50:52", "remaining_time": "2:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9325, "total_steps": 9627, "loss": 1.6818, "learning_rate": 2.426164033449918e-07, "epoch": 0.9686298950867352, "percentage": 96.86, "elapsed_time": "3 days, 1:51:24", "remaining_time": "2:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9326, "total_steps": 9627, "loss": 1.5506, "learning_rate": 2.4101362227266776e-07, "epoch": 0.9687337696063155, "percentage": 96.87, "elapsed_time": "3 days, 1:51:55", "remaining_time": "2:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9327, "total_steps": 9627, "loss": 1.8326, "learning_rate": 2.394161401442552e-07, "epoch": 0.9688376441258959, "percentage": 96.88, "elapsed_time": "3 days, 1:52:28", "remaining_time": "2:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9328, "total_steps": 9627, "loss": 1.8348, "learning_rate": 2.3782395712987903e-07, "epoch": 0.9689415186454763, "percentage": 96.89, "elapsed_time": "3 days, 1:53:00", "remaining_time": "2:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9329, "total_steps": 9627, "loss": 1.7733, "learning_rate": 2.3623707339909262e-07, "epoch": 0.9690453931650566, "percentage": 96.9, "elapsed_time": "3 days, 1:53:31", "remaining_time": "2:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9330, "total_steps": 9627, "loss": 1.5234, "learning_rate": 2.3465548912088296e-07, "epoch": 0.9691492676846369, "percentage": 96.91, "elapsed_time": "3 days, 1:54:03", "remaining_time": "2:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9331, "total_steps": 9627, "loss": 1.3639, "learning_rate": 2.3307920446368203e-07, "epoch": 0.9692531422042173, "percentage": 96.93, "elapsed_time": "3 days, 1:54:35", "remaining_time": "2:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9332, "total_steps": 9627, "loss": 1.6738, "learning_rate": 2.3150821959534442e-07, "epoch": 0.9693570167237977, "percentage": 96.94, "elapsed_time": "3 days, 1:55:07", "remaining_time": "2:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9333, "total_steps": 9627, "loss": 1.5251, "learning_rate": 2.299425346831807e-07, "epoch": 0.969460891243378, "percentage": 96.95, "elapsed_time": "3 days, 1:55:38", "remaining_time": "2:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9334, "total_steps": 9627, "loss": 1.6638, "learning_rate": 2.2838214989390762e-07, "epoch": 0.9695647657629584, "percentage": 96.96, "elapsed_time": "3 days, 1:56:10", "remaining_time": "2:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9335, "total_steps": 9627, "loss": 1.4951, "learning_rate": 2.2682706539370324e-07, "epoch": 0.9696686402825387, "percentage": 96.97, "elapsed_time": "3 days, 1:56:42", "remaining_time": "2:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9336, "total_steps": 9627, "loss": 1.7103, "learning_rate": 2.2527728134817406e-07, "epoch": 0.969772514802119, "percentage": 96.98, "elapsed_time": "3 days, 1:57:15", "remaining_time": "2:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9337, "total_steps": 9627, "loss": 1.6718, "learning_rate": 2.2373279792235468e-07, "epoch": 0.9698763893216994, "percentage": 96.99, "elapsed_time": "3 days, 1:57:45", "remaining_time": "2:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9338, "total_steps": 9627, "loss": 1.6202, "learning_rate": 2.2219361528071912e-07, "epoch": 0.9699802638412798, "percentage": 97.0, "elapsed_time": "3 days, 1:58:17", "remaining_time": "2:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9339, "total_steps": 9627, "loss": 1.5318, "learning_rate": 2.2065973358718627e-07, "epoch": 0.97008413836086, "percentage": 97.01, "elapsed_time": "3 days, 1:58:48", "remaining_time": "2:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9340, "total_steps": 9627, "loss": 1.6927, "learning_rate": 2.191311530050977e-07, "epoch": 0.9701880128804404, "percentage": 97.02, "elapsed_time": "3 days, 1:59:20", "remaining_time": "2:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9341, "total_steps": 9627, "loss": 1.6946, "learning_rate": 2.1760787369723423e-07, "epoch": 0.9702918874000208, "percentage": 97.03, "elapsed_time": "3 days, 1:59:53", "remaining_time": "2:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9342, "total_steps": 9627, "loss": 1.4909, "learning_rate": 2.160898958258162e-07, "epoch": 0.9703957619196011, "percentage": 97.04, "elapsed_time": "3 days, 2:00:25", "remaining_time": "2:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9343, "total_steps": 9627, "loss": 1.5696, "learning_rate": 2.14577219552492e-07, "epoch": 0.9704996364391815, "percentage": 97.05, "elapsed_time": "3 days, 2:00:55", "remaining_time": "2:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9344, "total_steps": 9627, "loss": 1.5663, "learning_rate": 2.1306984503835504e-07, "epoch": 0.9706035109587619, "percentage": 97.06, "elapsed_time": "3 days, 2:01:28", "remaining_time": "2:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9345, "total_steps": 9627, "loss": 1.7372, "learning_rate": 2.115677724439269e-07, "epoch": 0.9707073854783421, "percentage": 97.07, "elapsed_time": "3 days, 2:01:59", "remaining_time": "2:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9346, "total_steps": 9627, "loss": 1.6569, "learning_rate": 2.1007100192916296e-07, "epoch": 0.9708112599979225, "percentage": 97.08, "elapsed_time": "3 days, 2:02:30", "remaining_time": "2:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9347, "total_steps": 9627, "loss": 1.5835, "learning_rate": 2.085795336534635e-07, "epoch": 0.9709151345175029, "percentage": 97.09, "elapsed_time": "3 days, 2:03:03", "remaining_time": "2:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9348, "total_steps": 9627, "loss": 1.7689, "learning_rate": 2.0709336777565702e-07, "epoch": 0.9710190090370832, "percentage": 97.1, "elapsed_time": "3 days, 2:03:34", "remaining_time": "2:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9349, "total_steps": 9627, "loss": 1.6882, "learning_rate": 2.0561250445400583e-07, "epoch": 0.9711228835566635, "percentage": 97.11, "elapsed_time": "3 days, 2:04:07", "remaining_time": "2:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9350, "total_steps": 9627, "loss": 1.7222, "learning_rate": 2.041369438462115e-07, "epoch": 0.9712267580762439, "percentage": 97.12, "elapsed_time": "3 days, 2:04:38", "remaining_time": "2:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9351, "total_steps": 9627, "loss": 1.4399, "learning_rate": 2.0266668610940952e-07, "epoch": 0.9713306325958242, "percentage": 97.13, "elapsed_time": "3 days, 2:05:10", "remaining_time": "2:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9352, "total_steps": 9627, "loss": 1.4723, "learning_rate": 2.012017314001746e-07, "epoch": 0.9714345071154046, "percentage": 97.14, "elapsed_time": "3 days, 2:05:42", "remaining_time": "2:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9353, "total_steps": 9627, "loss": 1.739, "learning_rate": 1.9974207987450422e-07, "epoch": 0.971538381634985, "percentage": 97.15, "elapsed_time": "3 days, 2:06:14", "remaining_time": "2:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9354, "total_steps": 9627, "loss": 1.7562, "learning_rate": 1.9828773168785175e-07, "epoch": 0.9716422561545652, "percentage": 97.16, "elapsed_time": "3 days, 2:06:45", "remaining_time": "2:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9355, "total_steps": 9627, "loss": 1.6564, "learning_rate": 1.9683868699508224e-07, "epoch": 0.9717461306741456, "percentage": 97.17, "elapsed_time": "3 days, 2:07:18", "remaining_time": "2:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9356, "total_steps": 9627, "loss": 1.6676, "learning_rate": 1.9539494595051112e-07, "epoch": 0.971850005193726, "percentage": 97.19, "elapsed_time": "3 days, 2:07:50", "remaining_time": "2:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9357, "total_steps": 9627, "loss": 1.6582, "learning_rate": 1.9395650870789316e-07, "epoch": 0.9719538797133064, "percentage": 97.2, "elapsed_time": "3 days, 2:08:20", "remaining_time": "2:08:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9358, "total_steps": 9627, "loss": 1.7257, "learning_rate": 1.9252337542040034e-07, "epoch": 0.9720577542328867, "percentage": 97.21, "elapsed_time": "3 days, 2:08:53", "remaining_time": "2:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9359, "total_steps": 9627, "loss": 1.6339, "learning_rate": 1.910955462406605e-07, "epoch": 0.972161628752467, "percentage": 97.22, "elapsed_time": "3 days, 2:09:25", "remaining_time": "2:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9360, "total_steps": 9627, "loss": 1.5516, "learning_rate": 1.8967302132071317e-07, "epoch": 0.9722655032720474, "percentage": 97.23, "elapsed_time": "3 days, 2:09:56", "remaining_time": "2:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9361, "total_steps": 9627, "loss": 1.6057, "learning_rate": 1.882558008120594e-07, "epoch": 0.9723693777916277, "percentage": 97.24, "elapsed_time": "3 days, 2:10:28", "remaining_time": "2:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9362, "total_steps": 9627, "loss": 1.6723, "learning_rate": 1.8684388486561733e-07, "epoch": 0.9724732523112081, "percentage": 97.25, "elapsed_time": "3 days, 2:11:00", "remaining_time": "2:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9363, "total_steps": 9627, "loss": 1.5695, "learning_rate": 1.854372736317389e-07, "epoch": 0.9725771268307885, "percentage": 97.26, "elapsed_time": "3 days, 2:11:33", "remaining_time": "2:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9364, "total_steps": 9627, "loss": 1.4115, "learning_rate": 1.8403596726022653e-07, "epoch": 0.9726810013503687, "percentage": 97.27, "elapsed_time": "3 days, 2:12:04", "remaining_time": "2:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9365, "total_steps": 9627, "loss": 1.6466, "learning_rate": 1.8263996590029976e-07, "epoch": 0.9727848758699491, "percentage": 97.28, "elapsed_time": "3 days, 2:12:35", "remaining_time": "2:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9366, "total_steps": 9627, "loss": 1.5191, "learning_rate": 1.812492697006285e-07, "epoch": 0.9728887503895295, "percentage": 97.29, "elapsed_time": "3 days, 2:13:08", "remaining_time": "2:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9367, "total_steps": 9627, "loss": 1.8303, "learning_rate": 1.79863878809311e-07, "epoch": 0.9729926249091098, "percentage": 97.3, "elapsed_time": "3 days, 2:13:39", "remaining_time": "2:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9368, "total_steps": 9627, "loss": 1.6194, "learning_rate": 1.7848379337387922e-07, "epoch": 0.9730964994286901, "percentage": 97.31, "elapsed_time": "3 days, 2:14:11", "remaining_time": "2:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9369, "total_steps": 9627, "loss": 1.6873, "learning_rate": 1.7710901354129894e-07, "epoch": 0.9732003739482705, "percentage": 97.32, "elapsed_time": "3 days, 2:14:43", "remaining_time": "2:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9370, "total_steps": 9627, "loss": 1.7127, "learning_rate": 1.7573953945796973e-07, "epoch": 0.9733042484678508, "percentage": 97.33, "elapsed_time": "3 days, 2:15:15", "remaining_time": "2:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9371, "total_steps": 9627, "loss": 1.4936, "learning_rate": 1.7437537126974158e-07, "epoch": 0.9734081229874312, "percentage": 97.34, "elapsed_time": "3 days, 2:15:48", "remaining_time": "2:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9372, "total_steps": 9627, "loss": 1.7144, "learning_rate": 1.7301650912188162e-07, "epoch": 0.9735119975070116, "percentage": 97.35, "elapsed_time": "3 days, 2:16:20", "remaining_time": "2:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9373, "total_steps": 9627, "loss": 1.7131, "learning_rate": 1.716629531590963e-07, "epoch": 0.9736158720265918, "percentage": 97.36, "elapsed_time": "3 days, 2:16:51", "remaining_time": "2:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9374, "total_steps": 9627, "loss": 1.4595, "learning_rate": 1.7031470352553146e-07, "epoch": 0.9737197465461722, "percentage": 97.37, "elapsed_time": "3 days, 2:17:23", "remaining_time": "2:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9375, "total_steps": 9627, "loss": 1.6428, "learning_rate": 1.6897176036476115e-07, "epoch": 0.9738236210657526, "percentage": 97.38, "elapsed_time": "3 days, 2:17:55", "remaining_time": "1:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9376, "total_steps": 9627, "loss": 1.6586, "learning_rate": 1.6763412381980425e-07, "epoch": 0.9739274955853329, "percentage": 97.39, "elapsed_time": "3 days, 2:18:27", "remaining_time": "1:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9377, "total_steps": 9627, "loss": 1.7705, "learning_rate": 1.6630179403310797e-07, "epoch": 0.9740313701049133, "percentage": 97.4, "elapsed_time": "3 days, 2:18:59", "remaining_time": "1:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9378, "total_steps": 9627, "loss": 1.604, "learning_rate": 1.6497477114654768e-07, "epoch": 0.9741352446244936, "percentage": 97.41, "elapsed_time": "3 days, 2:19:30", "remaining_time": "1:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9379, "total_steps": 9627, "loss": 1.5545, "learning_rate": 1.6365305530144926e-07, "epoch": 0.9742391191440739, "percentage": 97.42, "elapsed_time": "3 days, 2:20:02", "remaining_time": "1:57:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9380, "total_steps": 9627, "loss": 1.6171, "learning_rate": 1.623366466385612e-07, "epoch": 0.9743429936636543, "percentage": 97.43, "elapsed_time": "3 days, 2:20:34", "remaining_time": "1:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9381, "total_steps": 9627, "loss": 1.7076, "learning_rate": 1.6102554529807134e-07, "epoch": 0.9744468681832347, "percentage": 97.44, "elapsed_time": "3 days, 2:21:06", "remaining_time": "1:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9382, "total_steps": 9627, "loss": 1.6506, "learning_rate": 1.5971975141960138e-07, "epoch": 0.974550742702815, "percentage": 97.46, "elapsed_time": "3 days, 2:21:37", "remaining_time": "1:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9383, "total_steps": 9627, "loss": 1.526, "learning_rate": 1.5841926514220674e-07, "epoch": 0.9746546172223953, "percentage": 97.47, "elapsed_time": "3 days, 2:22:09", "remaining_time": "1:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9384, "total_steps": 9627, "loss": 1.7779, "learning_rate": 1.571240866043877e-07, "epoch": 0.9747584917419757, "percentage": 97.48, "elapsed_time": "3 days, 2:22:41", "remaining_time": "1:55:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9385, "total_steps": 9627, "loss": 1.7611, "learning_rate": 1.5583421594405623e-07, "epoch": 0.9748623662615561, "percentage": 97.49, "elapsed_time": "3 days, 2:23:14", "remaining_time": "1:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9386, "total_steps": 9627, "loss": 1.5896, "learning_rate": 1.5454965329858573e-07, "epoch": 0.9749662407811364, "percentage": 97.5, "elapsed_time": "3 days, 2:23:45", "remaining_time": "1:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9387, "total_steps": 9627, "loss": 1.59, "learning_rate": 1.5327039880477234e-07, "epoch": 0.9750701153007167, "percentage": 97.51, "elapsed_time": "3 days, 2:24:18", "remaining_time": "1:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9388, "total_steps": 9627, "loss": 1.6747, "learning_rate": 1.5199645259883488e-07, "epoch": 0.9751739898202971, "percentage": 97.52, "elapsed_time": "3 days, 2:24:50", "remaining_time": "1:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9389, "total_steps": 9627, "loss": 1.5841, "learning_rate": 1.5072781481644816e-07, "epoch": 0.9752778643398774, "percentage": 97.53, "elapsed_time": "3 days, 2:25:21", "remaining_time": "1:53:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9390, "total_steps": 9627, "loss": 1.661, "learning_rate": 1.4946448559270964e-07, "epoch": 0.9753817388594578, "percentage": 97.54, "elapsed_time": "3 days, 2:25:53", "remaining_time": "1:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9391, "total_steps": 9627, "loss": 1.5102, "learning_rate": 1.4820646506215064e-07, "epoch": 0.9754856133790382, "percentage": 97.55, "elapsed_time": "3 days, 2:26:25", "remaining_time": "1:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9392, "total_steps": 9627, "loss": 1.4286, "learning_rate": 1.4695375335875282e-07, "epoch": 0.9755894878986184, "percentage": 97.56, "elapsed_time": "3 days, 2:26:57", "remaining_time": "1:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9393, "total_steps": 9627, "loss": 1.6924, "learning_rate": 1.45706350615904e-07, "epoch": 0.9756933624181988, "percentage": 97.57, "elapsed_time": "3 days, 2:27:29", "remaining_time": "1:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9394, "total_steps": 9627, "loss": 1.5943, "learning_rate": 1.444642569664534e-07, "epoch": 0.9757972369377792, "percentage": 97.58, "elapsed_time": "3 days, 2:28:01", "remaining_time": "1:50:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9395, "total_steps": 9627, "loss": 1.628, "learning_rate": 1.43227472542673e-07, "epoch": 0.9759011114573595, "percentage": 97.59, "elapsed_time": "3 days, 2:28:34", "remaining_time": "1:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9396, "total_steps": 9627, "loss": 1.4475, "learning_rate": 1.4199599747626303e-07, "epoch": 0.9760049859769399, "percentage": 97.6, "elapsed_time": "3 days, 2:29:06", "remaining_time": "1:49:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9397, "total_steps": 9627, "loss": 1.6782, "learning_rate": 1.4076983189837967e-07, "epoch": 0.9761088604965202, "percentage": 97.61, "elapsed_time": "3 days, 2:29:38", "remaining_time": "1:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9398, "total_steps": 9627, "loss": 1.5824, "learning_rate": 1.3954897593958516e-07, "epoch": 0.9762127350161005, "percentage": 97.62, "elapsed_time": "3 days, 2:30:10", "remaining_time": "1:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9399, "total_steps": 9627, "loss": 1.5385, "learning_rate": 1.3833342972990327e-07, "epoch": 0.9763166095356809, "percentage": 97.63, "elapsed_time": "3 days, 2:30:41", "remaining_time": "1:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9400, "total_steps": 9627, "loss": 1.7366, "learning_rate": 1.371231933987749e-07, "epoch": 0.9764204840552613, "percentage": 97.64, "elapsed_time": "3 days, 2:31:13", "remaining_time": "1:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9401, "total_steps": 9627, "loss": 1.5265, "learning_rate": 1.3591826707508026e-07, "epoch": 0.9765243585748415, "percentage": 97.65, "elapsed_time": "3 days, 2:31:46", "remaining_time": "1:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9402, "total_steps": 9627, "loss": 1.7914, "learning_rate": 1.3471865088713342e-07, "epoch": 0.9766282330944219, "percentage": 97.66, "elapsed_time": "3 days, 2:32:18", "remaining_time": "1:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9403, "total_steps": 9627, "loss": 1.6576, "learning_rate": 1.3352434496268773e-07, "epoch": 0.9767321076140023, "percentage": 97.67, "elapsed_time": "3 days, 2:32:50", "remaining_time": "1:46:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9404, "total_steps": 9627, "loss": 1.7209, "learning_rate": 1.3233534942892477e-07, "epoch": 0.9768359821335826, "percentage": 97.68, "elapsed_time": "3 days, 2:33:21", "remaining_time": "1:46:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9405, "total_steps": 9627, "loss": 1.6706, "learning_rate": 1.311516644124655e-07, "epoch": 0.976939856653163, "percentage": 97.69, "elapsed_time": "3 days, 2:33:54", "remaining_time": "1:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9406, "total_steps": 9627, "loss": 1.598, "learning_rate": 1.299732900393591e-07, "epoch": 0.9770437311727433, "percentage": 97.7, "elapsed_time": "3 days, 2:34:25", "remaining_time": "1:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9407, "total_steps": 9627, "loss": 1.6247, "learning_rate": 1.2880022643509958e-07, "epoch": 0.9771476056923236, "percentage": 97.71, "elapsed_time": "3 days, 2:34:58", "remaining_time": "1:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9408, "total_steps": 9627, "loss": 1.6006, "learning_rate": 1.2763247372460374e-07, "epoch": 0.977251480211904, "percentage": 97.73, "elapsed_time": "3 days, 2:35:29", "remaining_time": "1:44:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9409, "total_steps": 9627, "loss": 1.6009, "learning_rate": 1.2647003203223318e-07, "epoch": 0.9773553547314844, "percentage": 97.74, "elapsed_time": "3 days, 2:36:01", "remaining_time": "1:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9410, "total_steps": 9627, "loss": 1.6934, "learning_rate": 1.2531290148177221e-07, "epoch": 0.9774592292510648, "percentage": 97.75, "elapsed_time": "3 days, 2:36:33", "remaining_time": "1:43:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9411, "total_steps": 9627, "loss": 1.7892, "learning_rate": 1.2416108219645005e-07, "epoch": 0.977563103770645, "percentage": 97.76, "elapsed_time": "3 days, 2:37:06", "remaining_time": "1:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9412, "total_steps": 9627, "loss": 1.5935, "learning_rate": 1.2301457429892972e-07, "epoch": 0.9776669782902254, "percentage": 97.77, "elapsed_time": "3 days, 2:37:38", "remaining_time": "1:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9413, "total_steps": 9627, "loss": 1.457, "learning_rate": 1.2187337791129682e-07, "epoch": 0.9777708528098058, "percentage": 97.78, "elapsed_time": "3 days, 2:38:10", "remaining_time": "1:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9414, "total_steps": 9627, "loss": 1.6821, "learning_rate": 1.2073749315508754e-07, "epoch": 0.9778747273293861, "percentage": 97.79, "elapsed_time": "3 days, 2:38:42", "remaining_time": "1:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9415, "total_steps": 9627, "loss": 1.7259, "learning_rate": 1.1960692015126062e-07, "epoch": 0.9779786018489665, "percentage": 97.8, "elapsed_time": "3 days, 2:39:14", "remaining_time": "1:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9416, "total_steps": 9627, "loss": 1.4451, "learning_rate": 1.1848165902021424e-07, "epoch": 0.9780824763685468, "percentage": 97.81, "elapsed_time": "3 days, 2:39:45", "remaining_time": "1:40:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9417, "total_steps": 9627, "loss": 1.6452, "learning_rate": 1.1736170988178585e-07, "epoch": 0.9781863508881271, "percentage": 97.82, "elapsed_time": "3 days, 2:40:17", "remaining_time": "1:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9418, "total_steps": 9627, "loss": 1.811, "learning_rate": 1.1624707285523006e-07, "epoch": 0.9782902254077075, "percentage": 97.83, "elapsed_time": "3 days, 2:40:49", "remaining_time": "1:39:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9419, "total_steps": 9627, "loss": 1.4962, "learning_rate": 1.1513774805925748e-07, "epoch": 0.9783940999272879, "percentage": 97.84, "elapsed_time": "3 days, 2:41:21", "remaining_time": "1:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9420, "total_steps": 9627, "loss": 1.4053, "learning_rate": 1.1403373561199582e-07, "epoch": 0.9784979744468681, "percentage": 97.85, "elapsed_time": "3 days, 2:41:53", "remaining_time": "1:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9421, "total_steps": 9627, "loss": 1.6545, "learning_rate": 1.1293503563101216e-07, "epoch": 0.9786018489664485, "percentage": 97.86, "elapsed_time": "3 days, 2:42:25", "remaining_time": "1:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9422, "total_steps": 9627, "loss": 1.6459, "learning_rate": 1.1184164823331844e-07, "epoch": 0.9787057234860289, "percentage": 97.87, "elapsed_time": "3 days, 2:42:57", "remaining_time": "1:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9423, "total_steps": 9627, "loss": 1.5921, "learning_rate": 1.1075357353534377e-07, "epoch": 0.9788095980056092, "percentage": 97.88, "elapsed_time": "3 days, 2:43:29", "remaining_time": "1:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9424, "total_steps": 9627, "loss": 1.8106, "learning_rate": 1.0967081165296211e-07, "epoch": 0.9789134725251896, "percentage": 97.89, "elapsed_time": "3 days, 2:44:02", "remaining_time": "1:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9425, "total_steps": 9627, "loss": 1.6446, "learning_rate": 1.0859336270148124e-07, "epoch": 0.97901734704477, "percentage": 97.9, "elapsed_time": "3 days, 2:44:33", "remaining_time": "1:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9426, "total_steps": 9627, "loss": 1.6376, "learning_rate": 1.0752122679563714e-07, "epoch": 0.9791212215643502, "percentage": 97.91, "elapsed_time": "3 days, 2:45:05", "remaining_time": "1:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9427, "total_steps": 9627, "loss": 1.6317, "learning_rate": 1.0645440404960517e-07, "epoch": 0.9792250960839306, "percentage": 97.92, "elapsed_time": "3 days, 2:45:37", "remaining_time": "1:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9428, "total_steps": 9627, "loss": 1.918, "learning_rate": 1.0539289457699442e-07, "epoch": 0.979328970603511, "percentage": 97.93, "elapsed_time": "3 days, 2:46:09", "remaining_time": "1:34:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9429, "total_steps": 9627, "loss": 1.5551, "learning_rate": 1.0433669849085336e-07, "epoch": 0.9794328451230913, "percentage": 97.94, "elapsed_time": "3 days, 2:46:41", "remaining_time": "1:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9430, "total_steps": 9627, "loss": 1.7375, "learning_rate": 1.032858159036476e-07, "epoch": 0.9795367196426716, "percentage": 97.95, "elapsed_time": "3 days, 2:47:13", "remaining_time": "1:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9431, "total_steps": 9627, "loss": 1.5334, "learning_rate": 1.0224024692729317e-07, "epoch": 0.979640594162252, "percentage": 97.96, "elapsed_time": "3 days, 2:47:45", "remaining_time": "1:33:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9432, "total_steps": 9627, "loss": 1.4757, "learning_rate": 1.0119999167313988e-07, "epoch": 0.9797444686818323, "percentage": 97.97, "elapsed_time": "3 days, 2:48:18", "remaining_time": "1:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9433, "total_steps": 9627, "loss": 1.5889, "learning_rate": 1.0016505025195467e-07, "epoch": 0.9798483432014127, "percentage": 97.98, "elapsed_time": "3 days, 2:48:50", "remaining_time": "1:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9434, "total_steps": 9627, "loss": 1.654, "learning_rate": 9.913542277396604e-08, "epoch": 0.9799522177209931, "percentage": 98.0, "elapsed_time": "3 days, 2:49:22", "remaining_time": "1:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9435, "total_steps": 9627, "loss": 1.4344, "learning_rate": 9.811110934880296e-08, "epoch": 0.9800560922405734, "percentage": 98.01, "elapsed_time": "3 days, 2:49:54", "remaining_time": "1:31:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9436, "total_steps": 9627, "loss": 1.8921, "learning_rate": 9.709211008556707e-08, "epoch": 0.9801599667601537, "percentage": 98.02, "elapsed_time": "3 days, 2:50:27", "remaining_time": "1:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9437, "total_steps": 9627, "loss": 1.6439, "learning_rate": 9.607842509275489e-08, "epoch": 0.9802638412797341, "percentage": 98.03, "elapsed_time": "3 days, 2:50:58", "remaining_time": "1:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9438, "total_steps": 9627, "loss": 1.8815, "learning_rate": 9.507005447833007e-08, "epoch": 0.9803677157993145, "percentage": 98.04, "elapsed_time": "3 days, 2:51:31", "remaining_time": "1:29:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9439, "total_steps": 9627, "loss": 1.4922, "learning_rate": 9.406699834967337e-08, "epoch": 0.9804715903188947, "percentage": 98.05, "elapsed_time": "3 days, 2:52:03", "remaining_time": "1:29:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9440, "total_steps": 9627, "loss": 1.6177, "learning_rate": 9.306925681359935e-08, "epoch": 0.9805754648384751, "percentage": 98.06, "elapsed_time": "3 days, 2:52:35", "remaining_time": "1:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9441, "total_steps": 9627, "loss": 1.6836, "learning_rate": 9.207682997635636e-08, "epoch": 0.9806793393580555, "percentage": 98.07, "elapsed_time": "3 days, 2:53:07", "remaining_time": "1:28:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9442, "total_steps": 9627, "loss": 1.6061, "learning_rate": 9.108971794363763e-08, "epoch": 0.9807832138776358, "percentage": 98.08, "elapsed_time": "3 days, 2:53:39", "remaining_time": "1:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9443, "total_steps": 9627, "loss": 1.5034, "learning_rate": 9.010792082055908e-08, "epoch": 0.9808870883972162, "percentage": 98.09, "elapsed_time": "3 days, 2:54:12", "remaining_time": "1:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9444, "total_steps": 9627, "loss": 1.5912, "learning_rate": 8.91314387116704e-08, "epoch": 0.9809909629167965, "percentage": 98.1, "elapsed_time": "3 days, 2:54:44", "remaining_time": "1:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9445, "total_steps": 9627, "loss": 1.6321, "learning_rate": 8.81602717209662e-08, "epoch": 0.9810948374363768, "percentage": 98.11, "elapsed_time": "3 days, 2:55:17", "remaining_time": "1:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9446, "total_steps": 9627, "loss": 1.6572, "learning_rate": 8.719441995186928e-08, "epoch": 0.9811987119559572, "percentage": 98.12, "elapsed_time": "3 days, 2:55:48", "remaining_time": "1:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9447, "total_steps": 9627, "loss": 1.6643, "learning_rate": 8.623388350722517e-08, "epoch": 0.9813025864755376, "percentage": 98.13, "elapsed_time": "3 days, 2:56:20", "remaining_time": "1:25:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9448, "total_steps": 9627, "loss": 1.4247, "learning_rate": 8.527866248933536e-08, "epoch": 0.9814064609951179, "percentage": 98.14, "elapsed_time": "3 days, 2:56:53", "remaining_time": "1:25:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9449, "total_steps": 9627, "loss": 1.4757, "learning_rate": 8.432875699991849e-08, "epoch": 0.9815103355146982, "percentage": 98.15, "elapsed_time": "3 days, 2:57:25", "remaining_time": "1:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9450, "total_steps": 9627, "loss": 1.6738, "learning_rate": 8.338416714013253e-08, "epoch": 0.9816142100342786, "percentage": 98.16, "elapsed_time": "3 days, 2:57:57", "remaining_time": "1:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9451, "total_steps": 9627, "loss": 1.5149, "learning_rate": 8.244489301056368e-08, "epoch": 0.9817180845538589, "percentage": 98.17, "elapsed_time": "3 days, 2:58:29", "remaining_time": "1:23:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9452, "total_steps": 9627, "loss": 1.6678, "learning_rate": 8.151093471124305e-08, "epoch": 0.9818219590734393, "percentage": 98.18, "elapsed_time": "3 days, 2:59:02", "remaining_time": "1:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9453, "total_steps": 9627, "loss": 1.5014, "learning_rate": 8.058229234162995e-08, "epoch": 0.9819258335930197, "percentage": 98.19, "elapsed_time": "3 days, 2:59:34", "remaining_time": "1:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9454, "total_steps": 9627, "loss": 1.6016, "learning_rate": 7.965896600061751e-08, "epoch": 0.9820297081125999, "percentage": 98.2, "elapsed_time": "3 days, 3:00:06", "remaining_time": "1:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9455, "total_steps": 9627, "loss": 1.6684, "learning_rate": 7.874095578653263e-08, "epoch": 0.9821335826321803, "percentage": 98.21, "elapsed_time": "3 days, 3:00:38", "remaining_time": "1:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9456, "total_steps": 9627, "loss": 1.5004, "learning_rate": 7.782826179713043e-08, "epoch": 0.9822374571517607, "percentage": 98.22, "elapsed_time": "3 days, 3:01:10", "remaining_time": "1:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9457, "total_steps": 9627, "loss": 1.8254, "learning_rate": 7.692088412961096e-08, "epoch": 0.982341331671341, "percentage": 98.23, "elapsed_time": "3 days, 3:01:43", "remaining_time": "1:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9458, "total_steps": 9627, "loss": 1.577, "learning_rate": 7.601882288060247e-08, "epoch": 0.9824452061909213, "percentage": 98.24, "elapsed_time": "3 days, 3:02:15", "remaining_time": "1:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9459, "total_steps": 9627, "loss": 1.6106, "learning_rate": 7.512207814617256e-08, "epoch": 0.9825490807105017, "percentage": 98.25, "elapsed_time": "3 days, 3:02:47", "remaining_time": "1:19:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9460, "total_steps": 9627, "loss": 1.6185, "learning_rate": 7.423065002180596e-08, "epoch": 0.9826529552300821, "percentage": 98.27, "elapsed_time": "3 days, 3:03:19", "remaining_time": "1:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9461, "total_steps": 9627, "loss": 1.5966, "learning_rate": 7.334453860244339e-08, "epoch": 0.9827568297496624, "percentage": 98.28, "elapsed_time": "3 days, 3:03:52", "remaining_time": "1:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9462, "total_steps": 9627, "loss": 1.5905, "learning_rate": 7.24637439824427e-08, "epoch": 0.9828607042692428, "percentage": 98.29, "elapsed_time": "3 days, 3:04:24", "remaining_time": "1:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9463, "total_steps": 9627, "loss": 1.6842, "learning_rate": 7.158826625560112e-08, "epoch": 0.9829645787888232, "percentage": 98.3, "elapsed_time": "3 days, 3:04:57", "remaining_time": "1:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9464, "total_steps": 9627, "loss": 1.6072, "learning_rate": 7.071810551516067e-08, "epoch": 0.9830684533084034, "percentage": 98.31, "elapsed_time": "3 days, 3:05:28", "remaining_time": "1:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9465, "total_steps": 9627, "loss": 1.6148, "learning_rate": 6.98532618537695e-08, "epoch": 0.9831723278279838, "percentage": 98.32, "elapsed_time": "3 days, 3:06:01", "remaining_time": "1:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9466, "total_steps": 9627, "loss": 1.693, "learning_rate": 6.899373536354282e-08, "epoch": 0.9832762023475642, "percentage": 98.33, "elapsed_time": "3 days, 3:06:33", "remaining_time": "1:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9467, "total_steps": 9627, "loss": 1.896, "learning_rate": 6.813952613600183e-08, "epoch": 0.9833800768671445, "percentage": 98.34, "elapsed_time": "3 days, 3:07:05", "remaining_time": "1:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9468, "total_steps": 9627, "loss": 1.6331, "learning_rate": 6.729063426211824e-08, "epoch": 0.9834839513867248, "percentage": 98.35, "elapsed_time": "3 days, 3:07:38", "remaining_time": "1:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9469, "total_steps": 9627, "loss": 1.6337, "learning_rate": 6.644705983229194e-08, "epoch": 0.9835878259063052, "percentage": 98.36, "elapsed_time": "3 days, 3:08:10", "remaining_time": "1:15:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9470, "total_steps": 9627, "loss": 1.7527, "learning_rate": 6.560880293636218e-08, "epoch": 0.9836917004258855, "percentage": 98.37, "elapsed_time": "3 days, 3:08:42", "remaining_time": "1:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9471, "total_steps": 9627, "loss": 1.6945, "learning_rate": 6.477586366358535e-08, "epoch": 0.9837955749454659, "percentage": 98.38, "elapsed_time": "3 days, 3:09:14", "remaining_time": "1:14:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9472, "total_steps": 9627, "loss": 1.4567, "learning_rate": 6.394824210266826e-08, "epoch": 0.9838994494650463, "percentage": 98.39, "elapsed_time": "3 days, 3:09:47", "remaining_time": "1:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9473, "total_steps": 9627, "loss": 1.5229, "learning_rate": 6.312593834175152e-08, "epoch": 0.9840033239846265, "percentage": 98.4, "elapsed_time": "3 days, 3:10:19", "remaining_time": "1:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9474, "total_steps": 9627, "loss": 1.5506, "learning_rate": 6.230895246840396e-08, "epoch": 0.9841071985042069, "percentage": 98.41, "elapsed_time": "3 days, 3:10:51", "remaining_time": "1:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9475, "total_steps": 9627, "loss": 1.6544, "learning_rate": 6.149728456961712e-08, "epoch": 0.9842110730237873, "percentage": 98.42, "elapsed_time": "3 days, 3:11:23", "remaining_time": "1:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9476, "total_steps": 9627, "loss": 1.7364, "learning_rate": 6.069093473183296e-08, "epoch": 0.9843149475433676, "percentage": 98.43, "elapsed_time": "3 days, 3:11:56", "remaining_time": "1:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9477, "total_steps": 9627, "loss": 1.5175, "learning_rate": 5.988990304092724e-08, "epoch": 0.984418822062948, "percentage": 98.44, "elapsed_time": "3 days, 3:12:28", "remaining_time": "1:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9478, "total_steps": 9627, "loss": 1.6242, "learning_rate": 5.9094189582198366e-08, "epoch": 0.9845226965825283, "percentage": 98.45, "elapsed_time": "3 days, 3:13:00", "remaining_time": "1:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9479, "total_steps": 9627, "loss": 1.6943, "learning_rate": 5.830379444038414e-08, "epoch": 0.9846265711021086, "percentage": 98.46, "elapsed_time": "3 days, 3:13:32", "remaining_time": "1:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9480, "total_steps": 9627, "loss": 1.5377, "learning_rate": 5.751871769965056e-08, "epoch": 0.984730445621689, "percentage": 98.47, "elapsed_time": "3 days, 3:14:05", "remaining_time": "1:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9481, "total_steps": 9627, "loss": 1.7265, "learning_rate": 5.673895944361407e-08, "epoch": 0.9848343201412694, "percentage": 98.48, "elapsed_time": "3 days, 3:14:37", "remaining_time": "1:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9482, "total_steps": 9627, "loss": 1.6865, "learning_rate": 5.59645197553027e-08, "epoch": 0.9849381946608496, "percentage": 98.49, "elapsed_time": "3 days, 3:15:09", "remaining_time": "1:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9483, "total_steps": 9627, "loss": 1.8202, "learning_rate": 5.5195398717194926e-08, "epoch": 0.98504206918043, "percentage": 98.5, "elapsed_time": "3 days, 3:15:42", "remaining_time": "1:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9484, "total_steps": 9627, "loss": 1.6619, "learning_rate": 5.443159641118634e-08, "epoch": 0.9851459437000104, "percentage": 98.51, "elapsed_time": "3 days, 3:16:14", "remaining_time": "1:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9485, "total_steps": 9627, "loss": 1.7641, "learning_rate": 5.367311291862853e-08, "epoch": 0.9852498182195908, "percentage": 98.52, "elapsed_time": "3 days, 3:16:46", "remaining_time": "1:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9486, "total_steps": 9627, "loss": 1.5296, "learning_rate": 5.291994832028469e-08, "epoch": 0.9853536927391711, "percentage": 98.54, "elapsed_time": "3 days, 3:17:18", "remaining_time": "1:07:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9487, "total_steps": 9627, "loss": 1.4804, "learning_rate": 5.217210269636286e-08, "epoch": 0.9854575672587514, "percentage": 98.55, "elapsed_time": "3 days, 3:17:50", "remaining_time": "1:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9488, "total_steps": 9627, "loss": 1.5122, "learning_rate": 5.1429576126504895e-08, "epoch": 0.9855614417783318, "percentage": 98.56, "elapsed_time": "3 days, 3:18:23", "remaining_time": "1:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9489, "total_steps": 9627, "loss": 1.5971, "learning_rate": 5.069236868978644e-08, "epoch": 0.9856653162979121, "percentage": 98.57, "elapsed_time": "3 days, 3:18:55", "remaining_time": "1:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9490, "total_steps": 9627, "loss": 1.6514, "learning_rate": 4.996048046471136e-08, "epoch": 0.9857691908174925, "percentage": 98.58, "elapsed_time": "3 days, 3:19:27", "remaining_time": "1:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9491, "total_steps": 9627, "loss": 1.6722, "learning_rate": 4.923391152921175e-08, "epoch": 0.9858730653370729, "percentage": 98.59, "elapsed_time": "3 days, 3:19:59", "remaining_time": "1:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9492, "total_steps": 9627, "loss": 1.6484, "learning_rate": 4.851266196068127e-08, "epoch": 0.9859769398566531, "percentage": 98.6, "elapsed_time": "3 days, 3:20:31", "remaining_time": "1:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9493, "total_steps": 9627, "loss": 1.8121, "learning_rate": 4.779673183590849e-08, "epoch": 0.9860808143762335, "percentage": 98.61, "elapsed_time": "3 days, 3:21:03", "remaining_time": "1:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9494, "total_steps": 9627, "loss": 1.7639, "learning_rate": 4.708612123114353e-08, "epoch": 0.9861846888958139, "percentage": 98.62, "elapsed_time": "3 days, 3:21:36", "remaining_time": "1:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9495, "total_steps": 9627, "loss": 1.7797, "learning_rate": 4.638083022205364e-08, "epoch": 0.9862885634153942, "percentage": 98.63, "elapsed_time": "3 days, 3:22:08", "remaining_time": "1:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9496, "total_steps": 9627, "loss": 1.6323, "learning_rate": 4.56808588837565e-08, "epoch": 0.9863924379349746, "percentage": 98.64, "elapsed_time": "3 days, 3:22:40", "remaining_time": "1:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9497, "total_steps": 9627, "loss": 1.7339, "learning_rate": 4.4986207290792505e-08, "epoch": 0.9864963124545549, "percentage": 98.65, "elapsed_time": "3 days, 3:23:12", "remaining_time": "1:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9498, "total_steps": 9627, "loss": 1.6974, "learning_rate": 4.4296875517130243e-08, "epoch": 0.9866001869741352, "percentage": 98.66, "elapsed_time": "3 days, 3:23:45", "remaining_time": "1:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9499, "total_steps": 9627, "loss": 1.5564, "learning_rate": 4.361286363618322e-08, "epoch": 0.9867040614937156, "percentage": 98.67, "elapsed_time": "3 days, 3:24:17", "remaining_time": "1:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9500, "total_steps": 9627, "loss": 1.5828, "learning_rate": 4.293417172078762e-08, "epoch": 0.986807936013296, "percentage": 98.68, "elapsed_time": "3 days, 3:24:50", "remaining_time": "1:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9501, "total_steps": 9627, "loss": 1.5301, "learning_rate": 4.226079984322451e-08, "epoch": 0.9869118105328762, "percentage": 98.69, "elapsed_time": "3 days, 3:25:22", "remaining_time": "1:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9502, "total_steps": 9627, "loss": 1.6214, "learning_rate": 4.159274807520319e-08, "epoch": 0.9870156850524566, "percentage": 98.7, "elapsed_time": "3 days, 3:25:55", "remaining_time": "0:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9503, "total_steps": 9627, "loss": 1.7306, "learning_rate": 4.0930016487861214e-08, "epoch": 0.987119559572037, "percentage": 98.71, "elapsed_time": "3 days, 3:26:27", "remaining_time": "0:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9504, "total_steps": 9627, "loss": 1.8203, "learning_rate": 4.027260515177544e-08, "epoch": 0.9872234340916173, "percentage": 98.72, "elapsed_time": "3 days, 3:26:59", "remaining_time": "0:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9505, "total_steps": 9627, "loss": 1.5731, "learning_rate": 3.962051413695656e-08, "epoch": 0.9873273086111977, "percentage": 98.73, "elapsed_time": "3 days, 3:27:31", "remaining_time": "0:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9506, "total_steps": 9627, "loss": 1.7339, "learning_rate": 3.897374351284899e-08, "epoch": 0.987431183130778, "percentage": 98.74, "elapsed_time": "3 days, 3:28:03", "remaining_time": "0:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9507, "total_steps": 9627, "loss": 1.993, "learning_rate": 3.8332293348325444e-08, "epoch": 0.9875350576503583, "percentage": 98.75, "elapsed_time": "3 days, 3:28:35", "remaining_time": "0:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9508, "total_steps": 9627, "loss": 1.708, "learning_rate": 3.769616371169793e-08, "epoch": 0.9876389321699387, "percentage": 98.76, "elapsed_time": "3 days, 3:29:07", "remaining_time": "0:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9509, "total_steps": 9627, "loss": 1.9389, "learning_rate": 3.706535467070671e-08, "epoch": 0.9877428066895191, "percentage": 98.77, "elapsed_time": "3 days, 3:29:39", "remaining_time": "0:56:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9510, "total_steps": 9627, "loss": 1.6609, "learning_rate": 3.6439866292531376e-08, "epoch": 0.9878466812090994, "percentage": 98.78, "elapsed_time": "3 days, 3:30:11", "remaining_time": "0:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9511, "total_steps": 9627, "loss": 1.7568, "learning_rate": 3.5819698643779764e-08, "epoch": 0.9879505557286797, "percentage": 98.8, "elapsed_time": "3 days, 3:30:43", "remaining_time": "0:55:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9512, "total_steps": 9627, "loss": 1.6101, "learning_rate": 3.520485179048794e-08, "epoch": 0.9880544302482601, "percentage": 98.81, "elapsed_time": "3 days, 3:31:16", "remaining_time": "0:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9513, "total_steps": 9627, "loss": 1.7143, "learning_rate": 3.459532579814795e-08, "epoch": 0.9881583047678405, "percentage": 98.82, "elapsed_time": "3 days, 3:31:47", "remaining_time": "0:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9514, "total_steps": 9627, "loss": 1.5954, "learning_rate": 3.399112073165789e-08, "epoch": 0.9882621792874208, "percentage": 98.83, "elapsed_time": "3 days, 3:32:20", "remaining_time": "0:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9515, "total_steps": 9627, "loss": 1.8197, "learning_rate": 3.339223665536073e-08, "epoch": 0.9883660538070012, "percentage": 98.84, "elapsed_time": "3 days, 3:32:52", "remaining_time": "0:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9516, "total_steps": 9627, "loss": 1.6981, "learning_rate": 3.279867363303879e-08, "epoch": 0.9884699283265815, "percentage": 98.85, "elapsed_time": "3 days, 3:33:23", "remaining_time": "0:52:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9517, "total_steps": 9627, "loss": 1.5851, "learning_rate": 3.221043172789706e-08, "epoch": 0.9885738028461618, "percentage": 98.86, "elapsed_time": "3 days, 3:33:56", "remaining_time": "0:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9518, "total_steps": 9627, "loss": 1.6064, "learning_rate": 3.162751100257988e-08, "epoch": 0.9886776773657422, "percentage": 98.87, "elapsed_time": "3 days, 3:34:27", "remaining_time": "0:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9519, "total_steps": 9627, "loss": 1.6993, "learning_rate": 3.1049911519165365e-08, "epoch": 0.9887815518853226, "percentage": 98.88, "elapsed_time": "3 days, 3:34:59", "remaining_time": "0:51:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9520, "total_steps": 9627, "loss": 1.6729, "learning_rate": 3.047763333916542e-08, "epoch": 0.9888854264049028, "percentage": 98.89, "elapsed_time": "3 days, 3:35:32", "remaining_time": "0:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9521, "total_steps": 9627, "loss": 1.6401, "learning_rate": 2.991067652351465e-08, "epoch": 0.9889893009244832, "percentage": 98.9, "elapsed_time": "3 days, 3:36:04", "remaining_time": "0:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9522, "total_steps": 9627, "loss": 1.6012, "learning_rate": 2.9349041132598065e-08, "epoch": 0.9890931754440636, "percentage": 98.91, "elapsed_time": "3 days, 3:36:35", "remaining_time": "0:50:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9523, "total_steps": 9627, "loss": 1.5285, "learning_rate": 2.8792727226223393e-08, "epoch": 0.9891970499636439, "percentage": 98.92, "elapsed_time": "3 days, 3:37:08", "remaining_time": "0:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9524, "total_steps": 9627, "loss": 1.7036, "learning_rate": 2.824173486363213e-08, "epoch": 0.9893009244832243, "percentage": 98.93, "elapsed_time": "3 days, 3:37:40", "remaining_time": "0:49:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9525, "total_steps": 9627, "loss": 1.7136, "learning_rate": 2.7696064103505116e-08, "epoch": 0.9894047990028046, "percentage": 98.94, "elapsed_time": "3 days, 3:38:13", "remaining_time": "0:48:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9526, "total_steps": 9627, "loss": 1.6265, "learning_rate": 2.715571500394587e-08, "epoch": 0.9895086735223849, "percentage": 98.95, "elapsed_time": "3 days, 3:38:45", "remaining_time": "0:48:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9527, "total_steps": 9627, "loss": 1.6818, "learning_rate": 2.6620687622497255e-08, "epoch": 0.9896125480419653, "percentage": 98.96, "elapsed_time": "3 days, 3:39:17", "remaining_time": "0:47:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9528, "total_steps": 9627, "loss": 1.6076, "learning_rate": 2.609098201613591e-08, "epoch": 0.9897164225615457, "percentage": 98.97, "elapsed_time": "3 days, 3:39:48", "remaining_time": "0:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9529, "total_steps": 9627, "loss": 1.6429, "learning_rate": 2.556659824127783e-08, "epoch": 0.989820297081126, "percentage": 98.98, "elapsed_time": "3 days, 3:40:20", "remaining_time": "0:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9530, "total_steps": 9627, "loss": 1.5681, "learning_rate": 2.504753635376167e-08, "epoch": 0.9899241716007063, "percentage": 98.99, "elapsed_time": "3 days, 3:40:52", "remaining_time": "0:46:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9531, "total_steps": 9627, "loss": 1.6556, "learning_rate": 2.453379640886544e-08, "epoch": 0.9900280461202867, "percentage": 99.0, "elapsed_time": "3 days, 3:41:23", "remaining_time": "0:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9532, "total_steps": 9627, "loss": 1.502, "learning_rate": 2.4025378461289828e-08, "epoch": 0.990131920639867, "percentage": 99.01, "elapsed_time": "3 days, 3:41:56", "remaining_time": "0:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9533, "total_steps": 9627, "loss": 1.6831, "learning_rate": 2.352228256519151e-08, "epoch": 0.9902357951594474, "percentage": 99.02, "elapsed_time": "3 days, 3:42:27", "remaining_time": "0:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9534, "total_steps": 9627, "loss": 1.6327, "learning_rate": 2.3024508774133204e-08, "epoch": 0.9903396696790278, "percentage": 99.03, "elapsed_time": "3 days, 3:42:59", "remaining_time": "0:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9535, "total_steps": 9627, "loss": 1.5492, "learning_rate": 2.2532057141128048e-08, "epoch": 0.990443544198608, "percentage": 99.04, "elapsed_time": "3 days, 3:43:30", "remaining_time": "0:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9536, "total_steps": 9627, "loss": 1.5991, "learning_rate": 2.2044927718622987e-08, "epoch": 0.9905474187181884, "percentage": 99.05, "elapsed_time": "3 days, 3:44:03", "remaining_time": "0:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9537, "total_steps": 9627, "loss": 1.5447, "learning_rate": 2.1563120558487638e-08, "epoch": 0.9906512932377688, "percentage": 99.07, "elapsed_time": "3 days, 3:44:35", "remaining_time": "0:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9538, "total_steps": 9627, "loss": 1.6873, "learning_rate": 2.1086635712036507e-08, "epoch": 0.9907551677573492, "percentage": 99.08, "elapsed_time": "3 days, 3:45:05", "remaining_time": "0:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9539, "total_steps": 9627, "loss": 1.7317, "learning_rate": 2.061547323000679e-08, "epoch": 0.9908590422769294, "percentage": 99.09, "elapsed_time": "3 days, 3:45:38", "remaining_time": "0:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9540, "total_steps": 9627, "loss": 1.5926, "learning_rate": 2.014963316257501e-08, "epoch": 0.9909629167965098, "percentage": 99.1, "elapsed_time": "3 days, 3:46:09", "remaining_time": "0:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9541, "total_steps": 9627, "loss": 1.5653, "learning_rate": 1.9689115559345938e-08, "epoch": 0.9910667913160902, "percentage": 99.11, "elapsed_time": "3 days, 3:46:41", "remaining_time": "0:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9542, "total_steps": 9627, "loss": 1.5923, "learning_rate": 1.9233920469369225e-08, "epoch": 0.9911706658356705, "percentage": 99.12, "elapsed_time": "3 days, 3:47:14", "remaining_time": "0:40:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9543, "total_steps": 9627, "loss": 1.7091, "learning_rate": 1.878404794111166e-08, "epoch": 0.9912745403552509, "percentage": 99.13, "elapsed_time": "3 days, 3:47:46", "remaining_time": "0:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9544, "total_steps": 9627, "loss": 1.7469, "learning_rate": 1.8339498022490465e-08, "epoch": 0.9913784148748312, "percentage": 99.14, "elapsed_time": "3 days, 3:48:17", "remaining_time": "0:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9545, "total_steps": 9627, "loss": 1.6314, "learning_rate": 1.790027076083445e-08, "epoch": 0.9914822893944115, "percentage": 99.15, "elapsed_time": "3 days, 3:48:49", "remaining_time": "0:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9546, "total_steps": 9627, "loss": 1.6766, "learning_rate": 1.7466366202928408e-08, "epoch": 0.9915861639139919, "percentage": 99.16, "elapsed_time": "3 days, 3:49:21", "remaining_time": "0:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9547, "total_steps": 9627, "loss": 1.6412, "learning_rate": 1.7037784394968724e-08, "epoch": 0.9916900384335723, "percentage": 99.17, "elapsed_time": "3 days, 3:49:54", "remaining_time": "0:38:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9548, "total_steps": 9627, "loss": 1.5854, "learning_rate": 1.6614525382613323e-08, "epoch": 0.9917939129531526, "percentage": 99.18, "elapsed_time": "3 days, 3:50:26", "remaining_time": "0:37:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9549, "total_steps": 9627, "loss": 1.5208, "learning_rate": 1.6196589210915046e-08, "epoch": 0.9918977874727329, "percentage": 99.19, "elapsed_time": "3 days, 3:50:58", "remaining_time": "0:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9550, "total_steps": 9627, "loss": 1.8193, "learning_rate": 1.5783975924399398e-08, "epoch": 0.9920016619923133, "percentage": 99.2, "elapsed_time": "3 days, 3:51:30", "remaining_time": "0:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9551, "total_steps": 9627, "loss": 1.5834, "learning_rate": 1.5376685566992345e-08, "epoch": 0.9921055365118936, "percentage": 99.21, "elapsed_time": "3 days, 3:52:03", "remaining_time": "0:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9552, "total_steps": 9627, "loss": 1.5352, "learning_rate": 1.4974718182075853e-08, "epoch": 0.992209411031474, "percentage": 99.22, "elapsed_time": "3 days, 3:52:34", "remaining_time": "0:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9553, "total_steps": 9627, "loss": 1.6593, "learning_rate": 1.4578073812454574e-08, "epoch": 0.9923132855510544, "percentage": 99.23, "elapsed_time": "3 days, 3:53:05", "remaining_time": "0:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9554, "total_steps": 9627, "loss": 1.7582, "learning_rate": 1.418675250036694e-08, "epoch": 0.9924171600706346, "percentage": 99.24, "elapsed_time": "3 days, 3:53:38", "remaining_time": "0:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9555, "total_steps": 9627, "loss": 1.6358, "learning_rate": 1.3800754287485174e-08, "epoch": 0.992521034590215, "percentage": 99.25, "elapsed_time": "3 days, 3:54:10", "remaining_time": "0:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9556, "total_steps": 9627, "loss": 1.5889, "learning_rate": 1.3420079214915282e-08, "epoch": 0.9926249091097954, "percentage": 99.26, "elapsed_time": "3 days, 3:54:41", "remaining_time": "0:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9557, "total_steps": 9627, "loss": 1.6185, "learning_rate": 1.3044727323202611e-08, "epoch": 0.9927287836293757, "percentage": 99.27, "elapsed_time": "3 days, 3:55:13", "remaining_time": "0:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9558, "total_steps": 9627, "loss": 1.6872, "learning_rate": 1.2674698652304085e-08, "epoch": 0.992832658148956, "percentage": 99.28, "elapsed_time": "3 days, 3:55:45", "remaining_time": "0:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9559, "total_steps": 9627, "loss": 1.7338, "learning_rate": 1.2309993241638173e-08, "epoch": 0.9929365326685364, "percentage": 99.29, "elapsed_time": "3 days, 3:56:17", "remaining_time": "0:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9560, "total_steps": 9627, "loss": 1.8372, "learning_rate": 1.1950611130040479e-08, "epoch": 0.9930404071881167, "percentage": 99.3, "elapsed_time": "3 days, 3:56:49", "remaining_time": "0:31:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9561, "total_steps": 9627, "loss": 1.5309, "learning_rate": 1.1596552355780388e-08, "epoch": 0.9931442817076971, "percentage": 99.31, "elapsed_time": "3 days, 3:57:21", "remaining_time": "0:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9562, "total_steps": 9627, "loss": 1.6077, "learning_rate": 1.1247816956561075e-08, "epoch": 0.9932481562272775, "percentage": 99.32, "elapsed_time": "3 days, 3:57:53", "remaining_time": "0:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9563, "total_steps": 9627, "loss": 1.6831, "learning_rate": 1.0904404969525051e-08, "epoch": 0.9933520307468579, "percentage": 99.34, "elapsed_time": "3 days, 3:58:25", "remaining_time": "0:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9564, "total_steps": 9627, "loss": 1.7443, "learning_rate": 1.0566316431237511e-08, "epoch": 0.9934559052664381, "percentage": 99.35, "elapsed_time": "3 days, 3:58:57", "remaining_time": "0:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9565, "total_steps": 9627, "loss": 1.7238, "learning_rate": 1.0233551377702988e-08, "epoch": 0.9935597797860185, "percentage": 99.36, "elapsed_time": "3 days, 3:59:29", "remaining_time": "0:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9566, "total_steps": 9627, "loss": 1.6286, "learning_rate": 9.906109844359802e-09, "epoch": 0.9936636543055989, "percentage": 99.37, "elapsed_time": "3 days, 4:00:00", "remaining_time": "0:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9567, "total_steps": 9627, "loss": 1.5039, "learning_rate": 9.583991866080055e-09, "epoch": 0.9937675288251792, "percentage": 99.38, "elapsed_time": "3 days, 4:00:33", "remaining_time": "0:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9568, "total_steps": 9627, "loss": 1.6008, "learning_rate": 9.267197477169643e-09, "epoch": 0.9938714033447595, "percentage": 99.39, "elapsed_time": "3 days, 4:01:04", "remaining_time": "0:28:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9569, "total_steps": 9627, "loss": 1.6676, "learning_rate": 8.955726711351586e-09, "epoch": 0.9939752778643399, "percentage": 99.4, "elapsed_time": "3 days, 4:01:36", "remaining_time": "0:27:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9570, "total_steps": 9627, "loss": 1.4568, "learning_rate": 8.649579601810453e-09, "epoch": 0.9940791523839202, "percentage": 99.41, "elapsed_time": "3 days, 4:02:08", "remaining_time": "0:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9571, "total_steps": 9627, "loss": 1.7452, "learning_rate": 8.34875618113684e-09, "epoch": 0.9941830269035006, "percentage": 99.42, "elapsed_time": "3 days, 4:02:41", "remaining_time": "0:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9572, "total_steps": 9627, "loss": 1.7141, "learning_rate": 8.053256481371785e-09, "epoch": 0.994286901423081, "percentage": 99.43, "elapsed_time": "3 days, 4:03:11", "remaining_time": "0:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9573, "total_steps": 9627, "loss": 1.7414, "learning_rate": 7.763080533984557e-09, "epoch": 0.9943907759426612, "percentage": 99.44, "elapsed_time": "3 days, 4:03:43", "remaining_time": "0:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9574, "total_steps": 9627, "loss": 1.7477, "learning_rate": 7.478228369872664e-09, "epoch": 0.9944946504622416, "percentage": 99.45, "elapsed_time": "3 days, 4:04:16", "remaining_time": "0:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9575, "total_steps": 9627, "loss": 1.7388, "learning_rate": 7.198700019378502e-09, "epoch": 0.994598524981822, "percentage": 99.46, "elapsed_time": "3 days, 4:04:48", "remaining_time": "0:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9576, "total_steps": 9627, "loss": 1.6223, "learning_rate": 6.924495512256046e-09, "epoch": 0.9947023995014023, "percentage": 99.47, "elapsed_time": "3 days, 4:05:20", "remaining_time": "0:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9577, "total_steps": 9627, "loss": 1.6013, "learning_rate": 6.655614877720817e-09, "epoch": 0.9948062740209827, "percentage": 99.48, "elapsed_time": "3 days, 4:05:50", "remaining_time": "0:23:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9578, "total_steps": 9627, "loss": 1.6791, "learning_rate": 6.392058144394364e-09, "epoch": 0.994910148540563, "percentage": 99.49, "elapsed_time": "3 days, 4:06:23", "remaining_time": "0:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9579, "total_steps": 9627, "loss": 1.6949, "learning_rate": 6.133825340348675e-09, "epoch": 0.9950140230601433, "percentage": 99.5, "elapsed_time": "3 days, 4:06:55", "remaining_time": "0:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9580, "total_steps": 9627, "loss": 1.6022, "learning_rate": 5.8809164930839765e-09, "epoch": 0.9951178975797237, "percentage": 99.51, "elapsed_time": "3 days, 4:07:28", "remaining_time": "0:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9581, "total_steps": 9627, "loss": 1.8264, "learning_rate": 5.6333316295342775e-09, "epoch": 0.9952217720993041, "percentage": 99.52, "elapsed_time": "3 days, 4:07:59", "remaining_time": "0:21:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9582, "total_steps": 9627, "loss": 1.5983, "learning_rate": 5.391070776061824e-09, "epoch": 0.9953256466188843, "percentage": 99.53, "elapsed_time": "3 days, 4:08:31", "remaining_time": "0:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9583, "total_steps": 9627, "loss": 1.6543, "learning_rate": 5.154133958468199e-09, "epoch": 0.9954295211384647, "percentage": 99.54, "elapsed_time": "3 days, 4:09:03", "remaining_time": "0:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9584, "total_steps": 9627, "loss": 1.6388, "learning_rate": 4.922521201988772e-09, "epoch": 0.9955333956580451, "percentage": 99.55, "elapsed_time": "3 days, 4:09:35", "remaining_time": "0:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9585, "total_steps": 9627, "loss": 1.5859, "learning_rate": 4.6962325312760455e-09, "epoch": 0.9956372701776254, "percentage": 99.56, "elapsed_time": "3 days, 4:10:06", "remaining_time": "0:20:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9586, "total_steps": 9627, "loss": 1.8203, "learning_rate": 4.475267970444064e-09, "epoch": 0.9957411446972058, "percentage": 99.57, "elapsed_time": "3 days, 4:10:38", "remaining_time": "0:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9587, "total_steps": 9627, "loss": 1.6721, "learning_rate": 4.259627543012901e-09, "epoch": 0.9958450192167861, "percentage": 99.58, "elapsed_time": "3 days, 4:11:09", "remaining_time": "0:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9588, "total_steps": 9627, "loss": 1.5659, "learning_rate": 4.04931127194752e-09, "epoch": 0.9959488937363664, "percentage": 99.59, "elapsed_time": "3 days, 4:11:41", "remaining_time": "0:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9589, "total_steps": 9627, "loss": 1.6087, "learning_rate": 3.844319179646671e-09, "epoch": 0.9960527682559468, "percentage": 99.61, "elapsed_time": "3 days, 4:12:13", "remaining_time": "0:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9590, "total_steps": 9627, "loss": 1.654, "learning_rate": 3.6446512879428907e-09, "epoch": 0.9961566427755272, "percentage": 99.62, "elapsed_time": "3 days, 4:12:46", "remaining_time": "0:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9591, "total_steps": 9627, "loss": 1.661, "learning_rate": 3.4503076180969486e-09, "epoch": 0.9962605172951076, "percentage": 99.63, "elapsed_time": "3 days, 4:13:18", "remaining_time": "0:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9592, "total_steps": 9627, "loss": 1.6552, "learning_rate": 3.2612881908089533e-09, "epoch": 0.9963643918146878, "percentage": 99.64, "elapsed_time": "3 days, 4:13:50", "remaining_time": "0:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9593, "total_steps": 9627, "loss": 1.6067, "learning_rate": 3.0775930261961462e-09, "epoch": 0.9964682663342682, "percentage": 99.65, "elapsed_time": "3 days, 4:14:22", "remaining_time": "0:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9594, "total_steps": 9627, "loss": 1.6194, "learning_rate": 2.89922214383731e-09, "epoch": 0.9965721408538486, "percentage": 99.66, "elapsed_time": "3 days, 4:14:54", "remaining_time": "0:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9595, "total_steps": 9627, "loss": 1.5895, "learning_rate": 2.726175562711708e-09, "epoch": 0.9966760153734289, "percentage": 99.67, "elapsed_time": "3 days, 4:15:27", "remaining_time": "0:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9596, "total_steps": 9627, "loss": 1.5636, "learning_rate": 2.558453301260144e-09, "epoch": 0.9967798898930093, "percentage": 99.68, "elapsed_time": "3 days, 4:15:59", "remaining_time": "0:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9597, "total_steps": 9627, "loss": 1.6763, "learning_rate": 2.3960553773350046e-09, "epoch": 0.9968837644125896, "percentage": 99.69, "elapsed_time": "3 days, 4:16:29", "remaining_time": "0:14:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9598, "total_steps": 9627, "loss": 1.6111, "learning_rate": 2.2389818082335645e-09, "epoch": 0.9969876389321699, "percentage": 99.7, "elapsed_time": "3 days, 4:17:02", "remaining_time": "0:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9599, "total_steps": 9627, "loss": 1.7814, "learning_rate": 2.0872326106868845e-09, "epoch": 0.9970915134517503, "percentage": 99.71, "elapsed_time": "3 days, 4:17:34", "remaining_time": "0:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9600, "total_steps": 9627, "loss": 1.6691, "learning_rate": 1.9408078008431586e-09, "epoch": 0.9971953879713307, "percentage": 99.72, "elapsed_time": "3 days, 4:18:06", "remaining_time": "0:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9601, "total_steps": 9627, "loss": 1.6991, "learning_rate": 1.7997073943121222e-09, "epoch": 0.9972992624909109, "percentage": 99.73, "elapsed_time": "3 days, 4:18:38", "remaining_time": "0:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9602, "total_steps": 9627, "loss": 1.6752, "learning_rate": 1.6639314061095422e-09, "epoch": 0.9974031370104913, "percentage": 99.74, "elapsed_time": "3 days, 4:19:10", "remaining_time": "0:11:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9603, "total_steps": 9627, "loss": 1.4994, "learning_rate": 1.5334798506905224e-09, "epoch": 0.9975070115300717, "percentage": 99.75, "elapsed_time": "3 days, 4:19:41", "remaining_time": "0:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9604, "total_steps": 9627, "loss": 1.8033, "learning_rate": 1.4083527419606058e-09, "epoch": 0.997610886049652, "percentage": 99.76, "elapsed_time": "3 days, 4:20:14", "remaining_time": "0:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9605, "total_steps": 9627, "loss": 1.8291, "learning_rate": 1.2885500932313666e-09, "epoch": 0.9977147605692324, "percentage": 99.77, "elapsed_time": "3 days, 4:20:46", "remaining_time": "0:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9606, "total_steps": 9627, "loss": 1.6905, "learning_rate": 1.1740719172703697e-09, "epoch": 0.9978186350888127, "percentage": 99.78, "elapsed_time": "3 days, 4:21:17", "remaining_time": "0:10:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9607, "total_steps": 9627, "loss": 1.6493, "learning_rate": 1.0649182262623125e-09, "epoch": 0.997922509608393, "percentage": 99.79, "elapsed_time": "3 days, 4:21:48", "remaining_time": "0:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9608, "total_steps": 9627, "loss": 1.6764, "learning_rate": 9.610890318312305e-10, "epoch": 0.9980263841279734, "percentage": 99.8, "elapsed_time": "3 days, 4:22:21", "remaining_time": "0:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9609, "total_steps": 9627, "loss": 1.6347, "learning_rate": 8.625843450404958e-10, "epoch": 0.9981302586475538, "percentage": 99.81, "elapsed_time": "3 days, 4:22:53", "remaining_time": "0:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9610, "total_steps": 9627, "loss": 1.7052, "learning_rate": 7.69404176376165e-10, "epoch": 0.998234133167134, "percentage": 99.82, "elapsed_time": "3 days, 4:23:26", "remaining_time": "0:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9611, "total_steps": 9627, "loss": 1.5105, "learning_rate": 6.81548535763632e-10, "epoch": 0.9983380076867144, "percentage": 99.83, "elapsed_time": "3 days, 4:23:58", "remaining_time": "0:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9612, "total_steps": 9627, "loss": 1.6361, "learning_rate": 5.990174325509745e-10, "epoch": 0.9984418822062948, "percentage": 99.84, "elapsed_time": "3 days, 4:24:29", "remaining_time": "0:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9613, "total_steps": 9627, "loss": 1.6404, "learning_rate": 5.218108755367102e-10, "epoch": 0.9985457567258751, "percentage": 99.85, "elapsed_time": "3 days, 4:25:01", "remaining_time": "0:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9614, "total_steps": 9627, "loss": 1.642, "learning_rate": 4.499288729364892e-10, "epoch": 0.9986496312454555, "percentage": 99.86, "elapsed_time": "3 days, 4:25:34", "remaining_time": "0:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9615, "total_steps": 9627, "loss": 1.7038, "learning_rate": 3.833714324108506e-10, "epoch": 0.9987535057650359, "percentage": 99.88, "elapsed_time": "3 days, 4:26:06", "remaining_time": "0:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9616, "total_steps": 9627, "loss": 1.8699, "learning_rate": 3.221385610430172e-10, "epoch": 0.9988573802846162, "percentage": 99.89, "elapsed_time": "3 days, 4:26:38", "remaining_time": "0:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9617, "total_steps": 9627, "loss": 1.7067, "learning_rate": 2.6623026534999817e-10, "epoch": 0.9989612548041965, "percentage": 99.9, "elapsed_time": "3 days, 4:27:10", "remaining_time": "0:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9618, "total_steps": 9627, "loss": 1.9236, "learning_rate": 2.1564655129369115e-10, "epoch": 0.9990651293237769, "percentage": 99.91, "elapsed_time": "3 days, 4:27:42", "remaining_time": "0:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9619, "total_steps": 9627, "loss": 1.8674, "learning_rate": 1.7038742425867781e-10, "epoch": 0.9991690038433573, "percentage": 99.92, "elapsed_time": "3 days, 4:28:15", "remaining_time": "0:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9620, "total_steps": 9627, "loss": 1.591, "learning_rate": 1.3045288906332608e-10, "epoch": 0.9992728783629375, "percentage": 99.93, "elapsed_time": "3 days, 4:28:47", "remaining_time": "0:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9621, "total_steps": 9627, "loss": 1.3563, "learning_rate": 9.584294995979015e-11, "epoch": 0.9993767528825179, "percentage": 99.94, "elapsed_time": "3 days, 4:29:18", "remaining_time": "0:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9622, "total_steps": 9627, "loss": 1.7152, "learning_rate": 6.655761063956157e-11, "epoch": 0.9994806274020983, "percentage": 99.95, "elapsed_time": "3 days, 4:29:51", "remaining_time": "0:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9623, "total_steps": 9627, "loss": 1.6796, "learning_rate": 4.259687421126479e-11, "epoch": 0.9995845019216786, "percentage": 99.96, "elapsed_time": "3 days, 4:30:22", "remaining_time": "0:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9624, "total_steps": 9627, "loss": 1.8781, "learning_rate": 2.3960743233963913e-11, "epoch": 0.999688376441259, "percentage": 99.97, "elapsed_time": "3 days, 4:30:55", "remaining_time": "0:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9625, "total_steps": 9627, "loss": 1.5272, "learning_rate": 1.0649219683855905e-11, "epoch": 0.9997922509608393, "percentage": 99.98, "elapsed_time": "3 days, 4:31:26", "remaining_time": "0:00:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9626, "total_steps": 9627, "loss": 1.7282, "learning_rate": 2.6623049931284727e-12, "epoch": 0.9998961254804196, "percentage": 99.99, "elapsed_time": "3 days, 4:31:58", "remaining_time": "0:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9627, "total_steps": 9627, "loss": 1.8582, "learning_rate": 0.0, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "3 days, 4:32:22", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9627, "total_steps": 9627, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "3 days, 4:32:24", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}