diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" --- "a/trainer_log.jsonl" +++ "b/trainer_log.jsonl" @@ -25532,3 +25532,1346 @@ {"current_steps": 127566, "total_steps": 134280, "eval_loss": 0.799495279788971, "epoch": 19.0, "percentage": 95.0, "elapsed_time": "7:53:19", "remaining_time": "0:24:54", "throughput": 2607.97, "total_tokens": 74065984} {"current_steps": 127570, "total_steps": 134280, "loss": 0.8254, "lr": 0.00022768061753676848, "epoch": 19.000595770032767, "percentage": 95.0, "elapsed_time": "7:53:22", "remaining_time": "0:24:53", "throughput": 2607.82, "total_tokens": 74068512} {"current_steps": 127575, "total_steps": 134280, "loss": 0.8153, "lr": 0.0002273423383878509, "epoch": 19.001340482573728, "percentage": 95.01, "elapsed_time": "7:53:23", "remaining_time": "0:24:52", "throughput": 2607.82, "total_tokens": 74071232} +{"current_steps": 127580, "total_steps": 134280, "loss": 0.808, "lr": 0.00022700430880796872, "epoch": 19.002085195114685, "percentage": 95.01, "elapsed_time": "7:53:24", "remaining_time": "0:24:51", "throughput": 2607.83, "total_tokens": 74074112} +{"current_steps": 127585, "total_steps": 134280, "loss": 0.7901, "lr": 0.00022666652880283576, "epoch": 19.002829907655645, "percentage": 95.01, "elapsed_time": "7:53:25", "remaining_time": "0:24:50", "throughput": 2607.83, "total_tokens": 74076992} +{"current_steps": 127590, "total_steps": 134280, "loss": 0.8185, "lr": 0.00022632899837815744, "epoch": 19.003574620196606, "percentage": 95.02, "elapsed_time": "7:53:26", "remaining_time": "0:24:49", "throughput": 2607.84, "total_tokens": 74080160} +{"current_steps": 127595, "total_steps": 134280, "loss": 0.7981, "lr": 0.0002259917175396342, "epoch": 19.004319332737563, "percentage": 95.02, "elapsed_time": "7:53:27", "remaining_time": "0:24:48", "throughput": 2607.85, "total_tokens": 74083264} +{"current_steps": 127600, "total_steps": 134280, "loss": 0.7958, "lr": 0.0002256546862929648, "epoch": 19.005064045278523, "percentage": 95.03, "elapsed_time": "7:53:28", "remaining_time": "0:24:47", "throughput": 2607.86, "total_tokens": 74086176} +{"current_steps": 127605, "total_steps": 134280, "loss": 0.7837, "lr": 0.00022531790464384304, "epoch": 19.00580875781948, "percentage": 95.03, "elapsed_time": "7:53:29", "remaining_time": "0:24:46", "throughput": 2607.86, "total_tokens": 74089184} +{"current_steps": 127610, "total_steps": 134280, "loss": 0.8297, "lr": 0.00022498137259796102, "epoch": 19.00655347036044, "percentage": 95.03, "elapsed_time": "7:53:30", "remaining_time": "0:24:45", "throughput": 2607.87, "total_tokens": 74092096} +{"current_steps": 127615, "total_steps": 134280, "loss": 0.8101, "lr": 0.00022464509016100086, "epoch": 19.0072981829014, "percentage": 95.04, "elapsed_time": "7:53:32", "remaining_time": "0:24:43", "throughput": 2607.87, "total_tokens": 74094976} +{"current_steps": 127620, "total_steps": 134280, "loss": 0.7928, "lr": 0.0002243090573386447, "epoch": 19.008042895442358, "percentage": 95.04, "elapsed_time": "7:53:33", "remaining_time": "0:24:42", "throughput": 2607.88, "total_tokens": 74097856} +{"current_steps": 127625, "total_steps": 134280, "loss": 0.7969, "lr": 0.0002239732741365713, "epoch": 19.00878760798332, "percentage": 95.04, "elapsed_time": "7:53:34", "remaining_time": "0:24:41", "throughput": 2607.88, "total_tokens": 74100768} +{"current_steps": 127630, "total_steps": 134280, "loss": 0.8086, "lr": 0.00022363774056045115, "epoch": 19.00953232052428, "percentage": 95.05, "elapsed_time": "7:53:35", "remaining_time": "0:24:40", "throughput": 2607.88, "total_tokens": 74103488} +{"current_steps": 127635, "total_steps": 134280, "loss": 0.8003, "lr": 0.00022330245661595304, "epoch": 19.010277033065236, "percentage": 95.05, "elapsed_time": "7:53:36", "remaining_time": "0:24:39", "throughput": 2607.89, "total_tokens": 74106400} +{"current_steps": 127640, "total_steps": 134280, "loss": 0.784, "lr": 0.00022296742230874076, "epoch": 19.011021745606197, "percentage": 95.06, "elapsed_time": "7:53:37", "remaining_time": "0:24:38", "throughput": 2607.89, "total_tokens": 74109184} +{"current_steps": 127645, "total_steps": 134280, "loss": 0.8033, "lr": 0.00022263263764447648, "epoch": 19.011766458147154, "percentage": 95.06, "elapsed_time": "7:53:38", "remaining_time": "0:24:37", "throughput": 2607.9, "total_tokens": 74112096} +{"current_steps": 127650, "total_steps": 134280, "loss": 0.7927, "lr": 0.00022229810262881233, "epoch": 19.012511170688114, "percentage": 95.06, "elapsed_time": "7:53:39", "remaining_time": "0:24:36", "throughput": 2607.9, "total_tokens": 74115040} +{"current_steps": 127655, "total_steps": 134280, "loss": 0.7871, "lr": 0.00022196381726740543, "epoch": 19.013255883229075, "percentage": 95.07, "elapsed_time": "7:53:40", "remaining_time": "0:24:34", "throughput": 2607.91, "total_tokens": 74118176} +{"current_steps": 127660, "total_steps": 134280, "loss": 0.8108, "lr": 0.00022162978156589795, "epoch": 19.01400059577003, "percentage": 95.07, "elapsed_time": "7:53:41", "remaining_time": "0:24:33", "throughput": 2607.91, "total_tokens": 74120800} +{"current_steps": 127665, "total_steps": 134280, "loss": 0.7993, "lr": 0.00022129599552993539, "epoch": 19.014745308310992, "percentage": 95.07, "elapsed_time": "7:53:42", "remaining_time": "0:24:32", "throughput": 2607.92, "total_tokens": 74123680} +{"current_steps": 127670, "total_steps": 134280, "loss": 0.7897, "lr": 0.0002209624591651582, "epoch": 19.015490020851953, "percentage": 95.08, "elapsed_time": "7:53:43", "remaining_time": "0:24:31", "throughput": 2607.92, "total_tokens": 74126528} +{"current_steps": 127675, "total_steps": 134280, "loss": 0.7991, "lr": 0.00022062917247719693, "epoch": 19.01623473339291, "percentage": 95.08, "elapsed_time": "7:53:44", "remaining_time": "0:24:30", "throughput": 2607.92, "total_tokens": 74129280} +{"current_steps": 127680, "total_steps": 134280, "loss": 0.8117, "lr": 0.00022029613547168702, "epoch": 19.01697944593387, "percentage": 95.08, "elapsed_time": "7:53:45", "remaining_time": "0:24:29", "throughput": 2607.93, "total_tokens": 74132384} +{"current_steps": 127685, "total_steps": 134280, "loss": 0.7837, "lr": 0.00021996334815425065, "epoch": 19.017724158474827, "percentage": 95.09, "elapsed_time": "7:53:46", "remaining_time": "0:24:28", "throughput": 2607.93, "total_tokens": 74134976} +{"current_steps": 127690, "total_steps": 134280, "loss": 0.7863, "lr": 0.00021963081053051335, "epoch": 19.018468871015788, "percentage": 95.09, "elapsed_time": "7:53:47", "remaining_time": "0:24:27", "throughput": 2607.94, "total_tokens": 74138208} +{"current_steps": 127695, "total_steps": 134280, "loss": 0.7841, "lr": 0.00021929852260609229, "epoch": 19.01921358355675, "percentage": 95.1, "elapsed_time": "7:53:48", "remaining_time": "0:24:26", "throughput": 2607.94, "total_tokens": 74141088} +{"current_steps": 127700, "total_steps": 134280, "loss": 0.7948, "lr": 0.0002189664843865996, "epoch": 19.019958296097705, "percentage": 95.1, "elapsed_time": "7:53:49", "remaining_time": "0:24:24", "throughput": 2607.95, "total_tokens": 74143936} +{"current_steps": 127705, "total_steps": 134280, "loss": 0.7821, "lr": 0.00021863469587764416, "epoch": 19.020703008638666, "percentage": 95.1, "elapsed_time": "7:53:51", "remaining_time": "0:24:23", "throughput": 2607.95, "total_tokens": 74146688} +{"current_steps": 127710, "total_steps": 134280, "loss": 0.7954, "lr": 0.00021830315708483316, "epoch": 19.021447721179623, "percentage": 95.11, "elapsed_time": "7:53:52", "remaining_time": "0:24:22", "throughput": 2607.95, "total_tokens": 74149472} +{"current_steps": 127715, "total_steps": 134280, "loss": 0.8013, "lr": 0.0002179718680137671, "epoch": 19.022192433720583, "percentage": 95.11, "elapsed_time": "7:53:53", "remaining_time": "0:24:21", "throughput": 2607.96, "total_tokens": 74152512} +{"current_steps": 127720, "total_steps": 134280, "loss": 0.8049, "lr": 0.00021764082867004153, "epoch": 19.022937146261544, "percentage": 95.11, "elapsed_time": "7:53:54", "remaining_time": "0:24:20", "throughput": 2607.97, "total_tokens": 74155488} +{"current_steps": 127725, "total_steps": 134280, "loss": 0.8229, "lr": 0.00021731003905925026, "epoch": 19.0236818588025, "percentage": 95.12, "elapsed_time": "7:53:55", "remaining_time": "0:24:19", "throughput": 2607.97, "total_tokens": 74158240} +{"current_steps": 127730, "total_steps": 134280, "loss": 0.7845, "lr": 0.00021697949918698055, "epoch": 19.02442657134346, "percentage": 95.12, "elapsed_time": "7:53:56", "remaining_time": "0:24:18", "throughput": 2607.97, "total_tokens": 74160992} +{"current_steps": 127735, "total_steps": 134280, "loss": 0.8069, "lr": 0.00021664920905881956, "epoch": 19.025171283884422, "percentage": 95.13, "elapsed_time": "7:53:57", "remaining_time": "0:24:17", "throughput": 2607.99, "total_tokens": 74164192} +{"current_steps": 127740, "total_steps": 134280, "loss": 0.7855, "lr": 0.00021631916868034283, "epoch": 19.02591599642538, "percentage": 95.13, "elapsed_time": "7:53:58", "remaining_time": "0:24:15", "throughput": 2607.99, "total_tokens": 74167104} +{"current_steps": 127745, "total_steps": 134280, "loss": 0.7783, "lr": 0.0002159893780571309, "epoch": 19.02666070896634, "percentage": 95.13, "elapsed_time": "7:53:59", "remaining_time": "0:24:14", "throughput": 2607.99, "total_tokens": 74169888} +{"current_steps": 127750, "total_steps": 134280, "loss": 0.7977, "lr": 0.00021565983719475101, "epoch": 19.027405421507297, "percentage": 95.14, "elapsed_time": "7:54:00", "remaining_time": "0:24:13", "throughput": 2608.0, "total_tokens": 74172960} +{"current_steps": 127755, "total_steps": 134280, "loss": 0.797, "lr": 0.00021533054609877366, "epoch": 19.028150134048257, "percentage": 95.14, "elapsed_time": "7:54:01", "remaining_time": "0:24:12", "throughput": 2608.0, "total_tokens": 74175712} +{"current_steps": 127760, "total_steps": 134280, "loss": 0.7994, "lr": 0.00021500150477475944, "epoch": 19.028894846589218, "percentage": 95.14, "elapsed_time": "7:54:02", "remaining_time": "0:24:11", "throughput": 2608.01, "total_tokens": 74178592} +{"current_steps": 127765, "total_steps": 134280, "loss": 0.8268, "lr": 0.00021467271322826552, "epoch": 19.029639559130175, "percentage": 95.15, "elapsed_time": "7:54:03", "remaining_time": "0:24:10", "throughput": 2608.02, "total_tokens": 74181888} +{"current_steps": 127770, "total_steps": 134280, "loss": 0.8034, "lr": 0.0002143441714648525, "epoch": 19.030384271671135, "percentage": 95.15, "elapsed_time": "7:54:04", "remaining_time": "0:24:09", "throughput": 2608.02, "total_tokens": 74184672} +{"current_steps": 127775, "total_steps": 134280, "loss": 0.7946, "lr": 0.0002140158794900643, "epoch": 19.031128984212096, "percentage": 95.16, "elapsed_time": "7:54:05", "remaining_time": "0:24:08", "throughput": 2608.02, "total_tokens": 74187456} +{"current_steps": 127780, "total_steps": 134280, "loss": 0.8432, "lr": 0.0002136878373094514, "epoch": 19.031873696753053, "percentage": 95.16, "elapsed_time": "7:54:06", "remaining_time": "0:24:07", "throughput": 2608.03, "total_tokens": 74190496} +{"current_steps": 127785, "total_steps": 134280, "loss": 0.8042, "lr": 0.00021336004492855442, "epoch": 19.032618409294013, "percentage": 95.16, "elapsed_time": "7:54:07", "remaining_time": "0:24:05", "throughput": 2608.04, "total_tokens": 74193408} +{"current_steps": 127790, "total_steps": 134280, "loss": 0.8109, "lr": 0.0002130325023529106, "epoch": 19.03336312183497, "percentage": 95.17, "elapsed_time": "7:54:09", "remaining_time": "0:24:04", "throughput": 2608.04, "total_tokens": 74196096} +{"current_steps": 127795, "total_steps": 134280, "loss": 0.7996, "lr": 0.00021270520958805548, "epoch": 19.03410783437593, "percentage": 95.17, "elapsed_time": "7:54:10", "remaining_time": "0:24:03", "throughput": 2608.05, "total_tokens": 74199104} +{"current_steps": 127800, "total_steps": 134280, "loss": 0.8019, "lr": 0.00021237816663951468, "epoch": 19.03485254691689, "percentage": 95.17, "elapsed_time": "7:54:11", "remaining_time": "0:24:02", "throughput": 2608.05, "total_tokens": 74201952} +{"current_steps": 127805, "total_steps": 134280, "loss": 0.7941, "lr": 0.00021205137351281542, "epoch": 19.035597259457848, "percentage": 95.18, "elapsed_time": "7:54:12", "remaining_time": "0:24:01", "throughput": 2608.05, "total_tokens": 74204640} +{"current_steps": 127810, "total_steps": 134280, "loss": 0.806, "lr": 0.0002117248302134783, "epoch": 19.03634197199881, "percentage": 95.18, "elapsed_time": "7:54:13", "remaining_time": "0:24:00", "throughput": 2608.06, "total_tokens": 74207584} +{"current_steps": 127815, "total_steps": 134280, "loss": 0.7772, "lr": 0.00021139853674702225, "epoch": 19.03708668453977, "percentage": 95.19, "elapsed_time": "7:54:14", "remaining_time": "0:23:59", "throughput": 2608.06, "total_tokens": 74210304} +{"current_steps": 127820, "total_steps": 134280, "loss": 0.7958, "lr": 0.00021107249311895615, "epoch": 19.037831397080726, "percentage": 95.19, "elapsed_time": "7:54:15", "remaining_time": "0:23:58", "throughput": 2608.06, "total_tokens": 74213184} +{"current_steps": 127825, "total_steps": 134280, "loss": 0.8072, "lr": 0.00021074669933478894, "epoch": 19.038576109621687, "percentage": 95.19, "elapsed_time": "7:54:16", "remaining_time": "0:23:57", "throughput": 2608.07, "total_tokens": 74216512} +{"current_steps": 127830, "total_steps": 134280, "loss": 0.8072, "lr": 0.00021042115540002626, "epoch": 19.039320822162644, "percentage": 95.2, "elapsed_time": "7:54:17", "remaining_time": "0:23:55", "throughput": 2608.08, "total_tokens": 74219328} +{"current_steps": 127835, "total_steps": 134280, "loss": 0.7993, "lr": 0.00021009586132016532, "epoch": 19.040065534703604, "percentage": 95.2, "elapsed_time": "7:54:18", "remaining_time": "0:23:54", "throughput": 2608.09, "total_tokens": 74222432} +{"current_steps": 127840, "total_steps": 134280, "loss": 0.8277, "lr": 0.00020977081710070344, "epoch": 19.040810247244565, "percentage": 95.2, "elapsed_time": "7:54:19", "remaining_time": "0:23:53", "throughput": 2608.09, "total_tokens": 74225376} +{"current_steps": 127845, "total_steps": 134280, "loss": 0.7847, "lr": 0.0002094460227471312, "epoch": 19.041554959785522, "percentage": 95.21, "elapsed_time": "7:54:20", "remaining_time": "0:23:52", "throughput": 2608.1, "total_tokens": 74228384} +{"current_steps": 127850, "total_steps": 134280, "loss": 0.8017, "lr": 0.00020912147826493755, "epoch": 19.042299672326482, "percentage": 95.21, "elapsed_time": "7:54:21", "remaining_time": "0:23:51", "throughput": 2608.11, "total_tokens": 74231424} +{"current_steps": 127855, "total_steps": 134280, "loss": 0.8033, "lr": 0.00020879718365960143, "epoch": 19.043044384867443, "percentage": 95.22, "elapsed_time": "7:54:22", "remaining_time": "0:23:50", "throughput": 2608.12, "total_tokens": 74234720} +{"current_steps": 127860, "total_steps": 134280, "loss": 0.8078, "lr": 0.00020847313893660512, "epoch": 19.0437890974084, "percentage": 95.22, "elapsed_time": "7:54:23", "remaining_time": "0:23:49", "throughput": 2608.12, "total_tokens": 74237472} +{"current_steps": 127865, "total_steps": 134280, "loss": 0.7968, "lr": 0.00020814934410142094, "epoch": 19.04453380994936, "percentage": 95.22, "elapsed_time": "7:54:24", "remaining_time": "0:23:48", "throughput": 2608.13, "total_tokens": 74240288} +{"current_steps": 127870, "total_steps": 134280, "loss": 0.7992, "lr": 0.00020782579915952113, "epoch": 19.045278522490317, "percentage": 95.23, "elapsed_time": "7:54:26", "remaining_time": "0:23:46", "throughput": 2608.13, "total_tokens": 74242976} +{"current_steps": 127875, "total_steps": 134280, "loss": 0.7901, "lr": 0.00020750250411636972, "epoch": 19.046023235031278, "percentage": 95.23, "elapsed_time": "7:54:27", "remaining_time": "0:23:45", "throughput": 2608.13, "total_tokens": 74245664} +{"current_steps": 127880, "total_steps": 134280, "loss": 0.8017, "lr": 0.00020717945897742894, "epoch": 19.04676794757224, "percentage": 95.23, "elapsed_time": "7:54:28", "remaining_time": "0:23:44", "throughput": 2608.13, "total_tokens": 74248576} +{"current_steps": 127885, "total_steps": 134280, "loss": 0.8025, "lr": 0.00020685666374815613, "epoch": 19.047512660113195, "percentage": 95.24, "elapsed_time": "7:54:29", "remaining_time": "0:23:43", "throughput": 2608.14, "total_tokens": 74251392} +{"current_steps": 127890, "total_steps": 134280, "loss": 0.7863, "lr": 0.00020653411843400693, "epoch": 19.048257372654156, "percentage": 95.24, "elapsed_time": "7:54:30", "remaining_time": "0:23:42", "throughput": 2608.14, "total_tokens": 74254432} +{"current_steps": 127895, "total_steps": 134280, "loss": 0.7938, "lr": 0.00020621182304042694, "epoch": 19.049002085195113, "percentage": 95.25, "elapsed_time": "7:54:31", "remaining_time": "0:23:41", "throughput": 2608.15, "total_tokens": 74257248} +{"current_steps": 127900, "total_steps": 134280, "loss": 0.7958, "lr": 0.00020588977757286185, "epoch": 19.049746797736073, "percentage": 95.25, "elapsed_time": "7:54:32", "remaining_time": "0:23:40", "throughput": 2608.15, "total_tokens": 74260032} +{"current_steps": 127905, "total_steps": 134280, "loss": 0.7928, "lr": 0.0002055679820367523, "epoch": 19.050491510277034, "percentage": 95.25, "elapsed_time": "7:54:33", "remaining_time": "0:23:39", "throughput": 2608.16, "total_tokens": 74263040} +{"current_steps": 127910, "total_steps": 134280, "loss": 0.8015, "lr": 0.00020524643643753725, "epoch": 19.05123622281799, "percentage": 95.26, "elapsed_time": "7:54:34", "remaining_time": "0:23:38", "throughput": 2608.17, "total_tokens": 74266176} +{"current_steps": 127915, "total_steps": 134280, "loss": 0.7951, "lr": 0.00020492514078064572, "epoch": 19.05198093535895, "percentage": 95.26, "elapsed_time": "7:54:35", "remaining_time": "0:23:36", "throughput": 2608.17, "total_tokens": 74268992} +{"current_steps": 127920, "total_steps": 134280, "loss": 0.816, "lr": 0.00020460409507150833, "epoch": 19.052725647899912, "percentage": 95.26, "elapsed_time": "7:54:36", "remaining_time": "0:23:35", "throughput": 2608.18, "total_tokens": 74271872} +{"current_steps": 127925, "total_steps": 134280, "loss": 0.8078, "lr": 0.00020428329931554412, "epoch": 19.05347036044087, "percentage": 95.27, "elapsed_time": "7:54:37", "remaining_time": "0:23:34", "throughput": 2608.18, "total_tokens": 74274688} +{"current_steps": 127930, "total_steps": 134280, "loss": 0.7916, "lr": 0.0002039627535181787, "epoch": 19.05421507298183, "percentage": 95.27, "elapsed_time": "7:54:38", "remaining_time": "0:23:33", "throughput": 2608.19, "total_tokens": 74277824} +{"current_steps": 127935, "total_steps": 134280, "loss": 0.7968, "lr": 0.0002036424576848228, "epoch": 19.054959785522787, "percentage": 95.27, "elapsed_time": "7:54:39", "remaining_time": "0:23:32", "throughput": 2608.2, "total_tokens": 74280768} +{"current_steps": 127940, "total_steps": 134280, "loss": 0.7985, "lr": 0.00020332241182089206, "epoch": 19.055704498063747, "percentage": 95.28, "elapsed_time": "7:54:40", "remaining_time": "0:23:31", "throughput": 2608.21, "total_tokens": 74283936} +{"current_steps": 127945, "total_steps": 134280, "loss": 0.8019, "lr": 0.00020300261593178713, "epoch": 19.056449210604708, "percentage": 95.28, "elapsed_time": "7:54:41", "remaining_time": "0:23:30", "throughput": 2608.21, "total_tokens": 74286976} +{"current_steps": 127950, "total_steps": 134280, "loss": 0.7867, "lr": 0.00020268307002291707, "epoch": 19.057193923145665, "percentage": 95.29, "elapsed_time": "7:54:42", "remaining_time": "0:23:29", "throughput": 2608.22, "total_tokens": 74289888} +{"current_steps": 127955, "total_steps": 134280, "loss": 0.8003, "lr": 0.00020236377409967588, "epoch": 19.057938635686625, "percentage": 95.29, "elapsed_time": "7:54:44", "remaining_time": "0:23:28", "throughput": 2608.22, "total_tokens": 74292704} +{"current_steps": 127960, "total_steps": 134280, "loss": 0.795, "lr": 0.0002020447281674592, "epoch": 19.058683348227586, "percentage": 95.29, "elapsed_time": "7:54:45", "remaining_time": "0:23:26", "throughput": 2608.23, "total_tokens": 74295968} +{"current_steps": 127965, "total_steps": 134280, "loss": 0.8012, "lr": 0.00020172593223165614, "epoch": 19.059428060768543, "percentage": 95.3, "elapsed_time": "7:54:46", "remaining_time": "0:23:25", "throughput": 2608.24, "total_tokens": 74299168} +{"current_steps": 127970, "total_steps": 134280, "loss": 0.7869, "lr": 0.00020140738629765396, "epoch": 19.060172773309503, "percentage": 95.3, "elapsed_time": "7:54:47", "remaining_time": "0:23:24", "throughput": 2608.25, "total_tokens": 74302112} +{"current_steps": 127975, "total_steps": 134280, "loss": 0.8064, "lr": 0.00020108909037083343, "epoch": 19.06091748585046, "percentage": 95.3, "elapsed_time": "7:54:48", "remaining_time": "0:23:23", "throughput": 2608.25, "total_tokens": 74304800} +{"current_steps": 127980, "total_steps": 134280, "loss": 0.7967, "lr": 0.00020077104445657024, "epoch": 19.06166219839142, "percentage": 95.31, "elapsed_time": "7:54:49", "remaining_time": "0:23:22", "throughput": 2608.25, "total_tokens": 74307648} +{"current_steps": 127985, "total_steps": 134280, "loss": 0.7803, "lr": 0.00020045324856024003, "epoch": 19.06240691093238, "percentage": 95.31, "elapsed_time": "7:54:50", "remaining_time": "0:23:21", "throughput": 2608.26, "total_tokens": 74310496} +{"current_steps": 127990, "total_steps": 134280, "loss": 0.7796, "lr": 0.0002001357026872119, "epoch": 19.06315162347334, "percentage": 95.32, "elapsed_time": "7:54:51", "remaining_time": "0:23:20", "throughput": 2608.27, "total_tokens": 74313600} +{"current_steps": 127995, "total_steps": 134280, "loss": 0.8018, "lr": 0.00019981840684284657, "epoch": 19.0638963360143, "percentage": 95.32, "elapsed_time": "7:54:52", "remaining_time": "0:23:19", "throughput": 2608.27, "total_tokens": 74316544} +{"current_steps": 128000, "total_steps": 134280, "loss": 0.8006, "lr": 0.0001995013610325097, "epoch": 19.06464104855526, "percentage": 95.32, "elapsed_time": "7:54:53", "remaining_time": "0:23:17", "throughput": 2608.28, "total_tokens": 74319392} +{"current_steps": 128005, "total_steps": 134280, "loss": 0.7995, "lr": 0.00019918456526155204, "epoch": 19.065385761096216, "percentage": 95.33, "elapsed_time": "7:54:54", "remaining_time": "0:23:16", "throughput": 2608.28, "total_tokens": 74322464} +{"current_steps": 128010, "total_steps": 134280, "loss": 0.7921, "lr": 0.00019886801953533095, "epoch": 19.066130473637177, "percentage": 95.33, "elapsed_time": "7:54:55", "remaining_time": "0:23:15", "throughput": 2608.29, "total_tokens": 74325376} +{"current_steps": 128015, "total_steps": 134280, "loss": 0.7778, "lr": 0.00019855172385918883, "epoch": 19.066875186178134, "percentage": 95.33, "elapsed_time": "7:54:56", "remaining_time": "0:23:14", "throughput": 2608.29, "total_tokens": 74328224} +{"current_steps": 128020, "total_steps": 134280, "loss": 0.7902, "lr": 0.00019823567823847477, "epoch": 19.067619898719094, "percentage": 95.34, "elapsed_time": "7:54:57", "remaining_time": "0:23:13", "throughput": 2608.3, "total_tokens": 74331424} +{"current_steps": 128025, "total_steps": 134280, "loss": 0.7865, "lr": 0.0001979198826785228, "epoch": 19.068364611260055, "percentage": 95.34, "elapsed_time": "7:54:59", "remaining_time": "0:23:12", "throughput": 2608.31, "total_tokens": 74334464} +{"current_steps": 128030, "total_steps": 134280, "loss": 0.8002, "lr": 0.00019760433718467196, "epoch": 19.069109323801012, "percentage": 95.35, "elapsed_time": "7:55:00", "remaining_time": "0:23:11", "throughput": 2608.32, "total_tokens": 74337504} +{"current_steps": 128035, "total_steps": 134280, "loss": 0.7925, "lr": 0.00019728904176225136, "epoch": 19.069854036341972, "percentage": 95.35, "elapsed_time": "7:55:01", "remaining_time": "0:23:10", "throughput": 2608.32, "total_tokens": 74340352} +{"current_steps": 128040, "total_steps": 134280, "loss": 0.8008, "lr": 0.00019697399641658506, "epoch": 19.070598748882933, "percentage": 95.35, "elapsed_time": "7:55:02", "remaining_time": "0:23:09", "throughput": 2608.33, "total_tokens": 74343264} +{"current_steps": 128045, "total_steps": 134280, "loss": 0.81, "lr": 0.0001966592011530005, "epoch": 19.07134346142389, "percentage": 95.36, "elapsed_time": "7:55:03", "remaining_time": "0:23:07", "throughput": 2608.33, "total_tokens": 74345952} +{"current_steps": 128050, "total_steps": 134280, "loss": 0.7987, "lr": 0.0001963446559768117, "epoch": 19.07208817396485, "percentage": 95.36, "elapsed_time": "7:55:04", "remaining_time": "0:23:06", "throughput": 2608.33, "total_tokens": 74348768} +{"current_steps": 128055, "total_steps": 134280, "loss": 0.8006, "lr": 0.00019603036089333448, "epoch": 19.072832886505807, "percentage": 95.36, "elapsed_time": "7:55:05", "remaining_time": "0:23:05", "throughput": 2608.34, "total_tokens": 74351776} +{"current_steps": 128060, "total_steps": 134280, "loss": 0.7961, "lr": 0.00019571631590787784, "epoch": 19.073577599046768, "percentage": 95.37, "elapsed_time": "7:55:06", "remaining_time": "0:23:04", "throughput": 2608.35, "total_tokens": 74354592} +{"current_steps": 128065, "total_steps": 134280, "loss": 0.796, "lr": 0.00019540252102574928, "epoch": 19.07432231158773, "percentage": 95.37, "elapsed_time": "7:55:07", "remaining_time": "0:23:03", "throughput": 2608.35, "total_tokens": 74357664} +{"current_steps": 128070, "total_steps": 134280, "loss": 0.7843, "lr": 0.00019508897625224785, "epoch": 19.075067024128685, "percentage": 95.38, "elapsed_time": "7:55:08", "remaining_time": "0:23:02", "throughput": 2608.36, "total_tokens": 74360480} +{"current_steps": 128075, "total_steps": 134280, "loss": 0.8079, "lr": 0.000194775681592671, "epoch": 19.075811736669646, "percentage": 95.38, "elapsed_time": "7:55:09", "remaining_time": "0:23:01", "throughput": 2608.37, "total_tokens": 74363584} +{"current_steps": 128080, "total_steps": 134280, "loss": 0.7991, "lr": 0.00019446263705231114, "epoch": 19.076556449210603, "percentage": 95.38, "elapsed_time": "7:55:10", "remaining_time": "0:23:00", "throughput": 2608.37, "total_tokens": 74366432} +{"current_steps": 128085, "total_steps": 134280, "loss": 0.7859, "lr": 0.0001941498426364574, "epoch": 19.077301161751564, "percentage": 95.39, "elapsed_time": "7:55:11", "remaining_time": "0:22:59", "throughput": 2608.38, "total_tokens": 74369472} +{"current_steps": 128090, "total_steps": 134280, "loss": 0.807, "lr": 0.00019383729835039553, "epoch": 19.078045874292524, "percentage": 95.39, "elapsed_time": "7:55:12", "remaining_time": "0:22:57", "throughput": 2608.38, "total_tokens": 74372288} +{"current_steps": 128095, "total_steps": 134280, "loss": 0.7953, "lr": 0.00019352500419940133, "epoch": 19.07879058683348, "percentage": 95.39, "elapsed_time": "7:55:13", "remaining_time": "0:22:56", "throughput": 2608.38, "total_tokens": 74375040} +{"current_steps": 128100, "total_steps": 134280, "loss": 0.819, "lr": 0.00019321296018875555, "epoch": 19.07953529937444, "percentage": 95.4, "elapsed_time": "7:55:14", "remaining_time": "0:22:55", "throughput": 2608.38, "total_tokens": 74377792} +{"current_steps": 128105, "total_steps": 134280, "loss": 0.8107, "lr": 0.00019290116632372732, "epoch": 19.080280011915402, "percentage": 95.4, "elapsed_time": "7:55:15", "remaining_time": "0:22:54", "throughput": 2608.39, "total_tokens": 74380864} +{"current_steps": 128110, "total_steps": 134280, "loss": 0.8398, "lr": 0.00019258962260958578, "epoch": 19.08102472445636, "percentage": 95.41, "elapsed_time": "7:55:17", "remaining_time": "0:22:53", "throughput": 2608.41, "total_tokens": 74384160} +{"current_steps": 128115, "total_steps": 134280, "loss": 0.7876, "lr": 0.00019227832905159168, "epoch": 19.08176943699732, "percentage": 95.41, "elapsed_time": "7:55:18", "remaining_time": "0:22:52", "throughput": 2608.41, "total_tokens": 74387072} +{"current_steps": 128120, "total_steps": 134280, "loss": 0.7899, "lr": 0.00019196728565500586, "epoch": 19.082514149538277, "percentage": 95.41, "elapsed_time": "7:55:19", "remaining_time": "0:22:51", "throughput": 2608.42, "total_tokens": 74389920} +{"current_steps": 128125, "total_steps": 134280, "loss": 0.8274, "lr": 0.0001916564924250824, "epoch": 19.083258862079237, "percentage": 95.42, "elapsed_time": "7:55:20", "remaining_time": "0:22:50", "throughput": 2608.42, "total_tokens": 74392896} +{"current_steps": 128130, "total_steps": 134280, "loss": 0.8116, "lr": 0.0001913459493670705, "epoch": 19.084003574620198, "percentage": 95.42, "elapsed_time": "7:55:21", "remaining_time": "0:22:48", "throughput": 2608.43, "total_tokens": 74395776} +{"current_steps": 128135, "total_steps": 134280, "loss": 0.795, "lr": 0.0001910356564862209, "epoch": 19.084748287161155, "percentage": 95.42, "elapsed_time": "7:55:22", "remaining_time": "0:22:47", "throughput": 2608.43, "total_tokens": 74398624} +{"current_steps": 128140, "total_steps": 134280, "loss": 0.801, "lr": 0.0001907256137877694, "epoch": 19.085492999702115, "percentage": 95.43, "elapsed_time": "7:55:23", "remaining_time": "0:22:46", "throughput": 2608.44, "total_tokens": 74401568} +{"current_steps": 128145, "total_steps": 134280, "loss": 0.8215, "lr": 0.00019041582127696022, "epoch": 19.086237712243076, "percentage": 95.43, "elapsed_time": "7:55:24", "remaining_time": "0:22:45", "throughput": 2608.45, "total_tokens": 74404544} +{"current_steps": 128150, "total_steps": 134280, "loss": 0.7945, "lr": 0.00019010627895902244, "epoch": 19.086982424784033, "percentage": 95.43, "elapsed_time": "7:55:25", "remaining_time": "0:22:44", "throughput": 2608.45, "total_tokens": 74407392} +{"current_steps": 128155, "total_steps": 134280, "loss": 0.8114, "lr": 0.00018979698683918854, "epoch": 19.087727137324993, "percentage": 95.44, "elapsed_time": "7:55:26", "remaining_time": "0:22:43", "throughput": 2608.45, "total_tokens": 74410112} +{"current_steps": 128160, "total_steps": 134280, "loss": 0.7794, "lr": 0.00018948794492268105, "epoch": 19.08847184986595, "percentage": 95.44, "elapsed_time": "7:55:27", "remaining_time": "0:22:42", "throughput": 2608.45, "total_tokens": 74412832} +{"current_steps": 128165, "total_steps": 134280, "loss": 0.8009, "lr": 0.0001891791532147208, "epoch": 19.08921656240691, "percentage": 95.45, "elapsed_time": "7:55:28", "remaining_time": "0:22:41", "throughput": 2608.46, "total_tokens": 74415648} +{"current_steps": 128170, "total_steps": 134280, "loss": 0.8126, "lr": 0.00018887061172052688, "epoch": 19.08996127494787, "percentage": 95.45, "elapsed_time": "7:55:29", "remaining_time": "0:22:40", "throughput": 2608.46, "total_tokens": 74418592} +{"current_steps": 128175, "total_steps": 134280, "loss": 0.8162, "lr": 0.00018856232044531018, "epoch": 19.09070598748883, "percentage": 95.45, "elapsed_time": "7:55:30", "remaining_time": "0:22:38", "throughput": 2608.47, "total_tokens": 74421632} +{"current_steps": 128180, "total_steps": 134280, "loss": 0.7847, "lr": 0.00018825427939427985, "epoch": 19.09145070002979, "percentage": 95.46, "elapsed_time": "7:55:31", "remaining_time": "0:22:37", "throughput": 2608.48, "total_tokens": 74424576} +{"current_steps": 128185, "total_steps": 134280, "loss": 0.7852, "lr": 0.0001879464885726384, "epoch": 19.09219541257075, "percentage": 95.46, "elapsed_time": "7:55:32", "remaining_time": "0:22:36", "throughput": 2608.48, "total_tokens": 74427296} +{"current_steps": 128190, "total_steps": 134280, "loss": 0.8124, "lr": 0.00018763894798558834, "epoch": 19.092940125111706, "percentage": 95.46, "elapsed_time": "7:55:33", "remaining_time": "0:22:35", "throughput": 2608.48, "total_tokens": 74430048} +{"current_steps": 128195, "total_steps": 134280, "loss": 0.8524, "lr": 0.00018733165763832382, "epoch": 19.093684837652667, "percentage": 95.47, "elapsed_time": "7:55:34", "remaining_time": "0:22:34", "throughput": 2608.49, "total_tokens": 74432992} +{"current_steps": 128200, "total_steps": 134280, "loss": 0.8098, "lr": 0.00018702461753603404, "epoch": 19.094429550193624, "percentage": 95.47, "elapsed_time": "7:55:36", "remaining_time": "0:22:33", "throughput": 2608.49, "total_tokens": 74436032} +{"current_steps": 128205, "total_steps": 134280, "loss": 0.7878, "lr": 0.00018671782768390986, "epoch": 19.095174262734584, "percentage": 95.48, "elapsed_time": "7:55:37", "remaining_time": "0:22:32", "throughput": 2608.5, "total_tokens": 74439008} +{"current_steps": 128210, "total_steps": 134280, "loss": 0.7952, "lr": 0.00018641128808713047, "epoch": 19.095918975275545, "percentage": 95.48, "elapsed_time": "7:55:38", "remaining_time": "0:22:31", "throughput": 2608.5, "total_tokens": 74441760} +{"current_steps": 128215, "total_steps": 134280, "loss": 0.827, "lr": 0.00018610499875087837, "epoch": 19.096663687816502, "percentage": 95.48, "elapsed_time": "7:55:39", "remaining_time": "0:22:29", "throughput": 2608.5, "total_tokens": 74444544} +{"current_steps": 128220, "total_steps": 134280, "loss": 0.7851, "lr": 0.0001857989596803261, "epoch": 19.097408400357462, "percentage": 95.49, "elapsed_time": "7:55:40", "remaining_time": "0:22:28", "throughput": 2608.51, "total_tokens": 74447456} +{"current_steps": 128225, "total_steps": 134280, "loss": 0.7959, "lr": 0.00018549317088064287, "epoch": 19.098153112898423, "percentage": 95.49, "elapsed_time": "7:55:41", "remaining_time": "0:22:27", "throughput": 2608.51, "total_tokens": 74450304} +{"current_steps": 128230, "total_steps": 134280, "loss": 0.7768, "lr": 0.0001851876323569962, "epoch": 19.09889782543938, "percentage": 95.49, "elapsed_time": "7:55:42", "remaining_time": "0:22:26", "throughput": 2608.52, "total_tokens": 74453184} +{"current_steps": 128235, "total_steps": 134280, "loss": 0.7997, "lr": 0.00018488234411454695, "epoch": 19.09964253798034, "percentage": 95.5, "elapsed_time": "7:55:43", "remaining_time": "0:22:25", "throughput": 2608.52, "total_tokens": 74456096} +{"current_steps": 128240, "total_steps": 134280, "loss": 0.7843, "lr": 0.00018457730615845436, "epoch": 19.100387250521297, "percentage": 95.5, "elapsed_time": "7:55:44", "remaining_time": "0:22:24", "throughput": 2608.52, "total_tokens": 74458816} +{"current_steps": 128245, "total_steps": 134280, "loss": 0.7902, "lr": 0.00018427251849386926, "epoch": 19.101131963062258, "percentage": 95.51, "elapsed_time": "7:55:45", "remaining_time": "0:22:23", "throughput": 2608.53, "total_tokens": 74461888} +{"current_steps": 128250, "total_steps": 134280, "loss": 0.8022, "lr": 0.00018396798112594258, "epoch": 19.10187667560322, "percentage": 95.51, "elapsed_time": "7:55:46", "remaining_time": "0:22:22", "throughput": 2608.54, "total_tokens": 74464960} +{"current_steps": 128255, "total_steps": 134280, "loss": 0.8085, "lr": 0.00018366369405981687, "epoch": 19.102621388144176, "percentage": 95.51, "elapsed_time": "7:55:47", "remaining_time": "0:22:21", "throughput": 2608.55, "total_tokens": 74468000} +{"current_steps": 128260, "total_steps": 134280, "loss": 0.8058, "lr": 0.0001833596573006363, "epoch": 19.103366100685136, "percentage": 95.52, "elapsed_time": "7:55:48", "remaining_time": "0:22:19", "throughput": 2608.56, "total_tokens": 74470976} +{"current_steps": 128265, "total_steps": 134280, "loss": 0.7899, "lr": 0.00018305587085353515, "epoch": 19.104110813226093, "percentage": 95.52, "elapsed_time": "7:55:49", "remaining_time": "0:22:18", "throughput": 2608.56, "total_tokens": 74473920} +{"current_steps": 128270, "total_steps": 134280, "loss": 0.8055, "lr": 0.00018275233472364594, "epoch": 19.104855525767054, "percentage": 95.52, "elapsed_time": "7:55:50", "remaining_time": "0:22:17", "throughput": 2608.56, "total_tokens": 74476544} +{"current_steps": 128275, "total_steps": 134280, "loss": 0.7782, "lr": 0.00018244904891609625, "epoch": 19.105600238308014, "percentage": 95.53, "elapsed_time": "7:55:51", "remaining_time": "0:22:16", "throughput": 2608.57, "total_tokens": 74479424} +{"current_steps": 128280, "total_steps": 134280, "loss": 0.7882, "lr": 0.00018214601343600865, "epoch": 19.10634495084897, "percentage": 95.53, "elapsed_time": "7:55:52", "remaining_time": "0:22:15", "throughput": 2608.58, "total_tokens": 74482656} +{"current_steps": 128285, "total_steps": 134280, "loss": 0.7863, "lr": 0.00018184322828850575, "epoch": 19.10708966338993, "percentage": 95.54, "elapsed_time": "7:55:54", "remaining_time": "0:22:14", "throughput": 2608.58, "total_tokens": 74485408} +{"current_steps": 128290, "total_steps": 134280, "loss": 0.7954, "lr": 0.00018154069347870006, "epoch": 19.107834375930892, "percentage": 95.54, "elapsed_time": "7:55:55", "remaining_time": "0:22:13", "throughput": 2608.59, "total_tokens": 74488800} +{"current_steps": 128295, "total_steps": 134280, "loss": 0.8325, "lr": 0.0001812384090117042, "epoch": 19.10857908847185, "percentage": 95.54, "elapsed_time": "7:55:56", "remaining_time": "0:22:12", "throughput": 2608.6, "total_tokens": 74491904} +{"current_steps": 128300, "total_steps": 134280, "loss": 0.7968, "lr": 0.00018093637489262403, "epoch": 19.10932380101281, "percentage": 95.55, "elapsed_time": "7:55:57", "remaining_time": "0:22:11", "throughput": 2608.6, "total_tokens": 74494496} +{"current_steps": 128305, "total_steps": 134280, "loss": 0.798, "lr": 0.00018063459112656222, "epoch": 19.110068513553767, "percentage": 95.55, "elapsed_time": "7:55:58", "remaining_time": "0:22:09", "throughput": 2608.61, "total_tokens": 74497472} +{"current_steps": 128310, "total_steps": 134280, "loss": 0.7914, "lr": 0.0001803330577186163, "epoch": 19.110813226094727, "percentage": 95.55, "elapsed_time": "7:55:59", "remaining_time": "0:22:08", "throughput": 2608.61, "total_tokens": 74500288} +{"current_steps": 128315, "total_steps": 134280, "loss": 0.7889, "lr": 0.00018003177467388386, "epoch": 19.111557938635688, "percentage": 95.56, "elapsed_time": "7:56:00", "remaining_time": "0:22:07", "throughput": 2608.64, "total_tokens": 74504576} +{"current_steps": 128320, "total_steps": 134280, "loss": 0.8044, "lr": 0.00017973074199745086, "epoch": 19.112302651176645, "percentage": 95.56, "elapsed_time": "7:56:01", "remaining_time": "0:22:06", "throughput": 2608.64, "total_tokens": 74507360} +{"current_steps": 128325, "total_steps": 134280, "loss": 0.7932, "lr": 0.00017942995969440323, "epoch": 19.113047363717605, "percentage": 95.57, "elapsed_time": "7:56:02", "remaining_time": "0:22:05", "throughput": 2608.64, "total_tokens": 74510112} +{"current_steps": 128330, "total_steps": 134280, "loss": 0.8119, "lr": 0.00017912942776982522, "epoch": 19.113792076258566, "percentage": 95.57, "elapsed_time": "7:56:03", "remaining_time": "0:22:04", "throughput": 2608.65, "total_tokens": 74512960} +{"current_steps": 128335, "total_steps": 134280, "loss": 0.8058, "lr": 0.00017882914622878942, "epoch": 19.114536788799523, "percentage": 95.57, "elapsed_time": "7:56:04", "remaining_time": "0:22:03", "throughput": 2608.66, "total_tokens": 74515936} +{"current_steps": 128340, "total_steps": 134280, "loss": 0.8082, "lr": 0.00017852911507637513, "epoch": 19.115281501340483, "percentage": 95.58, "elapsed_time": "7:56:05", "remaining_time": "0:22:02", "throughput": 2608.66, "total_tokens": 74518816} +{"current_steps": 128345, "total_steps": 134280, "loss": 0.8361, "lr": 0.00017822933431764498, "epoch": 19.11602621388144, "percentage": 95.58, "elapsed_time": "7:56:06", "remaining_time": "0:22:01", "throughput": 2608.66, "total_tokens": 74521472} +{"current_steps": 128350, "total_steps": 134280, "loss": 0.7928, "lr": 0.00017792980395766822, "epoch": 19.1167709264224, "percentage": 95.58, "elapsed_time": "7:56:08", "remaining_time": "0:21:59", "throughput": 2608.66, "total_tokens": 74524352} +{"current_steps": 128355, "total_steps": 134280, "loss": 0.7933, "lr": 0.00017763052400150247, "epoch": 19.11751563896336, "percentage": 95.59, "elapsed_time": "7:56:09", "remaining_time": "0:21:58", "throughput": 2608.67, "total_tokens": 74527264} +{"current_steps": 128360, "total_steps": 134280, "loss": 0.8001, "lr": 0.0001773314944542037, "epoch": 19.11826035150432, "percentage": 95.59, "elapsed_time": "7:56:10", "remaining_time": "0:21:57", "throughput": 2608.67, "total_tokens": 74529952} +{"current_steps": 128365, "total_steps": 134280, "loss": 0.7926, "lr": 0.00017703271532082453, "epoch": 19.11900506404528, "percentage": 95.6, "elapsed_time": "7:56:11", "remaining_time": "0:21:56", "throughput": 2608.68, "total_tokens": 74532896} +{"current_steps": 128370, "total_steps": 134280, "loss": 0.8039, "lr": 0.00017673418660641094, "epoch": 19.11974977658624, "percentage": 95.6, "elapsed_time": "7:56:12", "remaining_time": "0:21:55", "throughput": 2608.68, "total_tokens": 74535872} +{"current_steps": 128375, "total_steps": 134280, "loss": 0.7992, "lr": 0.00017643590831600885, "epoch": 19.120494489127196, "percentage": 95.6, "elapsed_time": "7:56:13", "remaining_time": "0:21:54", "throughput": 2608.69, "total_tokens": 74538912} +{"current_steps": 128380, "total_steps": 134280, "loss": 0.7981, "lr": 0.00017613788045465594, "epoch": 19.121239201668157, "percentage": 95.61, "elapsed_time": "7:56:14", "remaining_time": "0:21:53", "throughput": 2608.69, "total_tokens": 74541760} +{"current_steps": 128385, "total_steps": 134280, "loss": 0.8015, "lr": 0.0001758401030273865, "epoch": 19.121983914209114, "percentage": 95.61, "elapsed_time": "7:56:15", "remaining_time": "0:21:52", "throughput": 2608.7, "total_tokens": 74544896} +{"current_steps": 128390, "total_steps": 134280, "loss": 0.7834, "lr": 0.0001755425760392315, "epoch": 19.122728626750074, "percentage": 95.61, "elapsed_time": "7:56:16", "remaining_time": "0:21:50", "throughput": 2608.71, "total_tokens": 74547616} +{"current_steps": 128395, "total_steps": 134280, "loss": 0.7976, "lr": 0.00017524529949522027, "epoch": 19.123473339291035, "percentage": 95.62, "elapsed_time": "7:56:17", "remaining_time": "0:21:49", "throughput": 2608.71, "total_tokens": 74550432} +{"current_steps": 128400, "total_steps": 134280, "loss": 0.795, "lr": 0.00017494827340037045, "epoch": 19.124218051831992, "percentage": 95.62, "elapsed_time": "7:56:18", "remaining_time": "0:21:48", "throughput": 2608.71, "total_tokens": 74553408} +{"current_steps": 128405, "total_steps": 134280, "loss": 0.7911, "lr": 0.000174651497759703, "epoch": 19.124962764372953, "percentage": 95.62, "elapsed_time": "7:56:19", "remaining_time": "0:21:47", "throughput": 2608.72, "total_tokens": 74556480} +{"current_steps": 128410, "total_steps": 134280, "loss": 0.8006, "lr": 0.00017435497257823062, "epoch": 19.12570747691391, "percentage": 95.63, "elapsed_time": "7:56:20", "remaining_time": "0:21:46", "throughput": 2608.73, "total_tokens": 74559296} +{"current_steps": 128415, "total_steps": 134280, "loss": 0.8229, "lr": 0.00017405869786096261, "epoch": 19.12645218945487, "percentage": 95.63, "elapsed_time": "7:56:21", "remaining_time": "0:21:45", "throughput": 2608.74, "total_tokens": 74562400} +{"current_steps": 128420, "total_steps": 134280, "loss": 0.7762, "lr": 0.00017376267361290498, "epoch": 19.12719690199583, "percentage": 95.64, "elapsed_time": "7:56:22", "remaining_time": "0:21:44", "throughput": 2608.74, "total_tokens": 74565344} +{"current_steps": 128425, "total_steps": 134280, "loss": 0.8204, "lr": 0.00017346689983905705, "epoch": 19.127941614536788, "percentage": 95.64, "elapsed_time": "7:56:23", "remaining_time": "0:21:43", "throughput": 2608.75, "total_tokens": 74568320} +{"current_steps": 128430, "total_steps": 134280, "loss": 0.809, "lr": 0.00017317137654441816, "epoch": 19.128686327077748, "percentage": 95.64, "elapsed_time": "7:56:25", "remaining_time": "0:21:42", "throughput": 2608.75, "total_tokens": 74571296} +{"current_steps": 128435, "total_steps": 134280, "loss": 0.7712, "lr": 0.0001728761037339793, "epoch": 19.12943103961871, "percentage": 95.65, "elapsed_time": "7:56:26", "remaining_time": "0:21:40", "throughput": 2608.76, "total_tokens": 74574240} +{"current_steps": 128440, "total_steps": 134280, "loss": 0.8091, "lr": 0.0001725810814127282, "epoch": 19.130175752159666, "percentage": 95.65, "elapsed_time": "7:56:27", "remaining_time": "0:21:39", "throughput": 2608.76, "total_tokens": 74576992} +{"current_steps": 128445, "total_steps": 134280, "loss": 0.8158, "lr": 0.00017228630958564917, "epoch": 19.130920464700626, "percentage": 95.65, "elapsed_time": "7:56:28", "remaining_time": "0:21:38", "throughput": 2608.76, "total_tokens": 74579808} +{"current_steps": 128450, "total_steps": 134280, "loss": 0.7944, "lr": 0.0001719917882577232, "epoch": 19.131665177241583, "percentage": 95.66, "elapsed_time": "7:56:29", "remaining_time": "0:21:37", "throughput": 2608.77, "total_tokens": 74582784} +{"current_steps": 128455, "total_steps": 134280, "loss": 0.7933, "lr": 0.00017169751743392636, "epoch": 19.132409889782544, "percentage": 95.66, "elapsed_time": "7:56:30", "remaining_time": "0:21:36", "throughput": 2608.77, "total_tokens": 74585632} +{"current_steps": 128460, "total_steps": 134280, "loss": 0.8119, "lr": 0.00017140349711922964, "epoch": 19.133154602323504, "percentage": 95.67, "elapsed_time": "7:56:31", "remaining_time": "0:21:35", "throughput": 2608.77, "total_tokens": 74588288} +{"current_steps": 128465, "total_steps": 134280, "loss": 0.7956, "lr": 0.00017110972731859908, "epoch": 19.13389931486446, "percentage": 95.67, "elapsed_time": "7:56:32", "remaining_time": "0:21:34", "throughput": 2608.78, "total_tokens": 74591424} +{"current_steps": 128470, "total_steps": 134280, "loss": 0.7986, "lr": 0.00017081620803699736, "epoch": 19.13464402740542, "percentage": 95.67, "elapsed_time": "7:56:33", "remaining_time": "0:21:33", "throughput": 2608.79, "total_tokens": 74594368} +{"current_steps": 128475, "total_steps": 134280, "loss": 0.7878, "lr": 0.00017052293927938554, "epoch": 19.135388739946382, "percentage": 95.68, "elapsed_time": "7:56:34", "remaining_time": "0:21:32", "throughput": 2608.79, "total_tokens": 74597056} +{"current_steps": 128480, "total_steps": 134280, "loss": 0.8242, "lr": 0.0001702299210507163, "epoch": 19.13613345248734, "percentage": 95.68, "elapsed_time": "7:56:35", "remaining_time": "0:21:30", "throughput": 2608.8, "total_tokens": 74600000} +{"current_steps": 128485, "total_steps": 134280, "loss": 0.8113, "lr": 0.00016993715335593905, "epoch": 19.1368781650283, "percentage": 95.68, "elapsed_time": "7:56:36", "remaining_time": "0:21:29", "throughput": 2608.8, "total_tokens": 74602944} +{"current_steps": 128490, "total_steps": 134280, "loss": 0.7895, "lr": 0.00016964463620000312, "epoch": 19.137622877569257, "percentage": 95.69, "elapsed_time": "7:56:37", "remaining_time": "0:21:28", "throughput": 2608.81, "total_tokens": 74605760} +{"current_steps": 128495, "total_steps": 134280, "loss": 0.7923, "lr": 0.00016935236958784628, "epoch": 19.138367590110217, "percentage": 95.69, "elapsed_time": "7:56:38", "remaining_time": "0:21:27", "throughput": 2608.81, "total_tokens": 74608800} +{"current_steps": 128500, "total_steps": 134280, "loss": 0.7943, "lr": 0.00016906035352440784, "epoch": 19.139112302651178, "percentage": 95.7, "elapsed_time": "7:56:39", "remaining_time": "0:21:26", "throughput": 2608.82, "total_tokens": 74611648} +{"current_steps": 128505, "total_steps": 134280, "loss": 0.807, "lr": 0.00016876858801462223, "epoch": 19.139857015192135, "percentage": 95.7, "elapsed_time": "7:56:40", "remaining_time": "0:21:25", "throughput": 2608.83, "total_tokens": 74614720} +{"current_steps": 128510, "total_steps": 134280, "loss": 0.8162, "lr": 0.00016847707306341718, "epoch": 19.140601727733095, "percentage": 95.7, "elapsed_time": "7:56:41", "remaining_time": "0:21:24", "throughput": 2608.83, "total_tokens": 74617696} +{"current_steps": 128515, "total_steps": 134280, "loss": 0.8045, "lr": 0.00016818580867571873, "epoch": 19.141346440274056, "percentage": 95.71, "elapsed_time": "7:56:43", "remaining_time": "0:21:23", "throughput": 2608.83, "total_tokens": 74620512} +{"current_steps": 128520, "total_steps": 134280, "loss": 0.7806, "lr": 0.00016789479485644464, "epoch": 19.142091152815013, "percentage": 95.71, "elapsed_time": "7:56:44", "remaining_time": "0:21:21", "throughput": 2608.84, "total_tokens": 74623424} +{"current_steps": 128525, "total_steps": 134280, "loss": 0.8044, "lr": 0.00016760403161051595, "epoch": 19.142835865355973, "percentage": 95.71, "elapsed_time": "7:56:45", "remaining_time": "0:21:20", "throughput": 2608.84, "total_tokens": 74626272} +{"current_steps": 128530, "total_steps": 134280, "loss": 0.814, "lr": 0.00016731351894283875, "epoch": 19.14358057789693, "percentage": 95.72, "elapsed_time": "7:56:46", "remaining_time": "0:21:19", "throughput": 2608.84, "total_tokens": 74628960} +{"current_steps": 128535, "total_steps": 134280, "loss": 0.8052, "lr": 0.00016702325685832742, "epoch": 19.14432529043789, "percentage": 95.72, "elapsed_time": "7:56:47", "remaining_time": "0:21:18", "throughput": 2608.85, "total_tokens": 74631936} +{"current_steps": 128540, "total_steps": 134280, "loss": 0.7944, "lr": 0.00016673324536188138, "epoch": 19.14507000297885, "percentage": 95.73, "elapsed_time": "7:56:48", "remaining_time": "0:21:17", "throughput": 2608.86, "total_tokens": 74634976} +{"current_steps": 128545, "total_steps": 134280, "loss": 0.7974, "lr": 0.00016644348445840173, "epoch": 19.14581471551981, "percentage": 95.73, "elapsed_time": "7:56:49", "remaining_time": "0:21:16", "throughput": 2608.86, "total_tokens": 74637888} +{"current_steps": 128550, "total_steps": 134280, "loss": 0.7972, "lr": 0.00016615397415278287, "epoch": 19.14655942806077, "percentage": 95.73, "elapsed_time": "7:56:50", "remaining_time": "0:21:15", "throughput": 2608.87, "total_tokens": 74640768} +{"current_steps": 128555, "total_steps": 134280, "loss": 0.798, "lr": 0.00016586471444991757, "epoch": 19.14730414060173, "percentage": 95.74, "elapsed_time": "7:56:51", "remaining_time": "0:21:14", "throughput": 2608.87, "total_tokens": 74643648} +{"current_steps": 128560, "total_steps": 134280, "loss": 0.797, "lr": 0.00016557570535469024, "epoch": 19.148048853142686, "percentage": 95.74, "elapsed_time": "7:56:52", "remaining_time": "0:21:13", "throughput": 2608.88, "total_tokens": 74646720} +{"current_steps": 128565, "total_steps": 134280, "loss": 0.7935, "lr": 0.00016528694687198363, "epoch": 19.148793565683647, "percentage": 95.74, "elapsed_time": "7:56:53", "remaining_time": "0:21:11", "throughput": 2608.88, "total_tokens": 74649312} +{"current_steps": 128570, "total_steps": 134280, "loss": 0.8174, "lr": 0.0001649984390066772, "epoch": 19.149538278224604, "percentage": 95.75, "elapsed_time": "7:56:54", "remaining_time": "0:21:10", "throughput": 2608.89, "total_tokens": 74652256} +{"current_steps": 128575, "total_steps": 134280, "loss": 0.7764, "lr": 0.0001647101817636437, "epoch": 19.150282990765565, "percentage": 95.75, "elapsed_time": "7:56:55", "remaining_time": "0:21:09", "throughput": 2608.89, "total_tokens": 74654976} +{"current_steps": 128580, "total_steps": 134280, "loss": 0.8051, "lr": 0.00016442217514775424, "epoch": 19.151027703306525, "percentage": 95.76, "elapsed_time": "7:56:56", "remaining_time": "0:21:08", "throughput": 2608.9, "total_tokens": 74657856} +{"current_steps": 128585, "total_steps": 134280, "loss": 0.8122, "lr": 0.00016413441916387494, "epoch": 19.151772415847482, "percentage": 95.76, "elapsed_time": "7:56:57", "remaining_time": "0:21:07", "throughput": 2608.9, "total_tokens": 74660832} +{"current_steps": 128590, "total_steps": 134280, "loss": 0.7799, "lr": 0.0001638469138168652, "epoch": 19.152517128388443, "percentage": 95.76, "elapsed_time": "7:56:58", "remaining_time": "0:21:06", "throughput": 2608.9, "total_tokens": 74663488} +{"current_steps": 128595, "total_steps": 134280, "loss": 0.8063, "lr": 0.00016355965911158288, "epoch": 19.1532618409294, "percentage": 95.77, "elapsed_time": "7:56:59", "remaining_time": "0:21:05", "throughput": 2608.91, "total_tokens": 74666432} +{"current_steps": 128600, "total_steps": 134280, "loss": 0.7942, "lr": 0.00016327265505288068, "epoch": 19.15400655347036, "percentage": 95.77, "elapsed_time": "7:57:00", "remaining_time": "0:21:04", "throughput": 2608.91, "total_tokens": 74669184} +{"current_steps": 128605, "total_steps": 134280, "loss": 0.7974, "lr": 0.00016298590164560978, "epoch": 19.15475126601132, "percentage": 95.77, "elapsed_time": "7:57:01", "remaining_time": "0:21:03", "throughput": 2608.91, "total_tokens": 74671968} +{"current_steps": 128610, "total_steps": 134280, "loss": 0.8111, "lr": 0.0001626993988946096, "epoch": 19.155495978552278, "percentage": 95.78, "elapsed_time": "7:57:02", "remaining_time": "0:21:01", "throughput": 2608.91, "total_tokens": 74674816} +{"current_steps": 128615, "total_steps": 134280, "loss": 0.7904, "lr": 0.00016241314680472463, "epoch": 19.156240691093238, "percentage": 95.78, "elapsed_time": "7:57:04", "remaining_time": "0:21:00", "throughput": 2608.92, "total_tokens": 74677728} +{"current_steps": 128620, "total_steps": 134280, "loss": 0.7901, "lr": 0.0001621271453807893, "epoch": 19.1569854036342, "percentage": 95.78, "elapsed_time": "7:57:05", "remaining_time": "0:20:59", "throughput": 2608.92, "total_tokens": 74680672} +{"current_steps": 128625, "total_steps": 134280, "loss": 0.8083, "lr": 0.00016184139462763647, "epoch": 19.157730116175156, "percentage": 95.79, "elapsed_time": "7:57:06", "remaining_time": "0:20:58", "throughput": 2608.93, "total_tokens": 74683584} +{"current_steps": 128630, "total_steps": 134280, "loss": 0.7842, "lr": 0.00016155589455009054, "epoch": 19.158474828716116, "percentage": 95.79, "elapsed_time": "7:57:07", "remaining_time": "0:20:57", "throughput": 2608.93, "total_tokens": 74686368} +{"current_steps": 128635, "total_steps": 134280, "loss": 0.8035, "lr": 0.00016127064515297773, "epoch": 19.159219541257073, "percentage": 95.8, "elapsed_time": "7:57:08", "remaining_time": "0:20:56", "throughput": 2608.93, "total_tokens": 74688992} +{"current_steps": 128640, "total_steps": 134280, "loss": 0.8193, "lr": 0.0001609856464411158, "epoch": 19.159964253798034, "percentage": 95.8, "elapsed_time": "7:57:09", "remaining_time": "0:20:55", "throughput": 2608.94, "total_tokens": 74691904} +{"current_steps": 128645, "total_steps": 134280, "loss": 0.7972, "lr": 0.00016070089841931757, "epoch": 19.160708966338994, "percentage": 95.8, "elapsed_time": "7:57:10", "remaining_time": "0:20:54", "throughput": 2608.94, "total_tokens": 74694848} +{"current_steps": 128650, "total_steps": 134280, "loss": 0.8342, "lr": 0.00016041640109239918, "epoch": 19.16145367887995, "percentage": 95.81, "elapsed_time": "7:57:11", "remaining_time": "0:20:52", "throughput": 2608.95, "total_tokens": 74697952} +{"current_steps": 128655, "total_steps": 134280, "loss": 0.8265, "lr": 0.00016013215446516015, "epoch": 19.16219839142091, "percentage": 95.81, "elapsed_time": "7:57:12", "remaining_time": "0:20:51", "throughput": 2608.95, "total_tokens": 74700736} +{"current_steps": 128660, "total_steps": 134280, "loss": 0.8066, "lr": 0.0001598481585424083, "epoch": 19.162943103961872, "percentage": 95.81, "elapsed_time": "7:57:13", "remaining_time": "0:20:50", "throughput": 2608.95, "total_tokens": 74703520} +{"current_steps": 128665, "total_steps": 134280, "loss": 0.7938, "lr": 0.00015956441332893643, "epoch": 19.16368781650283, "percentage": 95.82, "elapsed_time": "7:57:14", "remaining_time": "0:20:49", "throughput": 2608.96, "total_tokens": 74706336} +{"current_steps": 128670, "total_steps": 134280, "loss": 0.7916, "lr": 0.00015928091882954243, "epoch": 19.16443252904379, "percentage": 95.82, "elapsed_time": "7:57:15", "remaining_time": "0:20:48", "throughput": 2608.96, "total_tokens": 74709088} +{"current_steps": 128675, "total_steps": 134280, "loss": 0.7966, "lr": 0.00015899767504901408, "epoch": 19.165177241584747, "percentage": 95.83, "elapsed_time": "7:57:16", "remaining_time": "0:20:47", "throughput": 2608.97, "total_tokens": 74712224} +{"current_steps": 128680, "total_steps": 134280, "loss": 0.8019, "lr": 0.0001587146819921359, "epoch": 19.165921954125707, "percentage": 95.83, "elapsed_time": "7:57:17", "remaining_time": "0:20:46", "throughput": 2608.97, "total_tokens": 74715200} +{"current_steps": 128685, "total_steps": 134280, "loss": 0.7838, "lr": 0.00015843193966368906, "epoch": 19.166666666666668, "percentage": 95.83, "elapsed_time": "7:57:18", "remaining_time": "0:20:45", "throughput": 2608.98, "total_tokens": 74718176} +{"current_steps": 128690, "total_steps": 134280, "loss": 0.8092, "lr": 0.00015814944806845143, "epoch": 19.167411379207625, "percentage": 95.84, "elapsed_time": "7:57:19", "remaining_time": "0:20:44", "throughput": 2608.98, "total_tokens": 74720928} +{"current_steps": 128695, "total_steps": 134280, "loss": 0.8068, "lr": 0.00015786720721119252, "epoch": 19.168156091748585, "percentage": 95.84, "elapsed_time": "7:57:20", "remaining_time": "0:20:42", "throughput": 2608.99, "total_tokens": 74723936} +{"current_steps": 128700, "total_steps": 134280, "loss": 0.7948, "lr": 0.0001575852170966835, "epoch": 19.168900804289546, "percentage": 95.84, "elapsed_time": "7:57:21", "remaining_time": "0:20:41", "throughput": 2609.0, "total_tokens": 74726784} +{"current_steps": 128705, "total_steps": 134280, "loss": 0.8148, "lr": 0.0001573034777296872, "epoch": 19.169645516830503, "percentage": 95.85, "elapsed_time": "7:57:22", "remaining_time": "0:20:40", "throughput": 2609.0, "total_tokens": 74729408} +{"current_steps": 128710, "total_steps": 134280, "loss": 0.8254, "lr": 0.00015702198911496157, "epoch": 19.170390229371463, "percentage": 95.85, "elapsed_time": "7:57:24", "remaining_time": "0:20:39", "throughput": 2609.01, "total_tokens": 74732640} +{"current_steps": 128715, "total_steps": 134280, "loss": 0.7913, "lr": 0.00015674075125726437, "epoch": 19.17113494191242, "percentage": 95.86, "elapsed_time": "7:57:25", "remaining_time": "0:20:38", "throughput": 2609.01, "total_tokens": 74735296} +{"current_steps": 128720, "total_steps": 134280, "loss": 0.8031, "lr": 0.00015645976416134687, "epoch": 19.17187965445338, "percentage": 95.86, "elapsed_time": "7:57:26", "remaining_time": "0:20:37", "throughput": 2609.01, "total_tokens": 74738112} +{"current_steps": 128725, "total_steps": 134280, "loss": 0.8035, "lr": 0.00015617902783195524, "epoch": 19.17262436699434, "percentage": 95.86, "elapsed_time": "7:57:27", "remaining_time": "0:20:36", "throughput": 2609.01, "total_tokens": 74740864} +{"current_steps": 128730, "total_steps": 134280, "loss": 0.8023, "lr": 0.00015589854227383238, "epoch": 19.1733690795353, "percentage": 95.87, "elapsed_time": "7:57:28", "remaining_time": "0:20:35", "throughput": 2609.01, "total_tokens": 74743520} +{"current_steps": 128735, "total_steps": 134280, "loss": 0.7863, "lr": 0.00015561830749171612, "epoch": 19.17411379207626, "percentage": 95.87, "elapsed_time": "7:57:29", "remaining_time": "0:20:34", "throughput": 2609.02, "total_tokens": 74746400} +{"current_steps": 128740, "total_steps": 134280, "loss": 0.7936, "lr": 0.00015533832349034105, "epoch": 19.17485850461722, "percentage": 95.87, "elapsed_time": "7:57:30", "remaining_time": "0:20:32", "throughput": 2609.02, "total_tokens": 74749280} +{"current_steps": 128745, "total_steps": 134280, "loss": 0.7776, "lr": 0.00015505859027443834, "epoch": 19.175603217158177, "percentage": 95.88, "elapsed_time": "7:57:31", "remaining_time": "0:20:31", "throughput": 2609.02, "total_tokens": 74752192} +{"current_steps": 128750, "total_steps": 134280, "loss": 0.8084, "lr": 0.00015477910784873427, "epoch": 19.176347929699137, "percentage": 95.88, "elapsed_time": "7:57:32", "remaining_time": "0:20:30", "throughput": 2609.03, "total_tokens": 74755360} +{"current_steps": 128755, "total_steps": 134280, "loss": 0.8093, "lr": 0.0001544998762179467, "epoch": 19.177092642240094, "percentage": 95.89, "elapsed_time": "7:57:33", "remaining_time": "0:20:29", "throughput": 2609.04, "total_tokens": 74758304} +{"current_steps": 128760, "total_steps": 134280, "loss": 0.8136, "lr": 0.00015422089538679685, "epoch": 19.177837354781055, "percentage": 95.89, "elapsed_time": "7:57:34", "remaining_time": "0:20:28", "throughput": 2609.06, "total_tokens": 74761856} +{"current_steps": 128765, "total_steps": 134280, "loss": 0.7974, "lr": 0.00015394216535999594, "epoch": 19.178582067322015, "percentage": 95.89, "elapsed_time": "7:57:35", "remaining_time": "0:20:27", "throughput": 2609.07, "total_tokens": 74764864} +{"current_steps": 128770, "total_steps": 134280, "loss": 0.7901, "lr": 0.00015366368614225356, "epoch": 19.179326779862972, "percentage": 95.9, "elapsed_time": "7:57:36", "remaining_time": "0:20:26", "throughput": 2609.07, "total_tokens": 74767488} +{"current_steps": 128775, "total_steps": 134280, "loss": 0.8021, "lr": 0.00015338545773827428, "epoch": 19.180071492403933, "percentage": 95.9, "elapsed_time": "7:57:37", "remaining_time": "0:20:25", "throughput": 2609.07, "total_tokens": 74770368} +{"current_steps": 128780, "total_steps": 134280, "loss": 0.8021, "lr": 0.00015310748015275765, "epoch": 19.18081620494489, "percentage": 95.9, "elapsed_time": "7:57:38", "remaining_time": "0:20:23", "throughput": 2609.07, "total_tokens": 74773120} +{"current_steps": 128785, "total_steps": 134280, "loss": 0.788, "lr": 0.0001528297533904016, "epoch": 19.18156091748585, "percentage": 95.91, "elapsed_time": "7:57:39", "remaining_time": "0:20:22", "throughput": 2609.08, "total_tokens": 74776000} +{"current_steps": 128790, "total_steps": 134280, "loss": 0.8082, "lr": 0.00015255227745589406, "epoch": 19.18230563002681, "percentage": 95.91, "elapsed_time": "7:57:40", "remaining_time": "0:20:21", "throughput": 2609.08, "total_tokens": 74778720} +{"current_steps": 128795, "total_steps": 134280, "loss": 0.7885, "lr": 0.00015227505235392792, "epoch": 19.183050342567768, "percentage": 95.92, "elapsed_time": "7:57:42", "remaining_time": "0:20:20", "throughput": 2609.09, "total_tokens": 74781824} +{"current_steps": 128800, "total_steps": 134280, "loss": 0.796, "lr": 0.0001519980780891844, "epoch": 19.183795055108728, "percentage": 95.92, "elapsed_time": "7:57:43", "remaining_time": "0:20:19", "throughput": 2609.09, "total_tokens": 74784800} +{"current_steps": 128805, "total_steps": 134280, "loss": 0.7813, "lr": 0.0001517213546663415, "epoch": 19.18453976764969, "percentage": 95.92, "elapsed_time": "7:57:44", "remaining_time": "0:20:18", "throughput": 2609.1, "total_tokens": 74787872} +{"current_steps": 128810, "total_steps": 134280, "loss": 0.7794, "lr": 0.00015144488209007544, "epoch": 19.185284480190646, "percentage": 95.93, "elapsed_time": "7:57:45", "remaining_time": "0:20:17", "throughput": 2609.1, "total_tokens": 74790496} +{"current_steps": 128815, "total_steps": 134280, "loss": 0.8014, "lr": 0.00015116866036505748, "epoch": 19.186029192731606, "percentage": 95.93, "elapsed_time": "7:57:46", "remaining_time": "0:20:16", "throughput": 2609.1, "total_tokens": 74793120} +{"current_steps": 128820, "total_steps": 134280, "loss": 0.794, "lr": 0.00015089268949595392, "epoch": 19.186773905272563, "percentage": 95.93, "elapsed_time": "7:57:47", "remaining_time": "0:20:15", "throughput": 2609.1, "total_tokens": 74795808} +{"current_steps": 128825, "total_steps": 134280, "loss": 0.8031, "lr": 0.0001506169694874243, "epoch": 19.187518617813524, "percentage": 95.94, "elapsed_time": "7:57:48", "remaining_time": "0:20:13", "throughput": 2609.11, "total_tokens": 74798688} +{"current_steps": 128830, "total_steps": 134280, "loss": 0.8012, "lr": 0.00015034150034412997, "epoch": 19.188263330354484, "percentage": 95.94, "elapsed_time": "7:57:49", "remaining_time": "0:20:12", "throughput": 2609.1, "total_tokens": 74801248} +{"current_steps": 128835, "total_steps": 134280, "loss": 0.783, "lr": 0.00015006628207072214, "epoch": 19.18900804289544, "percentage": 95.95, "elapsed_time": "7:57:50", "remaining_time": "0:20:11", "throughput": 2609.1, "total_tokens": 74803936} +{"current_steps": 128840, "total_steps": 134280, "loss": 0.8133, "lr": 0.0001497913146718538, "epoch": 19.189752755436402, "percentage": 95.95, "elapsed_time": "7:57:51", "remaining_time": "0:20:10", "throughput": 2609.11, "total_tokens": 74807008} +{"current_steps": 128845, "total_steps": 134280, "loss": 0.7861, "lr": 0.0001495165981521662, "epoch": 19.190497467977362, "percentage": 95.95, "elapsed_time": "7:57:52", "remaining_time": "0:20:09", "throughput": 2609.12, "total_tokens": 74809952} +{"current_steps": 128850, "total_steps": 134280, "loss": 0.7878, "lr": 0.00014924213251630235, "epoch": 19.19124218051832, "percentage": 95.96, "elapsed_time": "7:57:53", "remaining_time": "0:20:08", "throughput": 2609.12, "total_tokens": 74813024} +{"current_steps": 128855, "total_steps": 134280, "loss": 0.8017, "lr": 0.00014896791776890017, "epoch": 19.19198689305928, "percentage": 95.96, "elapsed_time": "7:57:54", "remaining_time": "0:20:07", "throughput": 2609.13, "total_tokens": 74816032} +{"current_steps": 128860, "total_steps": 134280, "loss": 0.7955, "lr": 0.00014869395391459093, "epoch": 19.192731605600237, "percentage": 95.96, "elapsed_time": "7:57:55", "remaining_time": "0:20:06", "throughput": 2609.14, "total_tokens": 74819200} +{"current_steps": 128865, "total_steps": 134280, "loss": 0.7809, "lr": 0.00014842024095800265, "epoch": 19.193476318141197, "percentage": 95.97, "elapsed_time": "7:57:56", "remaining_time": "0:20:05", "throughput": 2609.14, "total_tokens": 74821888} +{"current_steps": 128870, "total_steps": 134280, "loss": 0.7868, "lr": 0.00014814677890375992, "epoch": 19.194221030682158, "percentage": 95.97, "elapsed_time": "7:57:58", "remaining_time": "0:20:03", "throughput": 2609.17, "total_tokens": 74825952} +{"current_steps": 128875, "total_steps": 134280, "loss": 0.7959, "lr": 0.0001478735677564824, "epoch": 19.194965743223115, "percentage": 95.97, "elapsed_time": "7:57:59", "remaining_time": "0:20:02", "throughput": 2609.17, "total_tokens": 74828896} +{"current_steps": 128880, "total_steps": 134280, "loss": 0.806, "lr": 0.00014760060752078808, "epoch": 19.195710455764075, "percentage": 95.98, "elapsed_time": "7:58:00", "remaining_time": "0:20:01", "throughput": 2609.17, "total_tokens": 74831648} +{"current_steps": 128885, "total_steps": 134280, "loss": 0.8071, "lr": 0.00014732789820128488, "epoch": 19.196455168305036, "percentage": 95.98, "elapsed_time": "7:58:01", "remaining_time": "0:20:00", "throughput": 2609.18, "total_tokens": 74834592} +{"current_steps": 128890, "total_steps": 134280, "loss": 0.7814, "lr": 0.00014705543980258085, "epoch": 19.197199880845993, "percentage": 95.99, "elapsed_time": "7:58:02", "remaining_time": "0:19:59", "throughput": 2609.19, "total_tokens": 74837504} +{"current_steps": 128895, "total_steps": 134280, "loss": 0.7638, "lr": 0.0001467832323292789, "epoch": 19.197944593386953, "percentage": 95.99, "elapsed_time": "7:58:03", "remaining_time": "0:19:58", "throughput": 2609.19, "total_tokens": 74840352} +{"current_steps": 128900, "total_steps": 134280, "loss": 0.7925, "lr": 0.00014651127578597876, "epoch": 19.19868930592791, "percentage": 95.99, "elapsed_time": "7:58:04", "remaining_time": "0:19:57", "throughput": 2609.2, "total_tokens": 74843456} +{"current_steps": 128905, "total_steps": 134280, "loss": 0.8455, "lr": 0.0001462395701772734, "epoch": 19.19943401846887, "percentage": 96.0, "elapsed_time": "7:58:05", "remaining_time": "0:19:56", "throughput": 2609.2, "total_tokens": 74846240} +{"current_steps": 128910, "total_steps": 134280, "loss": 0.7873, "lr": 0.00014596811550775411, "epoch": 19.20017873100983, "percentage": 96.0, "elapsed_time": "7:58:06", "remaining_time": "0:19:54", "throughput": 2609.21, "total_tokens": 74849184} +{"current_steps": 128915, "total_steps": 134280, "loss": 0.8201, "lr": 0.00014569691178200727, "epoch": 19.20092344355079, "percentage": 96.0, "elapsed_time": "7:58:07", "remaining_time": "0:19:53", "throughput": 2609.21, "total_tokens": 74852160} +{"current_steps": 128920, "total_steps": 134280, "loss": 0.8406, "lr": 0.0001454259590046142, "epoch": 19.20166815609175, "percentage": 96.01, "elapsed_time": "7:58:08", "remaining_time": "0:19:52", "throughput": 2609.22, "total_tokens": 74855136} +{"current_steps": 128925, "total_steps": 134280, "loss": 0.7838, "lr": 0.0001451552571801512, "epoch": 19.202412868632706, "percentage": 96.01, "elapsed_time": "7:58:09", "remaining_time": "0:19:51", "throughput": 2609.23, "total_tokens": 74858272} +{"current_steps": 128930, "total_steps": 134280, "loss": 0.7904, "lr": 0.00014488480631319134, "epoch": 19.203157581173667, "percentage": 96.02, "elapsed_time": "7:58:10", "remaining_time": "0:19:50", "throughput": 2609.24, "total_tokens": 74861440} +{"current_steps": 128935, "total_steps": 134280, "loss": 0.8275, "lr": 0.00014461460640830592, "epoch": 19.203902293714627, "percentage": 96.02, "elapsed_time": "7:58:11", "remaining_time": "0:19:49", "throughput": 2609.24, "total_tokens": 74864160} +{"current_steps": 128940, "total_steps": 134280, "loss": 0.7898, "lr": 0.00014434465747005797, "epoch": 19.204647006255584, "percentage": 96.02, "elapsed_time": "7:58:12", "remaining_time": "0:19:48", "throughput": 2609.24, "total_tokens": 74866976} +{"current_steps": 128945, "total_steps": 134280, "loss": 0.8023, "lr": 0.00014407495950300884, "epoch": 19.205391718796545, "percentage": 96.03, "elapsed_time": "7:58:14", "remaining_time": "0:19:47", "throughput": 2609.24, "total_tokens": 74869664} +{"current_steps": 128950, "total_steps": 134280, "loss": 0.7927, "lr": 0.00014380551251171492, "epoch": 19.206136431337505, "percentage": 96.03, "elapsed_time": "7:58:15", "remaining_time": "0:19:46", "throughput": 2609.24, "total_tokens": 74872480} +{"current_steps": 128955, "total_steps": 134280, "loss": 0.8095, "lr": 0.0001435363165007275, "epoch": 19.206881143878462, "percentage": 96.03, "elapsed_time": "7:58:16", "remaining_time": "0:19:44", "throughput": 2609.25, "total_tokens": 74875232} +{"current_steps": 128960, "total_steps": 134280, "loss": 0.7875, "lr": 0.00014326737147459466, "epoch": 19.207625856419423, "percentage": 96.04, "elapsed_time": "7:58:17", "remaining_time": "0:19:43", "throughput": 2609.25, "total_tokens": 74878080} +{"current_steps": 128965, "total_steps": 134280, "loss": 0.7895, "lr": 0.00014299867743785777, "epoch": 19.20837056896038, "percentage": 96.04, "elapsed_time": "7:58:18", "remaining_time": "0:19:42", "throughput": 2609.26, "total_tokens": 74880992} +{"current_steps": 128970, "total_steps": 134280, "loss": 0.8062, "lr": 0.00014273023439505982, "epoch": 19.20911528150134, "percentage": 96.05, "elapsed_time": "7:58:19", "remaining_time": "0:19:41", "throughput": 2609.27, "total_tokens": 74884288} +{"current_steps": 128975, "total_steps": 134280, "loss": 0.7921, "lr": 0.0001424620423507339, "epoch": 19.2098599940423, "percentage": 96.05, "elapsed_time": "7:58:20", "remaining_time": "0:19:40", "throughput": 2609.27, "total_tokens": 74887008} +{"current_steps": 128980, "total_steps": 134280, "loss": 0.7849, "lr": 0.00014219410130941135, "epoch": 19.210604706583258, "percentage": 96.05, "elapsed_time": "7:58:21", "remaining_time": "0:19:39", "throughput": 2609.27, "total_tokens": 74889856} +{"current_steps": 128985, "total_steps": 134280, "loss": 0.7778, "lr": 0.00014192641127561855, "epoch": 19.21134941912422, "percentage": 96.06, "elapsed_time": "7:58:22", "remaining_time": "0:19:38", "throughput": 2609.27, "total_tokens": 74892544} +{"current_steps": 128990, "total_steps": 134280, "loss": 0.7846, "lr": 0.00014165897225387858, "epoch": 19.21209413166518, "percentage": 96.06, "elapsed_time": "7:58:23", "remaining_time": "0:19:37", "throughput": 2609.28, "total_tokens": 74895360} +{"current_steps": 128995, "total_steps": 134280, "loss": 0.7889, "lr": 0.0001413917842487078, "epoch": 19.212838844206136, "percentage": 96.06, "elapsed_time": "7:58:24", "remaining_time": "0:19:36", "throughput": 2609.28, "total_tokens": 74898240} +{"current_steps": 129000, "total_steps": 134280, "loss": 0.79, "lr": 0.0001411248472646226, "epoch": 19.213583556747096, "percentage": 96.07, "elapsed_time": "7:58:25", "remaining_time": "0:19:34", "throughput": 2609.29, "total_tokens": 74901152} +{"current_steps": 129005, "total_steps": 134280, "loss": 0.7905, "lr": 0.00014085816130613105, "epoch": 19.214328269288053, "percentage": 96.07, "elapsed_time": "7:58:26", "remaining_time": "0:19:33", "throughput": 2609.29, "total_tokens": 74903968} +{"current_steps": 129010, "total_steps": 134280, "loss": 0.7998, "lr": 0.00014059172637773788, "epoch": 19.215072981829014, "percentage": 96.08, "elapsed_time": "7:58:27", "remaining_time": "0:19:32", "throughput": 2609.29, "total_tokens": 74906816} +{"current_steps": 129015, "total_steps": 134280, "loss": 0.7988, "lr": 0.00014032554248394612, "epoch": 19.215817694369974, "percentage": 96.08, "elapsed_time": "7:58:28", "remaining_time": "0:19:31", "throughput": 2609.29, "total_tokens": 74909632} +{"current_steps": 129020, "total_steps": 134280, "loss": 0.7908, "lr": 0.00014005960962925056, "epoch": 19.21656240691093, "percentage": 96.08, "elapsed_time": "7:58:29", "remaining_time": "0:19:30", "throughput": 2609.29, "total_tokens": 74912224} +{"current_steps": 129025, "total_steps": 134280, "loss": 0.7896, "lr": 0.00013979392781814592, "epoch": 19.217307119451892, "percentage": 96.09, "elapsed_time": "7:58:30", "remaining_time": "0:19:29", "throughput": 2609.3, "total_tokens": 74915200} +{"current_steps": 129030, "total_steps": 134280, "loss": 0.7943, "lr": 0.0001395284970551186, "epoch": 19.218051831992852, "percentage": 96.09, "elapsed_time": "7:58:31", "remaining_time": "0:19:28", "throughput": 2609.3, "total_tokens": 74917984} +{"current_steps": 129035, "total_steps": 134280, "loss": 0.7946, "lr": 0.00013926331734465501, "epoch": 19.21879654453381, "percentage": 96.09, "elapsed_time": "7:58:32", "remaining_time": "0:19:27", "throughput": 2609.31, "total_tokens": 74920928} +{"current_steps": 129040, "total_steps": 134280, "loss": 0.8115, "lr": 0.00013899838869123327, "epoch": 19.21954125707477, "percentage": 96.1, "elapsed_time": "7:58:33", "remaining_time": "0:19:26", "throughput": 2609.31, "total_tokens": 74923520} +{"current_steps": 129045, "total_steps": 134280, "loss": 0.782, "lr": 0.00013873371109932974, "epoch": 19.220285969615727, "percentage": 96.1, "elapsed_time": "7:58:35", "remaining_time": "0:19:24", "throughput": 2609.32, "total_tokens": 74926528} +{"current_steps": 129050, "total_steps": 134280, "loss": 0.8154, "lr": 0.0001384692845734159, "epoch": 19.221030682156687, "percentage": 96.11, "elapsed_time": "7:58:36", "remaining_time": "0:19:23", "throughput": 2609.31, "total_tokens": 74929152} +{"current_steps": 129055, "total_steps": 134280, "loss": 0.7981, "lr": 0.00013820510911795813, "epoch": 19.221775394697648, "percentage": 96.11, "elapsed_time": "7:58:37", "remaining_time": "0:19:22", "throughput": 2609.32, "total_tokens": 74932160} +{"current_steps": 129060, "total_steps": 134280, "loss": 0.806, "lr": 0.00013794118473742123, "epoch": 19.222520107238605, "percentage": 96.11, "elapsed_time": "7:58:38", "remaining_time": "0:19:21", "throughput": 2609.32, "total_tokens": 74934688} +{"current_steps": 129065, "total_steps": 134280, "loss": 0.8143, "lr": 0.00013767751143626162, "epoch": 19.223264819779565, "percentage": 96.12, "elapsed_time": "7:58:39", "remaining_time": "0:19:20", "throughput": 2609.33, "total_tokens": 74937568} +{"current_steps": 129070, "total_steps": 134280, "loss": 0.8036, "lr": 0.00013741408921893572, "epoch": 19.224009532320526, "percentage": 96.12, "elapsed_time": "7:58:40", "remaining_time": "0:19:19", "throughput": 2609.34, "total_tokens": 74940864} +{"current_steps": 129075, "total_steps": 134280, "loss": 0.8106, "lr": 0.0001371509180898933, "epoch": 19.224754244861483, "percentage": 96.12, "elapsed_time": "7:58:41", "remaining_time": "0:19:18", "throughput": 2609.34, "total_tokens": 74943776} +{"current_steps": 129080, "total_steps": 134280, "loss": 0.8095, "lr": 0.00013688799805358087, "epoch": 19.225498957402444, "percentage": 96.13, "elapsed_time": "7:58:42", "remaining_time": "0:19:17", "throughput": 2609.35, "total_tokens": 74946592} +{"current_steps": 129085, "total_steps": 134280, "loss": 0.7978, "lr": 0.00013662532911443815, "epoch": 19.2262436699434, "percentage": 96.13, "elapsed_time": "7:58:43", "remaining_time": "0:19:15", "throughput": 2609.36, "total_tokens": 74949696} +{"current_steps": 129090, "total_steps": 134280, "loss": 0.7697, "lr": 0.0001363629112769049, "epoch": 19.22698838248436, "percentage": 96.13, "elapsed_time": "7:58:44", "remaining_time": "0:19:14", "throughput": 2609.36, "total_tokens": 74952512} +{"current_steps": 129095, "total_steps": 134280, "loss": 0.7871, "lr": 0.0001361007445454143, "epoch": 19.22773309502532, "percentage": 96.14, "elapsed_time": "7:58:45", "remaining_time": "0:19:13", "throughput": 2609.36, "total_tokens": 74955296} +{"current_steps": 129100, "total_steps": 134280, "loss": 0.8085, "lr": 0.0001358388289243928, "epoch": 19.22847780756628, "percentage": 96.14, "elapsed_time": "7:58:46", "remaining_time": "0:19:12", "throughput": 2609.36, "total_tokens": 74958208} +{"current_steps": 129105, "total_steps": 134280, "loss": 0.8117, "lr": 0.0001355771644182685, "epoch": 19.22922252010724, "percentage": 96.15, "elapsed_time": "7:58:47", "remaining_time": "0:19:11", "throughput": 2609.37, "total_tokens": 74961056} +{"current_steps": 129110, "total_steps": 134280, "loss": 0.7992, "lr": 0.00013531575103145954, "epoch": 19.229967232648196, "percentage": 96.15, "elapsed_time": "7:58:48", "remaining_time": "0:19:10", "throughput": 2609.38, "total_tokens": 74964064} +{"current_steps": 129115, "total_steps": 134280, "loss": 0.8018, "lr": 0.00013505458876838405, "epoch": 19.230711945189157, "percentage": 96.15, "elapsed_time": "7:58:49", "remaining_time": "0:19:09", "throughput": 2609.38, "total_tokens": 74966848} +{"current_steps": 129120, "total_steps": 134280, "loss": 0.7985, "lr": 0.0001347936776334535, "epoch": 19.231456657730117, "percentage": 96.16, "elapsed_time": "7:58:50", "remaining_time": "0:19:08", "throughput": 2609.38, "total_tokens": 74969664} +{"current_steps": 129125, "total_steps": 134280, "loss": 0.7951, "lr": 0.00013453301763107273, "epoch": 19.232201370271074, "percentage": 96.16, "elapsed_time": "7:58:51", "remaining_time": "0:19:07", "throughput": 2609.38, "total_tokens": 74972384} +{"current_steps": 129130, "total_steps": 134280, "loss": 0.7919, "lr": 0.0001342726087656515, "epoch": 19.232946082812035, "percentage": 96.16, "elapsed_time": "7:58:52", "remaining_time": "0:19:05", "throughput": 2609.39, "total_tokens": 74975360} +{"current_steps": 129135, "total_steps": 134280, "loss": 0.8068, "lr": 0.000134012451041583, "epoch": 19.233690795352995, "percentage": 96.17, "elapsed_time": "7:58:53", "remaining_time": "0:19:04", "throughput": 2609.39, "total_tokens": 74978272} +{"current_steps": 129140, "total_steps": 134280, "loss": 0.807, "lr": 0.000133752544463267, "epoch": 19.234435507893952, "percentage": 96.17, "elapsed_time": "7:58:55", "remaining_time": "0:19:03", "throughput": 2609.4, "total_tokens": 74981088} +{"current_steps": 129145, "total_steps": 134280, "loss": 0.814, "lr": 0.0001334928890350917, "epoch": 19.235180220434913, "percentage": 96.18, "elapsed_time": "7:58:56", "remaining_time": "0:19:02", "throughput": 2609.4, "total_tokens": 74983840} +{"current_steps": 129150, "total_steps": 134280, "loss": 0.801, "lr": 0.0001332334847614436, "epoch": 19.23592493297587, "percentage": 96.18, "elapsed_time": "7:58:57", "remaining_time": "0:19:01", "throughput": 2609.4, "total_tokens": 74986784} +{"current_steps": 129155, "total_steps": 134280, "loss": 0.7979, "lr": 0.00013297433164670747, "epoch": 19.23666964551683, "percentage": 96.18, "elapsed_time": "7:58:58", "remaining_time": "0:19:00", "throughput": 2609.41, "total_tokens": 74989472} +{"current_steps": 129160, "total_steps": 134280, "loss": 0.7987, "lr": 0.00013271542969525818, "epoch": 19.23741435805779, "percentage": 96.19, "elapsed_time": "7:58:59", "remaining_time": "0:18:59", "throughput": 2609.41, "total_tokens": 74992416} +{"current_steps": 129165, "total_steps": 134280, "loss": 0.7949, "lr": 0.00013245677891147222, "epoch": 19.238159070598748, "percentage": 96.19, "elapsed_time": "7:59:00", "remaining_time": "0:18:58", "throughput": 2609.42, "total_tokens": 74995392} +{"current_steps": 129170, "total_steps": 134280, "loss": 0.7922, "lr": 0.00013219837929971778, "epoch": 19.23890378313971, "percentage": 96.19, "elapsed_time": "7:59:01", "remaining_time": "0:18:57", "throughput": 2609.42, "total_tokens": 74998112} +{"current_steps": 129175, "total_steps": 134280, "loss": 0.7865, "lr": 0.00013194023086436133, "epoch": 19.23964849568067, "percentage": 96.2, "elapsed_time": "7:59:02", "remaining_time": "0:18:55", "throughput": 2609.42, "total_tokens": 75001024} +{"current_steps": 129180, "total_steps": 134280, "loss": 0.7955, "lr": 0.00013168233360976277, "epoch": 19.240393208221626, "percentage": 96.2, "elapsed_time": "7:59:03", "remaining_time": "0:18:54", "throughput": 2609.43, "total_tokens": 75004256} +{"current_steps": 129185, "total_steps": 134280, "loss": 0.7797, "lr": 0.00013142468754028024, "epoch": 19.241137920762586, "percentage": 96.21, "elapsed_time": "7:59:04", "remaining_time": "0:18:53", "throughput": 2609.44, "total_tokens": 75007040} +{"current_steps": 129190, "total_steps": 134280, "loss": 0.7867, "lr": 0.00013116729266026528, "epoch": 19.241882633303543, "percentage": 96.21, "elapsed_time": "7:59:05", "remaining_time": "0:18:52", "throughput": 2609.44, "total_tokens": 75009888} +{"current_steps": 129195, "total_steps": 134280, "loss": 0.8038, "lr": 0.0001309101489740677, "epoch": 19.242627345844504, "percentage": 96.21, "elapsed_time": "7:59:06", "remaining_time": "0:18:51", "throughput": 2609.44, "total_tokens": 75012448} +{"current_steps": 129200, "total_steps": 134280, "loss": 0.8028, "lr": 0.00013065325648603076, "epoch": 19.243372058385464, "percentage": 96.22, "elapsed_time": "7:59:07", "remaining_time": "0:18:50", "throughput": 2609.44, "total_tokens": 75015360} +{"current_steps": 129205, "total_steps": 134280, "loss": 0.8018, "lr": 0.00013039661520049427, "epoch": 19.24411677092642, "percentage": 96.22, "elapsed_time": "7:59:08", "remaining_time": "0:18:49", "throughput": 2609.45, "total_tokens": 75018464} +{"current_steps": 129210, "total_steps": 134280, "loss": 0.7961, "lr": 0.0001301402251217948, "epoch": 19.244861483467382, "percentage": 96.22, "elapsed_time": "7:59:09", "remaining_time": "0:18:48", "throughput": 2609.47, "total_tokens": 75021760} +{"current_steps": 129215, "total_steps": 134280, "loss": 0.8046, "lr": 0.00012988408625426217, "epoch": 19.245606196008342, "percentage": 96.23, "elapsed_time": "7:59:10", "remaining_time": "0:18:46", "throughput": 2609.47, "total_tokens": 75024864} +{"current_steps": 129220, "total_steps": 134280, "loss": 0.7812, "lr": 0.00012962819860222463, "epoch": 19.2463509085493, "percentage": 96.23, "elapsed_time": "7:59:11", "remaining_time": "0:18:45", "throughput": 2609.47, "total_tokens": 75027296} +{"current_steps": 129225, "total_steps": 134280, "loss": 0.7727, "lr": 0.00012937256217000537, "epoch": 19.24709562109026, "percentage": 96.24, "elapsed_time": "7:59:12", "remaining_time": "0:18:44", "throughput": 2609.47, "total_tokens": 75030144} +{"current_steps": 129230, "total_steps": 134280, "loss": 0.8139, "lr": 0.00012911717696192427, "epoch": 19.247840333631217, "percentage": 96.24, "elapsed_time": "7:59:14", "remaining_time": "0:18:43", "throughput": 2609.48, "total_tokens": 75033088} +{"current_steps": 129235, "total_steps": 134280, "loss": 0.7939, "lr": 0.0001288620429822912, "epoch": 19.248585046172177, "percentage": 96.24, "elapsed_time": "7:59:15", "remaining_time": "0:18:42", "throughput": 2609.48, "total_tokens": 75035968} +{"current_steps": 129240, "total_steps": 134280, "loss": 0.7785, "lr": 0.00012860716023542273, "epoch": 19.249329758713138, "percentage": 96.25, "elapsed_time": "7:59:16", "remaining_time": "0:18:41", "throughput": 2609.49, "total_tokens": 75038944} +{"current_steps": 129245, "total_steps": 134280, "loss": 0.7943, "lr": 0.00012835252872562042, "epoch": 19.250074471254095, "percentage": 96.25, "elapsed_time": "7:59:17", "remaining_time": "0:18:40", "throughput": 2609.5, "total_tokens": 75041984} +{"current_steps": 129250, "total_steps": 134280, "loss": 0.8077, "lr": 0.0001280981484571858, "epoch": 19.250819183795056, "percentage": 96.25, "elapsed_time": "7:59:18", "remaining_time": "0:18:39", "throughput": 2609.5, "total_tokens": 75044736} +{"current_steps": 129255, "total_steps": 134280, "loss": 0.8036, "lr": 0.00012784401943442047, "epoch": 19.251563896336016, "percentage": 96.26, "elapsed_time": "7:59:19", "remaining_time": "0:18:38", "throughput": 2609.51, "total_tokens": 75047808} +{"current_steps": 129260, "total_steps": 134280, "loss": 0.8073, "lr": 0.00012759014166161263, "epoch": 19.252308608876973, "percentage": 96.26, "elapsed_time": "7:59:20", "remaining_time": "0:18:36", "throughput": 2609.51, "total_tokens": 75050688} +{"current_steps": 129265, "total_steps": 134280, "loss": 0.8086, "lr": 0.00012733651514305555, "epoch": 19.253053321417934, "percentage": 96.27, "elapsed_time": "7:59:21", "remaining_time": "0:18:35", "throughput": 2609.52, "total_tokens": 75053760} +{"current_steps": 129270, "total_steps": 134280, "loss": 0.7939, "lr": 0.00012708313988303078, "epoch": 19.25379803395889, "percentage": 96.27, "elapsed_time": "7:59:22", "remaining_time": "0:18:34", "throughput": 2609.52, "total_tokens": 75056544} +{"current_steps": 129275, "total_steps": 134280, "loss": 0.7955, "lr": 0.00012683001588582155, "epoch": 19.25454274649985, "percentage": 96.27, "elapsed_time": "7:59:23", "remaining_time": "0:18:33", "throughput": 2609.53, "total_tokens": 75059520} +{"current_steps": 129280, "total_steps": 134280, "loss": 0.7926, "lr": 0.0001265771431557028, "epoch": 19.25528745904081, "percentage": 96.28, "elapsed_time": "7:59:24", "remaining_time": "0:18:32", "throughput": 2609.53, "total_tokens": 75062208} +{"current_steps": 129285, "total_steps": 134280, "loss": 0.7783, "lr": 0.00012632452169694607, "epoch": 19.25603217158177, "percentage": 96.28, "elapsed_time": "7:59:25", "remaining_time": "0:18:31", "throughput": 2609.54, "total_tokens": 75065184} +{"current_steps": 129290, "total_steps": 134280, "loss": 0.7982, "lr": 0.00012607215151381966, "epoch": 19.25677688412273, "percentage": 96.28, "elapsed_time": "7:59:26", "remaining_time": "0:18:30", "throughput": 2609.54, "total_tokens": 75067904} +{"current_steps": 129295, "total_steps": 134280, "loss": 0.8093, "lr": 0.00012582003261058682, "epoch": 19.257521596663686, "percentage": 96.29, "elapsed_time": "7:59:27", "remaining_time": "0:18:29", "throughput": 2609.55, "total_tokens": 75070848} +{"current_steps": 129300, "total_steps": 134280, "loss": 0.7808, "lr": 0.00012556816499150746, "epoch": 19.258266309204647, "percentage": 96.29, "elapsed_time": "7:59:28", "remaining_time": "0:18:28", "throughput": 2609.55, "total_tokens": 75073984} +{"current_steps": 129305, "total_steps": 134280, "loss": 0.8046, "lr": 0.00012531654866083485, "epoch": 19.259011021745607, "percentage": 96.3, "elapsed_time": "7:59:29", "remaining_time": "0:18:26", "throughput": 2609.56, "total_tokens": 75076768} +{"current_steps": 129310, "total_steps": 134280, "loss": 0.8015, "lr": 0.00012506518362282227, "epoch": 19.259755734286564, "percentage": 96.3, "elapsed_time": "7:59:31", "remaining_time": "0:18:25", "throughput": 2609.57, "total_tokens": 75079968} +{"current_steps": 129315, "total_steps": 134280, "loss": 0.7875, "lr": 0.00012481406988171462, "epoch": 19.260500446827525, "percentage": 96.3, "elapsed_time": "7:59:32", "remaining_time": "0:18:24", "throughput": 2609.57, "total_tokens": 75082592} +{"current_steps": 129320, "total_steps": 134280, "loss": 0.8142, "lr": 0.00012456320744175687, "epoch": 19.261245159368485, "percentage": 96.31, "elapsed_time": "7:59:33", "remaining_time": "0:18:23", "throughput": 2609.57, "total_tokens": 75085696} +{"current_steps": 129325, "total_steps": 134280, "loss": 0.7838, "lr": 0.00012431259630718227, "epoch": 19.261989871909442, "percentage": 96.31, "elapsed_time": "7:59:34", "remaining_time": "0:18:22", "throughput": 2609.59, "total_tokens": 75089184} +{"current_steps": 129330, "total_steps": 134280, "loss": 0.8058, "lr": 0.00012406223648222912, "epoch": 19.262734584450403, "percentage": 96.31, "elapsed_time": "7:59:35", "remaining_time": "0:18:21", "throughput": 2609.59, "total_tokens": 75091872} +{"current_steps": 129335, "total_steps": 134280, "loss": 0.8059, "lr": 0.00012381212797112572, "epoch": 19.26347929699136, "percentage": 96.32, "elapsed_time": "7:59:36", "remaining_time": "0:18:20", "throughput": 2609.6, "total_tokens": 75094944} +{"current_steps": 129340, "total_steps": 134280, "loss": 0.7953, "lr": 0.00012356227077809533, "epoch": 19.26422400953232, "percentage": 96.32, "elapsed_time": "7:59:37", "remaining_time": "0:18:19", "throughput": 2609.6, "total_tokens": 75097568} +{"current_steps": 129345, "total_steps": 134280, "loss": 0.7809, "lr": 0.00012331266490736125, "epoch": 19.26496872207328, "percentage": 96.32, "elapsed_time": "7:59:38", "remaining_time": "0:18:18", "throughput": 2609.6, "total_tokens": 75100160} +{"current_steps": 129350, "total_steps": 134280, "loss": 0.7956, "lr": 0.0001230633103631401, "epoch": 19.265713434614238, "percentage": 96.33, "elapsed_time": "7:59:39", "remaining_time": "0:18:16", "throughput": 2609.61, "total_tokens": 75103232} +{"current_steps": 129355, "total_steps": 134280, "loss": 0.7971, "lr": 0.00012281420714964353, "epoch": 19.2664581471552, "percentage": 96.33, "elapsed_time": "7:59:40", "remaining_time": "0:18:15", "throughput": 2609.62, "total_tokens": 75106656} +{"current_steps": 129360, "total_steps": 134280, "loss": 0.8313, "lr": 0.00012256535527108148, "epoch": 19.26720285969616, "percentage": 96.34, "elapsed_time": "7:59:41", "remaining_time": "0:18:14", "throughput": 2609.62, "total_tokens": 75109504} +{"current_steps": 129365, "total_steps": 134280, "loss": 0.7762, "lr": 0.0001223167547316556, "epoch": 19.267947572237116, "percentage": 96.34, "elapsed_time": "7:59:42", "remaining_time": "0:18:13", "throughput": 2609.63, "total_tokens": 75112384} +{"current_steps": 129370, "total_steps": 134280, "loss": 0.8116, "lr": 0.00012206840553556753, "epoch": 19.268692284778076, "percentage": 96.34, "elapsed_time": "7:59:43", "remaining_time": "0:18:12", "throughput": 2609.64, "total_tokens": 75115648} +{"current_steps": 129375, "total_steps": 134280, "loss": 0.7923, "lr": 0.00012182030768701223, "epoch": 19.269436997319033, "percentage": 96.35, "elapsed_time": "7:59:44", "remaining_time": "0:18:11", "throughput": 2609.64, "total_tokens": 75118496} +{"current_steps": 129380, "total_steps": 134280, "loss": 0.799, "lr": 0.00012157246119018139, "epoch": 19.270181709859994, "percentage": 96.35, "elapsed_time": "7:59:45", "remaining_time": "0:18:10", "throughput": 2609.64, "total_tokens": 75121088} +{"current_steps": 129385, "total_steps": 134280, "loss": 0.7971, "lr": 0.00012132486604926329, "epoch": 19.270926422400954, "percentage": 96.35, "elapsed_time": "7:59:47", "remaining_time": "0:18:09", "throughput": 2609.64, "total_tokens": 75123776} +{"current_steps": 129390, "total_steps": 134280, "loss": 0.7996, "lr": 0.00012107752226843792, "epoch": 19.27167113494191, "percentage": 96.36, "elapsed_time": "7:59:48", "remaining_time": "0:18:07", "throughput": 2609.65, "total_tokens": 75126912} +{"current_steps": 129395, "total_steps": 134280, "loss": 0.8045, "lr": 0.00012083042985188696, "epoch": 19.272415847482872, "percentage": 96.36, "elapsed_time": "7:59:49", "remaining_time": "0:18:06", "throughput": 2609.65, "total_tokens": 75129696} +{"current_steps": 129400, "total_steps": 134280, "loss": 0.8028, "lr": 0.00012058358880378205, "epoch": 19.273160560023832, "percentage": 96.37, "elapsed_time": "7:59:50", "remaining_time": "0:18:05", "throughput": 2609.66, "total_tokens": 75132512} +{"current_steps": 129405, "total_steps": 134280, "loss": 0.7883, "lr": 0.00012033699912829653, "epoch": 19.27390527256479, "percentage": 96.37, "elapsed_time": "7:59:51", "remaining_time": "0:18:04", "throughput": 2609.66, "total_tokens": 75135360} +{"current_steps": 129410, "total_steps": 134280, "loss": 0.8094, "lr": 0.00012009066082959373, "epoch": 19.27464998510575, "percentage": 96.37, "elapsed_time": "7:59:52", "remaining_time": "0:18:03", "throughput": 2609.67, "total_tokens": 75138240} +{"current_steps": 129415, "total_steps": 134280, "loss": 0.7738, "lr": 0.00011984457391183367, "epoch": 19.275394697646707, "percentage": 96.38, "elapsed_time": "7:59:53", "remaining_time": "0:18:02", "throughput": 2609.67, "total_tokens": 75141152} +{"current_steps": 129420, "total_steps": 134280, "loss": 0.7824, "lr": 0.000119598738379178, "epoch": 19.276139410187668, "percentage": 96.38, "elapsed_time": "7:59:54", "remaining_time": "0:18:01", "throughput": 2609.67, "total_tokens": 75143840} +{"current_steps": 129425, "total_steps": 134280, "loss": 0.7731, "lr": 0.00011935315423577841, "epoch": 19.276884122728628, "percentage": 96.38, "elapsed_time": "7:59:55", "remaining_time": "0:18:00", "throughput": 2609.67, "total_tokens": 75146592} +{"current_steps": 129430, "total_steps": 134280, "loss": 0.7863, "lr": 0.00011910782148578158, "epoch": 19.277628835269585, "percentage": 96.39, "elapsed_time": "7:59:56", "remaining_time": "0:17:59", "throughput": 2609.67, "total_tokens": 75149216} +{"current_steps": 129435, "total_steps": 134280, "loss": 0.786, "lr": 0.00011886274013333586, "epoch": 19.278373547810546, "percentage": 96.39, "elapsed_time": "7:59:57", "remaining_time": "0:17:57", "throughput": 2609.67, "total_tokens": 75151744} +{"current_steps": 129440, "total_steps": 134280, "loss": 0.7894, "lr": 0.00011861791018257794, "epoch": 19.279118260351503, "percentage": 96.4, "elapsed_time": "7:59:58", "remaining_time": "0:17:56", "throughput": 2609.68, "total_tokens": 75154688} +{"current_steps": 129445, "total_steps": 134280, "loss": 0.7889, "lr": 0.00011837333163764618, "epoch": 19.279862972892463, "percentage": 96.4, "elapsed_time": "7:59:59", "remaining_time": "0:17:55", "throughput": 2609.68, "total_tokens": 75157408} +{"current_steps": 129450, "total_steps": 134280, "loss": 0.7952, "lr": 0.00011812900450267228, "epoch": 19.280607685433424, "percentage": 96.4, "elapsed_time": "8:00:00", "remaining_time": "0:17:54", "throughput": 2609.68, "total_tokens": 75160352} +{"current_steps": 129455, "total_steps": 134280, "loss": 0.79, "lr": 0.00011788492878178291, "epoch": 19.28135239797438, "percentage": 96.41, "elapsed_time": "8:00:01", "remaining_time": "0:17:53", "throughput": 2609.69, "total_tokens": 75163328} +{"current_steps": 129460, "total_steps": 134280, "loss": 0.7929, "lr": 0.00011764110447910314, "epoch": 19.28209711051534, "percentage": 96.41, "elapsed_time": "8:00:02", "remaining_time": "0:17:52", "throughput": 2609.69, "total_tokens": 75166176} +{"current_steps": 129465, "total_steps": 134280, "loss": 0.792, "lr": 0.00011739753159874965, "epoch": 19.2828418230563, "percentage": 96.41, "elapsed_time": "8:00:03", "remaining_time": "0:17:51", "throughput": 2609.69, "total_tokens": 75168896} +{"current_steps": 129470, "total_steps": 134280, "loss": 0.7908, "lr": 0.00011715421014484084, "epoch": 19.28358653559726, "percentage": 96.42, "elapsed_time": "8:00:04", "remaining_time": "0:17:50", "throughput": 2609.71, "total_tokens": 75172160} +{"current_steps": 129475, "total_steps": 134280, "loss": 0.8161, "lr": 0.00011691114012148506, "epoch": 19.28433124813822, "percentage": 96.42, "elapsed_time": "8:00:05", "remaining_time": "0:17:49", "throughput": 2609.71, "total_tokens": 75175072} +{"current_steps": 129480, "total_steps": 134280, "loss": 0.8095, "lr": 0.00011666832153278906, "epoch": 19.285075960679176, "percentage": 96.43, "elapsed_time": "8:00:06", "remaining_time": "0:17:47", "throughput": 2609.72, "total_tokens": 75178144} +{"current_steps": 129485, "total_steps": 134280, "loss": 0.7796, "lr": 0.00011642575438285451, "epoch": 19.285820673220137, "percentage": 96.43, "elapsed_time": "8:00:08", "remaining_time": "0:17:46", "throughput": 2609.72, "total_tokens": 75180800} +{"current_steps": 129490, "total_steps": 134280, "loss": 0.7947, "lr": 0.00011618343867577818, "epoch": 19.286565385761097, "percentage": 96.43, "elapsed_time": "8:00:09", "remaining_time": "0:17:45", "throughput": 2609.72, "total_tokens": 75183360} +{"current_steps": 129495, "total_steps": 134280, "loss": 0.8096, "lr": 0.00011594137441565844, "epoch": 19.287310098302054, "percentage": 96.44, "elapsed_time": "8:00:10", "remaining_time": "0:17:44", "throughput": 2609.72, "total_tokens": 75186240} +{"current_steps": 129500, "total_steps": 134280, "loss": 0.7949, "lr": 0.00011569956160657868, "epoch": 19.288054810843015, "percentage": 96.44, "elapsed_time": "8:00:11", "remaining_time": "0:17:43", "throughput": 2609.72, "total_tokens": 75189088} +{"current_steps": 129505, "total_steps": 134280, "loss": 0.8041, "lr": 0.00011545800025262898, "epoch": 19.288799523383975, "percentage": 96.44, "elapsed_time": "8:00:12", "remaining_time": "0:17:42", "throughput": 2609.73, "total_tokens": 75192064} +{"current_steps": 129510, "total_steps": 134280, "loss": 0.8078, "lr": 0.00011521669035788772, "epoch": 19.289544235924932, "percentage": 96.45, "elapsed_time": "8:00:13", "remaining_time": "0:17:41", "throughput": 2609.74, "total_tokens": 75195136} +{"current_steps": 129515, "total_steps": 134280, "loss": 0.8017, "lr": 0.00011497563192643334, "epoch": 19.290288948465893, "percentage": 96.45, "elapsed_time": "8:00:14", "remaining_time": "0:17:40", "throughput": 2609.74, "total_tokens": 75198080} +{"current_steps": 129520, "total_steps": 134280, "loss": 0.801, "lr": 0.00011473482496233589, "epoch": 19.29103366100685, "percentage": 96.46, "elapsed_time": "8:00:15", "remaining_time": "0:17:38", "throughput": 2609.75, "total_tokens": 75201184} +{"current_steps": 129525, "total_steps": 134280, "loss": 0.8088, "lr": 0.00011449426946966545, "epoch": 19.29177837354781, "percentage": 96.46, "elapsed_time": "8:00:16", "remaining_time": "0:17:37", "throughput": 2609.76, "total_tokens": 75204064} +{"current_steps": 129530, "total_steps": 134280, "loss": 0.7945, "lr": 0.00011425396545248545, "epoch": 19.29252308608877, "percentage": 96.46, "elapsed_time": "8:00:17", "remaining_time": "0:17:36", "throughput": 2609.77, "total_tokens": 75207328} +{"current_steps": 129535, "total_steps": 134280, "loss": 0.8012, "lr": 0.00011401391291485596, "epoch": 19.293267798629728, "percentage": 96.47, "elapsed_time": "8:00:18", "remaining_time": "0:17:35", "throughput": 2609.78, "total_tokens": 75210400} +{"current_steps": 129540, "total_steps": 134280, "loss": 0.8014, "lr": 0.00011377411186083208, "epoch": 19.29401251117069, "percentage": 96.47, "elapsed_time": "8:00:19", "remaining_time": "0:17:34", "throughput": 2609.78, "total_tokens": 75213248} +{"current_steps": 129545, "total_steps": 134280, "loss": 0.7998, "lr": 0.0001135345622944639, "epoch": 19.29475722371165, "percentage": 96.47, "elapsed_time": "8:00:20", "remaining_time": "0:17:33", "throughput": 2609.78, "total_tokens": 75215936} +{"current_steps": 129550, "total_steps": 134280, "loss": 0.7949, "lr": 0.00011329526421979985, "epoch": 19.295501936252606, "percentage": 96.48, "elapsed_time": "8:00:21", "remaining_time": "0:17:32", "throughput": 2609.78, "total_tokens": 75218464} +{"current_steps": 129555, "total_steps": 134280, "loss": 0.7924, "lr": 0.00011305621764088169, "epoch": 19.296246648793566, "percentage": 96.48, "elapsed_time": "8:00:22", "remaining_time": "0:17:31", "throughput": 2609.77, "total_tokens": 75221024} +{"current_steps": 129560, "total_steps": 134280, "loss": 0.7895, "lr": 0.00011281742256174954, "epoch": 19.296991361334523, "percentage": 96.48, "elapsed_time": "8:00:23", "remaining_time": "0:17:30", "throughput": 2609.78, "total_tokens": 75223808} +{"current_steps": 129565, "total_steps": 134280, "loss": 0.782, "lr": 0.00011257887898643514, "epoch": 19.297736073875484, "percentage": 96.49, "elapsed_time": "8:00:24", "remaining_time": "0:17:28", "throughput": 2609.78, "total_tokens": 75226784} +{"current_steps": 129570, "total_steps": 134280, "loss": 0.798, "lr": 0.00011234058691896864, "epoch": 19.298480786416444, "percentage": 96.49, "elapsed_time": "8:00:25", "remaining_time": "0:17:27", "throughput": 2609.79, "total_tokens": 75229632} +{"current_steps": 129575, "total_steps": 134280, "loss": 0.8014, "lr": 0.00011210254636337845, "epoch": 19.2992254989574, "percentage": 96.5, "elapsed_time": "8:00:27", "remaining_time": "0:17:26", "throughput": 2609.8, "total_tokens": 75232608} +{"current_steps": 129580, "total_steps": 134280, "loss": 0.8041, "lr": 0.00011186475732368472, "epoch": 19.299970211498362, "percentage": 96.5, "elapsed_time": "8:00:28", "remaining_time": "0:17:25", "throughput": 2609.79, "total_tokens": 75235264} +{"current_steps": 129585, "total_steps": 134280, "loss": 0.815, "lr": 0.00011162721980390421, "epoch": 19.300714924039323, "percentage": 96.5, "elapsed_time": "8:00:29", "remaining_time": "0:17:24", "throughput": 2609.8, "total_tokens": 75238080} +{"current_steps": 129590, "total_steps": 134280, "loss": 0.8007, "lr": 0.00011138993380804874, "epoch": 19.30145963658028, "percentage": 96.51, "elapsed_time": "8:00:30", "remaining_time": "0:17:23", "throughput": 2609.8, "total_tokens": 75240832} +{"current_steps": 129595, "total_steps": 134280, "loss": 0.7985, "lr": 0.00011115289934012839, "epoch": 19.30220434912124, "percentage": 96.51, "elapsed_time": "8:00:31", "remaining_time": "0:17:22", "throughput": 2609.8, "total_tokens": 75243744} +{"current_steps": 129600, "total_steps": 134280, "loss": 0.7933, "lr": 0.00011091611640414833, "epoch": 19.302949061662197, "percentage": 96.51, "elapsed_time": "8:00:32", "remaining_time": "0:17:21", "throughput": 2609.81, "total_tokens": 75246688} +{"current_steps": 129605, "total_steps": 134280, "loss": 0.8066, "lr": 0.00011067958500410701, "epoch": 19.303693774203158, "percentage": 96.52, "elapsed_time": "8:00:33", "remaining_time": "0:17:20", "throughput": 2609.82, "total_tokens": 75249856} +{"current_steps": 129610, "total_steps": 134280, "loss": 0.8037, "lr": 0.0001104433051440029, "epoch": 19.304438486744118, "percentage": 96.52, "elapsed_time": "8:00:34", "remaining_time": "0:17:18", "throughput": 2609.82, "total_tokens": 75252640} +{"current_steps": 129615, "total_steps": 134280, "loss": 0.8167, "lr": 0.0001102072768278245, "epoch": 19.305183199285075, "percentage": 96.53, "elapsed_time": "8:00:35", "remaining_time": "0:17:17", "throughput": 2609.83, "total_tokens": 75255648} +{"current_steps": 129620, "total_steps": 134280, "loss": 0.7907, "lr": 0.00010997150005956191, "epoch": 19.305927911826036, "percentage": 96.53, "elapsed_time": "8:00:36", "remaining_time": "0:17:16", "throughput": 2609.84, "total_tokens": 75258592} +{"current_steps": 129625, "total_steps": 134280, "loss": 0.8336, "lr": 0.0001097359748431953, "epoch": 19.306672624366993, "percentage": 96.53, "elapsed_time": "8:00:37", "remaining_time": "0:17:15", "throughput": 2609.84, "total_tokens": 75261472} +{"current_steps": 129630, "total_steps": 134280, "loss": 0.8076, "lr": 0.00010950070118270816, "epoch": 19.307417336907953, "percentage": 96.54, "elapsed_time": "8:00:38", "remaining_time": "0:17:14", "throughput": 2609.85, "total_tokens": 75264288} +{"current_steps": 129635, "total_steps": 134280, "loss": 0.7928, "lr": 0.00010926567908207062, "epoch": 19.308162049448914, "percentage": 96.54, "elapsed_time": "8:00:39", "remaining_time": "0:17:13", "throughput": 2609.85, "total_tokens": 75267328} +{"current_steps": 129640, "total_steps": 134280, "loss": 0.801, "lr": 0.0001090309085452562, "epoch": 19.30890676198987, "percentage": 96.54, "elapsed_time": "8:00:40", "remaining_time": "0:17:12", "throughput": 2609.86, "total_tokens": 75270272} +{"current_steps": 129645, "total_steps": 134280, "loss": 0.7891, "lr": 0.00010879638957623005, "epoch": 19.30965147453083, "percentage": 96.55, "elapsed_time": "8:00:41", "remaining_time": "0:17:11", "throughput": 2609.86, "total_tokens": 75273120} +{"current_steps": 129650, "total_steps": 134280, "loss": 0.7973, "lr": 0.000108562122178954, "epoch": 19.31039618707179, "percentage": 96.55, "elapsed_time": "8:00:42", "remaining_time": "0:17:10", "throughput": 2609.88, "total_tokens": 75276352} +{"current_steps": 129655, "total_steps": 134280, "loss": 0.786, "lr": 0.00010832810635738654, "epoch": 19.31114089961275, "percentage": 96.56, "elapsed_time": "8:00:43", "remaining_time": "0:17:08", "throughput": 2609.88, "total_tokens": 75279232} +{"current_steps": 129660, "total_steps": 134280, "loss": 0.7878, "lr": 0.00010809434211547953, "epoch": 19.31188561215371, "percentage": 96.56, "elapsed_time": "8:00:44", "remaining_time": "0:17:07", "throughput": 2609.88, "total_tokens": 75281984} +{"current_steps": 129665, "total_steps": 134280, "loss": 0.8081, "lr": 0.00010786082945718311, "epoch": 19.312630324694666, "percentage": 96.56, "elapsed_time": "8:00:46", "remaining_time": "0:17:06", "throughput": 2609.89, "total_tokens": 75284832} +{"current_steps": 129670, "total_steps": 134280, "loss": 0.785, "lr": 0.00010762756838644249, "epoch": 19.313375037235627, "percentage": 96.57, "elapsed_time": "8:00:47", "remaining_time": "0:17:05", "throughput": 2609.89, "total_tokens": 75287680} +{"current_steps": 129675, "total_steps": 134280, "loss": 0.8012, "lr": 0.00010739455890719785, "epoch": 19.314119749776587, "percentage": 96.57, "elapsed_time": "8:00:48", "remaining_time": "0:17:04", "throughput": 2609.89, "total_tokens": 75290400} +{"current_steps": 129680, "total_steps": 134280, "loss": 0.796, "lr": 0.00010716180102338767, "epoch": 19.314864462317544, "percentage": 96.57, "elapsed_time": "8:00:49", "remaining_time": "0:17:03", "throughput": 2609.9, "total_tokens": 75293472} +{"current_steps": 129685, "total_steps": 134280, "loss": 0.7985, "lr": 0.00010692929473894052, "epoch": 19.315609174858505, "percentage": 96.58, "elapsed_time": "8:00:50", "remaining_time": "0:17:02", "throughput": 2609.9, "total_tokens": 75296352} +{"current_steps": 129690, "total_steps": 134280, "loss": 0.8024, "lr": 0.00010669704005778823, "epoch": 19.316353887399465, "percentage": 96.58, "elapsed_time": "8:00:51", "remaining_time": "0:17:01", "throughput": 2609.91, "total_tokens": 75299456} +{"current_steps": 129695, "total_steps": 134280, "loss": 0.7936, "lr": 0.000106465036983851, "epoch": 19.317098599940422, "percentage": 96.59, "elapsed_time": "8:00:52", "remaining_time": "0:16:59", "throughput": 2609.92, "total_tokens": 75302272} +{"current_steps": 129700, "total_steps": 134280, "loss": 0.7961, "lr": 0.00010623328552105072, "epoch": 19.317843312481383, "percentage": 96.59, "elapsed_time": "8:00:53", "remaining_time": "0:16:58", "throughput": 2609.92, "total_tokens": 75305184} +{"current_steps": 129705, "total_steps": 134280, "loss": 0.7932, "lr": 0.00010600178567329921, "epoch": 19.31858802502234, "percentage": 96.59, "elapsed_time": "8:00:54", "remaining_time": "0:16:57", "throughput": 2609.92, "total_tokens": 75307936} +{"current_steps": 129710, "total_steps": 134280, "loss": 0.8193, "lr": 0.00010577053744451337, "epoch": 19.3193327375633, "percentage": 96.6, "elapsed_time": "8:00:55", "remaining_time": "0:16:56", "throughput": 2609.93, "total_tokens": 75310848} +{"current_steps": 129715, "total_steps": 134280, "loss": 0.802, "lr": 0.0001055395408385934, "epoch": 19.32007745010426, "percentage": 96.6, "elapsed_time": "8:00:56", "remaining_time": "0:16:55", "throughput": 2609.93, "total_tokens": 75313664} +{"current_steps": 129720, "total_steps": 134280, "loss": 0.7769, "lr": 0.00010530879585944786, "epoch": 19.320822162645218, "percentage": 96.6, "elapsed_time": "8:00:57", "remaining_time": "0:16:54", "throughput": 2609.94, "total_tokens": 75316640} +{"current_steps": 129725, "total_steps": 134280, "loss": 0.8007, "lr": 0.00010507830251097028, "epoch": 19.32156687518618, "percentage": 96.61, "elapsed_time": "8:00:58", "remaining_time": "0:16:53", "throughput": 2609.94, "total_tokens": 75319680} +{"current_steps": 129730, "total_steps": 134280, "loss": 0.8097, "lr": 0.00010484806079705588, "epoch": 19.32231158772714, "percentage": 96.61, "elapsed_time": "8:00:59", "remaining_time": "0:16:52", "throughput": 2609.96, "total_tokens": 75322912} +{"current_steps": 129735, "total_steps": 134280, "loss": 0.8025, "lr": 0.00010461807072159657, "epoch": 19.323056300268096, "percentage": 96.62, "elapsed_time": "8:01:00", "remaining_time": "0:16:51", "throughput": 2609.97, "total_tokens": 75326272} +{"current_steps": 129740, "total_steps": 134280, "loss": 0.8062, "lr": 0.00010438833228847422, "epoch": 19.323801012809056, "percentage": 96.62, "elapsed_time": "8:01:02", "remaining_time": "0:16:49", "throughput": 2609.98, "total_tokens": 75329248} +{"current_steps": 129745, "total_steps": 134280, "loss": 0.8146, "lr": 0.00010415884550157239, "epoch": 19.324545725350013, "percentage": 96.62, "elapsed_time": "8:01:03", "remaining_time": "0:16:48", "throughput": 2609.98, "total_tokens": 75332128} +{"current_steps": 129750, "total_steps": 134280, "loss": 0.7818, "lr": 0.00010392961036476799, "epoch": 19.325290437890974, "percentage": 96.63, "elapsed_time": "8:01:04", "remaining_time": "0:16:47", "throughput": 2609.98, "total_tokens": 75334784} +{"current_steps": 129755, "total_steps": 134280, "loss": 0.8022, "lr": 0.00010370062688193293, "epoch": 19.326035150431935, "percentage": 96.63, "elapsed_time": "8:01:05", "remaining_time": "0:16:46", "throughput": 2609.99, "total_tokens": 75337888} +{"current_steps": 129760, "total_steps": 134280, "loss": 0.7956, "lr": 0.0001034718950569341, "epoch": 19.32677986297289, "percentage": 96.63, "elapsed_time": "8:01:06", "remaining_time": "0:16:45", "throughput": 2609.99, "total_tokens": 75340672} +{"current_steps": 129765, "total_steps": 134280, "loss": 0.8147, "lr": 0.00010324341489364007, "epoch": 19.327524575513852, "percentage": 96.64, "elapsed_time": "8:01:07", "remaining_time": "0:16:44", "throughput": 2609.99, "total_tokens": 75343520} +{"current_steps": 129770, "total_steps": 134280, "loss": 0.8186, "lr": 0.00010301518639590612, "epoch": 19.328269288054813, "percentage": 96.64, "elapsed_time": "8:01:08", "remaining_time": "0:16:43", "throughput": 2610.0, "total_tokens": 75346304} +{"current_steps": 129775, "total_steps": 134280, "loss": 0.8002, "lr": 0.0001027872095675908, "epoch": 19.32901400059577, "percentage": 96.65, "elapsed_time": "8:01:09", "remaining_time": "0:16:42", "throughput": 2610.0, "total_tokens": 75349024} +{"current_steps": 129780, "total_steps": 134280, "loss": 0.7937, "lr": 0.00010255948441254436, "epoch": 19.32975871313673, "percentage": 96.65, "elapsed_time": "8:01:10", "remaining_time": "0:16:41", "throughput": 2610.01, "total_tokens": 75352064} +{"current_steps": 129785, "total_steps": 134280, "loss": 0.7948, "lr": 0.0001023320109346154, "epoch": 19.330503425677687, "percentage": 96.65, "elapsed_time": "8:01:11", "remaining_time": "0:16:39", "throughput": 2610.01, "total_tokens": 75354880} +{"current_steps": 129790, "total_steps": 134280, "loss": 0.8143, "lr": 0.0001021047891376442, "epoch": 19.331248138218648, "percentage": 96.66, "elapsed_time": "8:01:12", "remaining_time": "0:16:38", "throughput": 2610.01, "total_tokens": 75357600} +{"current_steps": 129795, "total_steps": 134280, "loss": 0.8049, "lr": 0.00010187781902547266, "epoch": 19.331992850759608, "percentage": 96.66, "elapsed_time": "8:01:13", "remaining_time": "0:16:37", "throughput": 2610.01, "total_tokens": 75360384} +{"current_steps": 129800, "total_steps": 134280, "loss": 0.7978, "lr": 0.00010165110060193272, "epoch": 19.332737563300565, "percentage": 96.66, "elapsed_time": "8:01:14", "remaining_time": "0:16:36", "throughput": 2610.02, "total_tokens": 75363296} +{"current_steps": 129805, "total_steps": 134280, "loss": 0.7877, "lr": 0.00010142463387085465, "epoch": 19.333482275841526, "percentage": 96.67, "elapsed_time": "8:01:15", "remaining_time": "0:16:35", "throughput": 2610.02, "total_tokens": 75366080} +{"current_steps": 129810, "total_steps": 134280, "loss": 0.7727, "lr": 0.00010119841883606705, "epoch": 19.334226988382483, "percentage": 96.67, "elapsed_time": "8:01:16", "remaining_time": "0:16:34", "throughput": 2610.03, "total_tokens": 75369216} +{"current_steps": 129815, "total_steps": 134280, "loss": 0.7878, "lr": 0.00010097245550138856, "epoch": 19.334971700923443, "percentage": 96.67, "elapsed_time": "8:01:17", "remaining_time": "0:16:33", "throughput": 2610.03, "total_tokens": 75371968} +{"current_steps": 129820, "total_steps": 134280, "loss": 0.7886, "lr": 0.00010074674387063775, "epoch": 19.335716413464404, "percentage": 96.68, "elapsed_time": "8:01:18", "remaining_time": "0:16:32", "throughput": 2610.03, "total_tokens": 75374784} +{"current_steps": 129825, "total_steps": 134280, "loss": 0.795, "lr": 0.00010052128394762826, "epoch": 19.33646112600536, "percentage": 96.68, "elapsed_time": "8:01:19", "remaining_time": "0:16:31", "throughput": 2610.04, "total_tokens": 75377888} +{"current_steps": 129830, "total_steps": 134280, "loss": 0.8055, "lr": 0.00010029607573616706, "epoch": 19.33720583854632, "percentage": 96.69, "elapsed_time": "8:01:20", "remaining_time": "0:16:29", "throughput": 2610.05, "total_tokens": 75380672} +{"current_steps": 129835, "total_steps": 134280, "loss": 0.7971, "lr": 0.00010007111924006273, "epoch": 19.337950551087282, "percentage": 96.69, "elapsed_time": "8:01:22", "remaining_time": "0:16:28", "throughput": 2610.05, "total_tokens": 75383552} +{"current_steps": 129840, "total_steps": 134280, "loss": 0.8049, "lr": 9.98464144631106e-05, "epoch": 19.33869526362824, "percentage": 96.69, "elapsed_time": "8:01:23", "remaining_time": "0:16:27", "throughput": 2610.06, "total_tokens": 75386688} +{"current_steps": 129845, "total_steps": 134280, "loss": 0.8039, "lr": 9.962196140911095e-05, "epoch": 19.3394399761692, "percentage": 96.7, "elapsed_time": "8:01:24", "remaining_time": "0:16:26", "throughput": 2610.06, "total_tokens": 75389248} +{"current_steps": 129850, "total_steps": 134280, "loss": 0.7969, "lr": 9.939776008185408e-05, "epoch": 19.340184688710156, "percentage": 96.7, "elapsed_time": "8:01:25", "remaining_time": "0:16:25", "throughput": 2610.06, "total_tokens": 75392192} +{"current_steps": 129855, "total_steps": 134280, "loss": 0.805, "lr": 9.917381048512863e-05, "epoch": 19.340929401251117, "percentage": 96.7, "elapsed_time": "8:01:26", "remaining_time": "0:16:24", "throughput": 2610.07, "total_tokens": 75395072} +{"current_steps": 129860, "total_steps": 134280, "loss": 0.8144, "lr": 9.895011262271491e-05, "epoch": 19.341674113792077, "percentage": 96.71, "elapsed_time": "8:01:27", "remaining_time": "0:16:23", "throughput": 2610.08, "total_tokens": 75398112} +{"current_steps": 129865, "total_steps": 134280, "loss": 0.8187, "lr": 9.872666649839656e-05, "epoch": 19.342418826333034, "percentage": 96.71, "elapsed_time": "8:01:28", "remaining_time": "0:16:22", "throughput": 2610.08, "total_tokens": 75400960} +{"current_steps": 129870, "total_steps": 134280, "loss": 0.7836, "lr": 9.85034721159439e-05, "epoch": 19.343163538873995, "percentage": 96.72, "elapsed_time": "8:01:29", "remaining_time": "0:16:21", "throughput": 2610.09, "total_tokens": 75404032} +{"current_steps": 129875, "total_steps": 134280, "loss": 0.7963, "lr": 9.828052947913224e-05, "epoch": 19.343908251414955, "percentage": 96.72, "elapsed_time": "8:01:30", "remaining_time": "0:16:19", "throughput": 2610.09, "total_tokens": 75406816} +{"current_steps": 129880, "total_steps": 134280, "loss": 0.7992, "lr": 9.805783859172524e-05, "epoch": 19.344652963955912, "percentage": 96.72, "elapsed_time": "8:01:31", "remaining_time": "0:16:18", "throughput": 2610.1, "total_tokens": 75409952} +{"current_steps": 129885, "total_steps": 134280, "loss": 0.8014, "lr": 9.783539945748487e-05, "epoch": 19.345397676496873, "percentage": 96.73, "elapsed_time": "8:01:32", "remaining_time": "0:16:17", "throughput": 2610.1, "total_tokens": 75412640} +{"current_steps": 129890, "total_steps": 134280, "loss": 0.7809, "lr": 9.761321208016815e-05, "epoch": 19.34614238903783, "percentage": 96.73, "elapsed_time": "8:01:33", "remaining_time": "0:16:16", "throughput": 2610.1, "total_tokens": 75415488} +{"current_steps": 129895, "total_steps": 134280, "loss": 0.7995, "lr": 9.739127646353207e-05, "epoch": 19.34688710157879, "percentage": 96.73, "elapsed_time": "8:01:34", "remaining_time": "0:16:15", "throughput": 2610.1, "total_tokens": 75418240} +{"current_steps": 129900, "total_steps": 134280, "loss": 0.7983, "lr": 9.716959261132196e-05, "epoch": 19.34763181411975, "percentage": 96.74, "elapsed_time": "8:01:35", "remaining_time": "0:16:14", "throughput": 2610.11, "total_tokens": 75421440} +{"current_steps": 129905, "total_steps": 134280, "loss": 0.8035, "lr": 9.69481605272865e-05, "epoch": 19.348376526660708, "percentage": 96.74, "elapsed_time": "8:01:36", "remaining_time": "0:16:13", "throughput": 2610.12, "total_tokens": 75424256} +{"current_steps": 129910, "total_steps": 134280, "loss": 0.8055, "lr": 9.672698021516602e-05, "epoch": 19.34912123920167, "percentage": 96.75, "elapsed_time": "8:01:37", "remaining_time": "0:16:12", "throughput": 2610.12, "total_tokens": 75427072} +{"current_steps": 129915, "total_steps": 134280, "loss": 0.7957, "lr": 9.650605167869419e-05, "epoch": 19.34986595174263, "percentage": 96.75, "elapsed_time": "8:01:38", "remaining_time": "0:16:10", "throughput": 2610.12, "total_tokens": 75429568} +{"current_steps": 129920, "total_steps": 134280, "loss": 0.8016, "lr": 9.628537492160638e-05, "epoch": 19.350610664283586, "percentage": 96.75, "elapsed_time": "8:01:39", "remaining_time": "0:16:09", "throughput": 2610.12, "total_tokens": 75432416} +{"current_steps": 129925, "total_steps": 134280, "loss": 0.7964, "lr": 9.60649499476296e-05, "epoch": 19.351355376824547, "percentage": 96.76, "elapsed_time": "8:01:41", "remaining_time": "0:16:08", "throughput": 2610.13, "total_tokens": 75435424} +{"current_steps": 129930, "total_steps": 134280, "loss": 0.7927, "lr": 9.584477676048753e-05, "epoch": 19.352100089365504, "percentage": 96.76, "elapsed_time": "8:01:42", "remaining_time": "0:16:07", "throughput": 2610.13, "total_tokens": 75438336} +{"current_steps": 129935, "total_steps": 134280, "loss": 0.8039, "lr": 9.562485536390052e-05, "epoch": 19.352844801906464, "percentage": 96.76, "elapsed_time": "8:01:43", "remaining_time": "0:16:06", "throughput": 2610.13, "total_tokens": 75441024} +{"current_steps": 129940, "total_steps": 134280, "loss": 0.7834, "lr": 9.540518576158396e-05, "epoch": 19.353589514447425, "percentage": 96.77, "elapsed_time": "8:01:44", "remaining_time": "0:16:05", "throughput": 2610.14, "total_tokens": 75444000} +{"current_steps": 129945, "total_steps": 134280, "loss": 0.8099, "lr": 9.51857679572482e-05, "epoch": 19.35433422698838, "percentage": 96.77, "elapsed_time": "8:01:45", "remaining_time": "0:16:04", "throughput": 2610.15, "total_tokens": 75446944} +{"current_steps": 129950, "total_steps": 134280, "loss": 0.8014, "lr": 9.496660195460027e-05, "epoch": 19.355078939529342, "percentage": 96.78, "elapsed_time": "8:01:46", "remaining_time": "0:16:03", "throughput": 2610.15, "total_tokens": 75449888} +{"current_steps": 129955, "total_steps": 134280, "loss": 0.8048, "lr": 9.474768775734055e-05, "epoch": 19.3558236520703, "percentage": 96.78, "elapsed_time": "8:01:47", "remaining_time": "0:16:02", "throughput": 2610.16, "total_tokens": 75452768} +{"current_steps": 129960, "total_steps": 134280, "loss": 0.7901, "lr": 9.452902536917273e-05, "epoch": 19.35656836461126, "percentage": 96.78, "elapsed_time": "8:01:48", "remaining_time": "0:16:00", "throughput": 2610.16, "total_tokens": 75455584} +{"current_steps": 129965, "total_steps": 134280, "loss": 0.8077, "lr": 9.431061479378722e-05, "epoch": 19.35731307715222, "percentage": 96.79, "elapsed_time": "8:01:49", "remaining_time": "0:15:59", "throughput": 2610.16, "total_tokens": 75458176} +{"current_steps": 129970, "total_steps": 134280, "loss": 0.7897, "lr": 9.40924560348727e-05, "epoch": 19.358057789693177, "percentage": 96.79, "elapsed_time": "8:01:50", "remaining_time": "0:15:58", "throughput": 2610.16, "total_tokens": 75461056} +{"current_steps": 129975, "total_steps": 134280, "loss": 0.8092, "lr": 9.387454909611792e-05, "epoch": 19.358802502234138, "percentage": 96.79, "elapsed_time": "8:01:51", "remaining_time": "0:15:57", "throughput": 2610.16, "total_tokens": 75463808} +{"current_steps": 129980, "total_steps": 134280, "loss": 0.8025, "lr": 9.365689398120158e-05, "epoch": 19.359547214775098, "percentage": 96.8, "elapsed_time": "8:01:52", "remaining_time": "0:15:56", "throughput": 2610.18, "total_tokens": 75467040} +{"current_steps": 129985, "total_steps": 134280, "loss": 0.7914, "lr": 9.343949069380242e-05, "epoch": 19.360291927316055, "percentage": 96.8, "elapsed_time": "8:01:53", "remaining_time": "0:15:55", "throughput": 2610.18, "total_tokens": 75469824} +{"current_steps": 129990, "total_steps": 134280, "loss": 0.7945, "lr": 9.322233923759248e-05, "epoch": 19.361036639857016, "percentage": 96.81, "elapsed_time": "8:01:54", "remaining_time": "0:15:54", "throughput": 2610.18, "total_tokens": 75472800} +{"current_steps": 129995, "total_steps": 134280, "loss": 0.7896, "lr": 9.300543961624053e-05, "epoch": 19.361781352397973, "percentage": 96.81, "elapsed_time": "8:01:55", "remaining_time": "0:15:53", "throughput": 2610.19, "total_tokens": 75475680} +{"current_steps": 130000, "total_steps": 134280, "loss": 0.8081, "lr": 9.278879183341193e-05, "epoch": 19.362526064938933, "percentage": 96.81, "elapsed_time": "8:01:56", "remaining_time": "0:15:52", "throughput": 2610.19, "total_tokens": 75478368} +{"current_steps": 130005, "total_steps": 134280, "loss": 0.7963, "lr": 9.257239589276545e-05, "epoch": 19.363270777479894, "percentage": 96.82, "elapsed_time": "8:01:57", "remaining_time": "0:15:50", "throughput": 2610.19, "total_tokens": 75481024} +{"current_steps": 130010, "total_steps": 134280, "loss": 0.8168, "lr": 9.235625179795648e-05, "epoch": 19.36401549002085, "percentage": 96.82, "elapsed_time": "8:01:58", "remaining_time": "0:15:49", "throughput": 2610.19, "total_tokens": 75483936} +{"current_steps": 130015, "total_steps": 134280, "loss": 0.7959, "lr": 9.21403595526371e-05, "epoch": 19.36476020256181, "percentage": 96.82, "elapsed_time": "8:01:59", "remaining_time": "0:15:48", "throughput": 2610.2, "total_tokens": 75487008} +{"current_steps": 130020, "total_steps": 134280, "loss": 0.7671, "lr": 9.192471916045608e-05, "epoch": 19.365504915102772, "percentage": 96.83, "elapsed_time": "8:02:01", "remaining_time": "0:15:47", "throughput": 2610.21, "total_tokens": 75489824} +{"current_steps": 130025, "total_steps": 134280, "loss": 0.7967, "lr": 9.170933062505382e-05, "epoch": 19.36624962764373, "percentage": 96.83, "elapsed_time": "8:02:02", "remaining_time": "0:15:46", "throughput": 2610.21, "total_tokens": 75492640} +{"current_steps": 130030, "total_steps": 134280, "loss": 0.7923, "lr": 9.149419395006907e-05, "epoch": 19.36699434018469, "percentage": 96.83, "elapsed_time": "8:02:03", "remaining_time": "0:15:45", "throughput": 2610.21, "total_tokens": 75495520} +{"current_steps": 130035, "total_steps": 134280, "loss": 0.7899, "lr": 9.127930913913895e-05, "epoch": 19.367739052725646, "percentage": 96.84, "elapsed_time": "8:02:04", "remaining_time": "0:15:44", "throughput": 2610.23, "total_tokens": 75498784} +{"current_steps": 130040, "total_steps": 134280, "loss": 0.8038, "lr": 9.10646761958922e-05, "epoch": 19.368483765266607, "percentage": 96.84, "elapsed_time": "8:02:05", "remaining_time": "0:15:43", "throughput": 2610.23, "total_tokens": 75501600} +{"current_steps": 130045, "total_steps": 134280, "loss": 0.7885, "lr": 9.085029512395593e-05, "epoch": 19.369228477807567, "percentage": 96.85, "elapsed_time": "8:02:06", "remaining_time": "0:15:42", "throughput": 2610.24, "total_tokens": 75504736} +{"current_steps": 130050, "total_steps": 134280, "loss": 0.7986, "lr": 9.063616592695056e-05, "epoch": 19.369973190348524, "percentage": 96.85, "elapsed_time": "8:02:07", "remaining_time": "0:15:40", "throughput": 2610.24, "total_tokens": 75507520} +{"current_steps": 130055, "total_steps": 134280, "loss": 0.7954, "lr": 9.042228860849322e-05, "epoch": 19.370717902889485, "percentage": 96.85, "elapsed_time": "8:02:08", "remaining_time": "0:15:39", "throughput": 2610.24, "total_tokens": 75510400} +{"current_steps": 130060, "total_steps": 134280, "loss": 0.8362, "lr": 9.020866317219766e-05, "epoch": 19.371462615430445, "percentage": 96.86, "elapsed_time": "8:02:09", "remaining_time": "0:15:38", "throughput": 2610.25, "total_tokens": 75513408} +{"current_steps": 130065, "total_steps": 134280, "loss": 0.7962, "lr": 8.999528962167435e-05, "epoch": 19.372207327971402, "percentage": 96.86, "elapsed_time": "8:02:10", "remaining_time": "0:15:37", "throughput": 2610.26, "total_tokens": 75516256} +{"current_steps": 130070, "total_steps": 134280, "loss": 0.8181, "lr": 8.97821679605254e-05, "epoch": 19.372952040512363, "percentage": 96.86, "elapsed_time": "8:02:11", "remaining_time": "0:15:36", "throughput": 2610.26, "total_tokens": 75519328} +{"current_steps": 130075, "total_steps": 134280, "loss": 0.8134, "lr": 8.956929819235293e-05, "epoch": 19.37369675305332, "percentage": 96.87, "elapsed_time": "8:02:12", "remaining_time": "0:15:35", "throughput": 2610.28, "total_tokens": 75522528} +{"current_steps": 130080, "total_steps": 134280, "loss": 0.7993, "lr": 8.935668032075405e-05, "epoch": 19.37444146559428, "percentage": 96.87, "elapsed_time": "8:02:13", "remaining_time": "0:15:34", "throughput": 2610.28, "total_tokens": 75525440} +{"current_steps": 130085, "total_steps": 134280, "loss": 0.7964, "lr": 8.914431434931924e-05, "epoch": 19.37518617813524, "percentage": 96.88, "elapsed_time": "8:02:14", "remaining_time": "0:15:33", "throughput": 2610.28, "total_tokens": 75528288} +{"current_steps": 130090, "total_steps": 134280, "loss": 0.8048, "lr": 8.893220028163562e-05, "epoch": 19.375930890676198, "percentage": 96.88, "elapsed_time": "8:02:15", "remaining_time": "0:15:31", "throughput": 2610.29, "total_tokens": 75531168} +{"current_steps": 130095, "total_steps": 134280, "loss": 0.7864, "lr": 8.872033812128698e-05, "epoch": 19.37667560321716, "percentage": 96.88, "elapsed_time": "8:02:16", "remaining_time": "0:15:30", "throughput": 2610.29, "total_tokens": 75533920} +{"current_steps": 130100, "total_steps": 134280, "loss": 0.8123, "lr": 8.850872787185548e-05, "epoch": 19.37742031575812, "percentage": 96.89, "elapsed_time": "8:02:18", "remaining_time": "0:15:29", "throughput": 2610.29, "total_tokens": 75536736} +{"current_steps": 130105, "total_steps": 134280, "loss": 0.8043, "lr": 8.829736953691158e-05, "epoch": 19.378165028299076, "percentage": 96.89, "elapsed_time": "8:02:19", "remaining_time": "0:15:28", "throughput": 2610.3, "total_tokens": 75539488} +{"current_steps": 130110, "total_steps": 134280, "loss": 0.7939, "lr": 8.80862631200291e-05, "epoch": 19.378909740840037, "percentage": 96.89, "elapsed_time": "8:02:20", "remaining_time": "0:15:27", "throughput": 2610.31, "total_tokens": 75542656} +{"current_steps": 130115, "total_steps": 134280, "loss": 0.7747, "lr": 8.787540862477183e-05, "epoch": 19.379654453380994, "percentage": 96.9, "elapsed_time": "8:02:21", "remaining_time": "0:15:26", "throughput": 2610.3, "total_tokens": 75545248} +{"current_steps": 130120, "total_steps": 134280, "loss": 0.8041, "lr": 8.766480605470527e-05, "epoch": 19.380399165921954, "percentage": 96.9, "elapsed_time": "8:02:22", "remaining_time": "0:15:25", "throughput": 2610.3, "total_tokens": 75547872} +{"current_steps": 130125, "total_steps": 134280, "loss": 0.798, "lr": 8.745445541338492e-05, "epoch": 19.381143878462915, "percentage": 96.91, "elapsed_time": "8:02:23", "remaining_time": "0:15:24", "throughput": 2610.31, "total_tokens": 75550976} +{"current_steps": 130130, "total_steps": 134280, "loss": 0.793, "lr": 8.724435670436458e-05, "epoch": 19.38188859100387, "percentage": 96.91, "elapsed_time": "8:02:24", "remaining_time": "0:15:23", "throughput": 2610.32, "total_tokens": 75553920} +{"current_steps": 130135, "total_steps": 134280, "loss": 0.8073, "lr": 8.703450993119644e-05, "epoch": 19.382633303544832, "percentage": 96.91, "elapsed_time": "8:02:25", "remaining_time": "0:15:21", "throughput": 2610.33, "total_tokens": 75557216} +{"current_steps": 130140, "total_steps": 134280, "loss": 0.7957, "lr": 8.682491509742096e-05, "epoch": 19.38337801608579, "percentage": 96.92, "elapsed_time": "8:02:26", "remaining_time": "0:15:20", "throughput": 2610.33, "total_tokens": 75559904} +{"current_steps": 130145, "total_steps": 134280, "loss": 0.7918, "lr": 8.661557220658367e-05, "epoch": 19.38412272862675, "percentage": 96.92, "elapsed_time": "8:02:27", "remaining_time": "0:15:19", "throughput": 2610.34, "total_tokens": 75562816} +{"current_steps": 130150, "total_steps": 134280, "loss": 0.7783, "lr": 8.640648126221672e-05, "epoch": 19.38486744116771, "percentage": 96.92, "elapsed_time": "8:02:28", "remaining_time": "0:15:18", "throughput": 2610.34, "total_tokens": 75565600} +{"current_steps": 130155, "total_steps": 134280, "loss": 0.7878, "lr": 8.619764226785564e-05, "epoch": 19.385612153708667, "percentage": 96.93, "elapsed_time": "8:02:29", "remaining_time": "0:15:17", "throughput": 2610.35, "total_tokens": 75568640} +{"current_steps": 130160, "total_steps": 134280, "loss": 0.8185, "lr": 8.59890552270276e-05, "epoch": 19.386356866249628, "percentage": 96.93, "elapsed_time": "8:02:30", "remaining_time": "0:15:16", "throughput": 2610.36, "total_tokens": 75571712} +{"current_steps": 130165, "total_steps": 134280, "loss": 0.8013, "lr": 8.578072014325644e-05, "epoch": 19.38710157879059, "percentage": 96.94, "elapsed_time": "8:02:31", "remaining_time": "0:15:15", "throughput": 2610.36, "total_tokens": 75574592} +{"current_steps": 130170, "total_steps": 134280, "loss": 0.7943, "lr": 8.557263702006268e-05, "epoch": 19.387846291331545, "percentage": 96.94, "elapsed_time": "8:02:32", "remaining_time": "0:15:14", "throughput": 2610.36, "total_tokens": 75577376} +{"current_steps": 130175, "total_steps": 134280, "loss": 0.801, "lr": 8.536480586096017e-05, "epoch": 19.388591003872506, "percentage": 96.94, "elapsed_time": "8:02:33", "remaining_time": "0:15:13", "throughput": 2610.36, "total_tokens": 75580064} +{"current_steps": 130180, "total_steps": 134280, "loss": 0.7911, "lr": 8.515722666946113e-05, "epoch": 19.389335716413463, "percentage": 96.95, "elapsed_time": "8:02:34", "remaining_time": "0:15:11", "throughput": 2610.36, "total_tokens": 75582720} +{"current_steps": 130185, "total_steps": 134280, "loss": 0.8094, "lr": 8.494989944907105e-05, "epoch": 19.390080428954423, "percentage": 96.95, "elapsed_time": "8:02:35", "remaining_time": "0:15:10", "throughput": 2610.37, "total_tokens": 75585760} +{"current_steps": 130190, "total_steps": 134280, "loss": 0.7964, "lr": 8.474282420329381e-05, "epoch": 19.390825141495384, "percentage": 96.95, "elapsed_time": "8:02:36", "remaining_time": "0:15:09", "throughput": 2610.37, "total_tokens": 75588544} +{"current_steps": 130195, "total_steps": 134280, "loss": 0.8145, "lr": 8.453600093562829e-05, "epoch": 19.39156985403634, "percentage": 96.96, "elapsed_time": "8:02:38", "remaining_time": "0:15:08", "throughput": 2610.38, "total_tokens": 75591360} +{"current_steps": 130200, "total_steps": 134280, "loss": 0.7861, "lr": 8.432942964956668e-05, "epoch": 19.3923145665773, "percentage": 96.96, "elapsed_time": "8:02:39", "remaining_time": "0:15:07", "throughput": 2610.38, "total_tokens": 75594112} +{"current_steps": 130205, "total_steps": 134280, "loss": 0.7966, "lr": 8.412311034859954e-05, "epoch": 19.393059279118262, "percentage": 96.97, "elapsed_time": "8:02:40", "remaining_time": "0:15:06", "throughput": 2610.38, "total_tokens": 75596896} +{"current_steps": 130210, "total_steps": 134280, "loss": 0.8048, "lr": 8.391704303621405e-05, "epoch": 19.39380399165922, "percentage": 96.97, "elapsed_time": "8:02:41", "remaining_time": "0:15:05", "throughput": 2610.38, "total_tokens": 75599648} +{"current_steps": 130215, "total_steps": 134280, "loss": 0.7753, "lr": 8.371122771588913e-05, "epoch": 19.39454870420018, "percentage": 96.97, "elapsed_time": "8:02:42", "remaining_time": "0:15:04", "throughput": 2610.38, "total_tokens": 75602400} +{"current_steps": 130220, "total_steps": 134280, "loss": 0.8062, "lr": 8.350566439110196e-05, "epoch": 19.395293416741136, "percentage": 96.98, "elapsed_time": "8:02:43", "remaining_time": "0:15:03", "throughput": 2610.39, "total_tokens": 75605184} +{"current_steps": 130225, "total_steps": 134280, "loss": 0.7944, "lr": 8.330035306532812e-05, "epoch": 19.396038129282097, "percentage": 96.98, "elapsed_time": "8:02:44", "remaining_time": "0:15:01", "throughput": 2610.39, "total_tokens": 75608224} +{"current_steps": 130230, "total_steps": 134280, "loss": 0.7892, "lr": 8.309529374203317e-05, "epoch": 19.396782841823057, "percentage": 96.98, "elapsed_time": "8:02:45", "remaining_time": "0:15:00", "throughput": 2610.4, "total_tokens": 75611136} +{"current_steps": 130235, "total_steps": 134280, "loss": 0.8272, "lr": 8.2890486424681e-05, "epoch": 19.397527554364014, "percentage": 96.99, "elapsed_time": "8:02:46", "remaining_time": "0:14:59", "throughput": 2610.41, "total_tokens": 75614112} +{"current_steps": 130240, "total_steps": 134280, "loss": 0.7894, "lr": 8.268593111673383e-05, "epoch": 19.398272266904975, "percentage": 96.99, "elapsed_time": "8:02:47", "remaining_time": "0:14:58", "throughput": 2610.41, "total_tokens": 75616736} +{"current_steps": 130245, "total_steps": 134280, "loss": 0.781, "lr": 8.248162782164725e-05, "epoch": 19.399016979445936, "percentage": 97.0, "elapsed_time": "8:02:48", "remaining_time": "0:14:57", "throughput": 2610.41, "total_tokens": 75619712} +{"current_steps": 130250, "total_steps": 134280, "loss": 0.8142, "lr": 8.227757654287349e-05, "epoch": 19.399761691986892, "percentage": 97.0, "elapsed_time": "8:02:49", "remaining_time": "0:14:56", "throughput": 2610.42, "total_tokens": 75622560} +{"current_steps": 130255, "total_steps": 134280, "loss": 0.8066, "lr": 8.207377728385478e-05, "epoch": 19.400506404527853, "percentage": 97.0, "elapsed_time": "8:02:50", "remaining_time": "0:14:55", "throughput": 2610.42, "total_tokens": 75625504} +{"current_steps": 130260, "total_steps": 134280, "loss": 0.7961, "lr": 8.187023004804005e-05, "epoch": 19.40125111706881, "percentage": 97.01, "elapsed_time": "8:02:51", "remaining_time": "0:14:54", "throughput": 2610.42, "total_tokens": 75628096} +{"current_steps": 130265, "total_steps": 134280, "loss": 0.7933, "lr": 8.166693483886489e-05, "epoch": 19.40199582960977, "percentage": 97.01, "elapsed_time": "8:02:52", "remaining_time": "0:14:52", "throughput": 2610.42, "total_tokens": 75630848} +{"current_steps": 130270, "total_steps": 134280, "loss": 0.8066, "lr": 8.146389165976487e-05, "epoch": 19.40274054215073, "percentage": 97.01, "elapsed_time": "8:02:53", "remaining_time": "0:14:51", "throughput": 2610.43, "total_tokens": 75633664} +{"current_steps": 130275, "total_steps": 134280, "loss": 0.7948, "lr": 8.126110051417056e-05, "epoch": 19.403485254691688, "percentage": 97.02, "elapsed_time": "8:02:54", "remaining_time": "0:14:50", "throughput": 2610.42, "total_tokens": 75636288} +{"current_steps": 130280, "total_steps": 134280, "loss": 0.7985, "lr": 8.10585614055076e-05, "epoch": 19.40422996723265, "percentage": 97.02, "elapsed_time": "8:02:55", "remaining_time": "0:14:49", "throughput": 2610.43, "total_tokens": 75639328} +{"current_steps": 130285, "total_steps": 134280, "loss": 0.7826, "lr": 8.085627433719489e-05, "epoch": 19.40497467977361, "percentage": 97.02, "elapsed_time": "8:02:56", "remaining_time": "0:14:48", "throughput": 2610.43, "total_tokens": 75642048} +{"current_steps": 130290, "total_steps": 134280, "loss": 0.7999, "lr": 8.06542393126547e-05, "epoch": 19.405719392314566, "percentage": 97.03, "elapsed_time": "8:02:57", "remaining_time": "0:14:47", "throughput": 2610.43, "total_tokens": 75644608} +{"current_steps": 130295, "total_steps": 134280, "loss": 0.8025, "lr": 8.045245633529596e-05, "epoch": 19.406464104855527, "percentage": 97.03, "elapsed_time": "8:02:58", "remaining_time": "0:14:46", "throughput": 2610.43, "total_tokens": 75647488} +{"current_steps": 130300, "total_steps": 134280, "loss": 0.7861, "lr": 8.025092540853096e-05, "epoch": 19.407208817396484, "percentage": 97.04, "elapsed_time": "8:02:59", "remaining_time": "0:14:45", "throughput": 2610.44, "total_tokens": 75650560} +{"current_steps": 130305, "total_steps": 134280, "loss": 0.8037, "lr": 8.004964653576196e-05, "epoch": 19.407953529937444, "percentage": 97.04, "elapsed_time": "8:03:01", "remaining_time": "0:14:44", "throughput": 2610.45, "total_tokens": 75653824} +{"current_steps": 130310, "total_steps": 134280, "loss": 0.7967, "lr": 7.984861972038959e-05, "epoch": 19.408698242478405, "percentage": 97.04, "elapsed_time": "8:03:02", "remaining_time": "0:14:42", "throughput": 2610.46, "total_tokens": 75656864} +{"current_steps": 130315, "total_steps": 134280, "loss": 0.7875, "lr": 7.964784496581112e-05, "epoch": 19.40944295501936, "percentage": 97.05, "elapsed_time": "8:03:03", "remaining_time": "0:14:41", "throughput": 2610.46, "total_tokens": 75659616} +{"current_steps": 130320, "total_steps": 134280, "loss": 0.803, "lr": 7.944732227541884e-05, "epoch": 19.410187667560322, "percentage": 97.05, "elapsed_time": "8:03:04", "remaining_time": "0:14:40", "throughput": 2610.46, "total_tokens": 75662240} +{"current_steps": 130325, "total_steps": 134280, "loss": 0.7994, "lr": 7.924705165259837e-05, "epoch": 19.41093238010128, "percentage": 97.05, "elapsed_time": "8:03:05", "remaining_time": "0:14:39", "throughput": 2610.47, "total_tokens": 75665280} +{"current_steps": 130330, "total_steps": 134280, "loss": 0.7877, "lr": 7.904703310073535e-05, "epoch": 19.41167709264224, "percentage": 97.06, "elapsed_time": "8:03:06", "remaining_time": "0:14:38", "throughput": 2610.47, "total_tokens": 75668000} +{"current_steps": 130335, "total_steps": 134280, "loss": 0.7866, "lr": 7.884726662320706e-05, "epoch": 19.4124218051832, "percentage": 97.06, "elapsed_time": "8:03:07", "remaining_time": "0:14:37", "throughput": 2610.47, "total_tokens": 75670784} +{"current_steps": 130340, "total_steps": 134280, "loss": 0.8006, "lr": 7.864775222338915e-05, "epoch": 19.413166517724157, "percentage": 97.07, "elapsed_time": "8:03:08", "remaining_time": "0:14:36", "throughput": 2610.48, "total_tokens": 75673792} +{"current_steps": 130345, "total_steps": 134280, "loss": 0.7851, "lr": 7.844848990465225e-05, "epoch": 19.413911230265118, "percentage": 97.07, "elapsed_time": "8:03:09", "remaining_time": "0:14:35", "throughput": 2610.48, "total_tokens": 75676448} +{"current_steps": 130350, "total_steps": 134280, "loss": 0.7935, "lr": 7.8249479670362e-05, "epoch": 19.41465594280608, "percentage": 97.07, "elapsed_time": "8:03:10", "remaining_time": "0:14:34", "throughput": 2610.49, "total_tokens": 75679424} +{"current_steps": 130355, "total_steps": 134280, "loss": 0.8068, "lr": 7.805072152388071e-05, "epoch": 19.415400655347035, "percentage": 97.08, "elapsed_time": "8:03:11", "remaining_time": "0:14:32", "throughput": 2610.49, "total_tokens": 75682208} +{"current_steps": 130360, "total_steps": 134280, "loss": 0.8127, "lr": 7.785221546856734e-05, "epoch": 19.416145367887996, "percentage": 97.08, "elapsed_time": "8:03:12", "remaining_time": "0:14:31", "throughput": 2610.5, "total_tokens": 75685216} +{"current_steps": 130365, "total_steps": 134280, "loss": 0.8256, "lr": 7.765396150777426e-05, "epoch": 19.416890080428953, "percentage": 97.08, "elapsed_time": "8:03:13", "remaining_time": "0:14:30", "throughput": 2610.5, "total_tokens": 75688000} +{"current_steps": 130370, "total_steps": 134280, "loss": 0.8012, "lr": 7.745595964485041e-05, "epoch": 19.417634792969913, "percentage": 97.09, "elapsed_time": "8:03:14", "remaining_time": "0:14:29", "throughput": 2610.5, "total_tokens": 75690752} +{"current_steps": 130375, "total_steps": 134280, "loss": 0.8008, "lr": 7.725820988314313e-05, "epoch": 19.418379505510874, "percentage": 97.09, "elapsed_time": "8:03:15", "remaining_time": "0:14:28", "throughput": 2610.5, "total_tokens": 75693376} +{"current_steps": 130380, "total_steps": 134280, "loss": 0.7954, "lr": 7.706071222598976e-05, "epoch": 19.41912421805183, "percentage": 97.1, "elapsed_time": "8:03:16", "remaining_time": "0:14:27", "throughput": 2610.51, "total_tokens": 75696384} +{"current_steps": 130385, "total_steps": 134280, "loss": 0.7771, "lr": 7.686346667672927e-05, "epoch": 19.41986893059279, "percentage": 97.1, "elapsed_time": "8:03:17", "remaining_time": "0:14:26", "throughput": 2610.51, "total_tokens": 75699072} +{"current_steps": 130390, "total_steps": 134280, "loss": 0.7791, "lr": 7.666647323869401e-05, "epoch": 19.420613643133752, "percentage": 97.1, "elapsed_time": "8:03:18", "remaining_time": "0:14:25", "throughput": 2610.51, "total_tokens": 75701792} +{"current_steps": 130395, "total_steps": 134280, "loss": 0.8005, "lr": 7.646973191521133e-05, "epoch": 19.42135835567471, "percentage": 97.11, "elapsed_time": "8:03:19", "remaining_time": "0:14:24", "throughput": 2610.51, "total_tokens": 75704416} +{"current_steps": 130400, "total_steps": 134280, "loss": 0.794, "lr": 7.627324270960356e-05, "epoch": 19.42210306821567, "percentage": 97.11, "elapsed_time": "8:03:20", "remaining_time": "0:14:22", "throughput": 2610.51, "total_tokens": 75707200} +{"current_steps": 130405, "total_steps": 134280, "loss": 0.7993, "lr": 7.607700562519303e-05, "epoch": 19.422847780756626, "percentage": 97.11, "elapsed_time": "8:03:22", "remaining_time": "0:14:21", "throughput": 2610.52, "total_tokens": 75710208} +{"current_steps": 130410, "total_steps": 134280, "loss": 0.7877, "lr": 7.588102066529212e-05, "epoch": 19.423592493297587, "percentage": 97.12, "elapsed_time": "8:03:23", "remaining_time": "0:14:20", "throughput": 2610.5, "total_tokens": 75713024} +{"current_steps": 130415, "total_steps": 134280, "loss": 0.7987, "lr": 7.568528783321481e-05, "epoch": 19.424337205838548, "percentage": 97.12, "elapsed_time": "8:03:24", "remaining_time": "0:14:19", "throughput": 2610.51, "total_tokens": 75715776} +{"current_steps": 130420, "total_steps": 134280, "loss": 0.7782, "lr": 7.548980713226517e-05, "epoch": 19.425081918379504, "percentage": 97.13, "elapsed_time": "8:03:25", "remaining_time": "0:14:18", "throughput": 2610.51, "total_tokens": 75718720} +{"current_steps": 130425, "total_steps": 134280, "loss": 0.7983, "lr": 7.529457856574717e-05, "epoch": 19.425826630920465, "percentage": 97.13, "elapsed_time": "8:03:26", "remaining_time": "0:14:17", "throughput": 2610.51, "total_tokens": 75721568} +{"current_steps": 130430, "total_steps": 134280, "loss": 0.7787, "lr": 7.509960213695821e-05, "epoch": 19.426571343461426, "percentage": 97.13, "elapsed_time": "8:03:27", "remaining_time": "0:14:16", "throughput": 2610.52, "total_tokens": 75724448} +{"current_steps": 130435, "total_steps": 134280, "loss": 0.7833, "lr": 7.49048778491923e-05, "epoch": 19.427316056002383, "percentage": 97.14, "elapsed_time": "8:03:28", "remaining_time": "0:14:15", "throughput": 2610.53, "total_tokens": 75727424} +{"current_steps": 130440, "total_steps": 134280, "loss": 0.7814, "lr": 7.47104057057385e-05, "epoch": 19.428060768543343, "percentage": 97.14, "elapsed_time": "8:03:29", "remaining_time": "0:14:14", "throughput": 2610.53, "total_tokens": 75730528} +{"current_steps": 130445, "total_steps": 134280, "loss": 0.8045, "lr": 7.451618570988416e-05, "epoch": 19.4288054810843, "percentage": 97.14, "elapsed_time": "8:03:30", "remaining_time": "0:14:12", "throughput": 2610.54, "total_tokens": 75733472} +{"current_steps": 130450, "total_steps": 134280, "loss": 0.8056, "lr": 7.432221786491e-05, "epoch": 19.42955019362526, "percentage": 97.15, "elapsed_time": "8:03:31", "remaining_time": "0:14:11", "throughput": 2610.55, "total_tokens": 75736800} +{"current_steps": 130455, "total_steps": 134280, "loss": 0.7885, "lr": 7.412850217409006e-05, "epoch": 19.43029490616622, "percentage": 97.15, "elapsed_time": "8:03:33", "remaining_time": "0:14:10", "throughput": 2610.58, "total_tokens": 75740640} +{"current_steps": 130460, "total_steps": 134280, "loss": 0.779, "lr": 7.393503864070006e-05, "epoch": 19.431039618707178, "percentage": 97.16, "elapsed_time": "8:03:34", "remaining_time": "0:14:09", "throughput": 2610.58, "total_tokens": 75743648} +{"current_steps": 130465, "total_steps": 134280, "loss": 0.7993, "lr": 7.374182726800904e-05, "epoch": 19.43178433124814, "percentage": 97.16, "elapsed_time": "8:03:35", "remaining_time": "0:14:08", "throughput": 2610.58, "total_tokens": 75746368} +{"current_steps": 130470, "total_steps": 134280, "loss": 0.7929, "lr": 7.354886805927773e-05, "epoch": 19.432529043789096, "percentage": 97.16, "elapsed_time": "8:03:36", "remaining_time": "0:14:07", "throughput": 2610.59, "total_tokens": 75749152} +{"current_steps": 130475, "total_steps": 134280, "loss": 0.7873, "lr": 7.335616101776854e-05, "epoch": 19.433273756330056, "percentage": 97.17, "elapsed_time": "8:03:37", "remaining_time": "0:14:06", "throughput": 2610.6, "total_tokens": 75752352} +{"current_steps": 130480, "total_steps": 134280, "loss": 0.8013, "lr": 7.31637061467355e-05, "epoch": 19.434018468871017, "percentage": 97.17, "elapsed_time": "8:03:38", "remaining_time": "0:14:05", "throughput": 2610.6, "total_tokens": 75755328} +{"current_steps": 130485, "total_steps": 134280, "loss": 0.8024, "lr": 7.297150344943103e-05, "epoch": 19.434763181411974, "percentage": 97.17, "elapsed_time": "8:03:39", "remaining_time": "0:14:03", "throughput": 2610.61, "total_tokens": 75758368} +{"current_steps": 130490, "total_steps": 134280, "loss": 0.8058, "lr": 7.277955292910088e-05, "epoch": 19.435507893952934, "percentage": 97.18, "elapsed_time": "8:03:40", "remaining_time": "0:14:02", "throughput": 2610.62, "total_tokens": 75761280} +{"current_steps": 130495, "total_steps": 134280, "loss": 0.8141, "lr": 7.258785458898908e-05, "epoch": 19.436252606493895, "percentage": 97.18, "elapsed_time": "8:03:41", "remaining_time": "0:14:01", "throughput": 2610.62, "total_tokens": 75764192} +{"current_steps": 130500, "total_steps": 134280, "loss": 0.8109, "lr": 7.239640843233475e-05, "epoch": 19.43699731903485, "percentage": 97.18, "elapsed_time": "8:03:42", "remaining_time": "0:14:00", "throughput": 2610.63, "total_tokens": 75766944} +{"current_steps": 130505, "total_steps": 134280, "loss": 0.7903, "lr": 7.220521446237194e-05, "epoch": 19.437742031575812, "percentage": 97.19, "elapsed_time": "8:03:43", "remaining_time": "0:13:59", "throughput": 2610.63, "total_tokens": 75769888} +{"current_steps": 130510, "total_steps": 134280, "loss": 0.7957, "lr": 7.201427268232974e-05, "epoch": 19.43848674411677, "percentage": 97.19, "elapsed_time": "8:03:44", "remaining_time": "0:13:58", "throughput": 2610.63, "total_tokens": 75772640} +{"current_steps": 130515, "total_steps": 134280, "loss": 0.7872, "lr": 7.182358309543224e-05, "epoch": 19.43923145665773, "percentage": 97.2, "elapsed_time": "8:03:45", "remaining_time": "0:13:57", "throughput": 2610.64, "total_tokens": 75775456} +{"current_steps": 130520, "total_steps": 134280, "loss": 0.7733, "lr": 7.16331457049052e-05, "epoch": 19.43997616919869, "percentage": 97.2, "elapsed_time": "8:03:46", "remaining_time": "0:13:56", "throughput": 2610.64, "total_tokens": 75778112} +{"current_steps": 130525, "total_steps": 134280, "loss": 0.7928, "lr": 7.14429605139627e-05, "epoch": 19.440720881739647, "percentage": 97.2, "elapsed_time": "8:03:47", "remaining_time": "0:13:55", "throughput": 2610.64, "total_tokens": 75781056} +{"current_steps": 130530, "total_steps": 134280, "loss": 0.8163, "lr": 7.125302752581885e-05, "epoch": 19.441465594280608, "percentage": 97.21, "elapsed_time": "8:03:48", "remaining_time": "0:13:53", "throughput": 2610.65, "total_tokens": 75784128} +{"current_steps": 130535, "total_steps": 134280, "loss": 0.8094, "lr": 7.106334674368275e-05, "epoch": 19.44221030682157, "percentage": 97.21, "elapsed_time": "8:03:49", "remaining_time": "0:13:52", "throughput": 2610.65, "total_tokens": 75786848} +{"current_steps": 130540, "total_steps": 134280, "loss": 0.7964, "lr": 7.08739181707585e-05, "epoch": 19.442955019362525, "percentage": 97.21, "elapsed_time": "8:03:50", "remaining_time": "0:13:51", "throughput": 2610.66, "total_tokens": 75789984} +{"current_steps": 130545, "total_steps": 134280, "loss": 0.8107, "lr": 7.068474181024519e-05, "epoch": 19.443699731903486, "percentage": 97.22, "elapsed_time": "8:03:52", "remaining_time": "0:13:50", "throughput": 2610.66, "total_tokens": 75792736} +{"current_steps": 130550, "total_steps": 134280, "loss": 0.8024, "lr": 7.04958176653403e-05, "epoch": 19.444444444444443, "percentage": 97.22, "elapsed_time": "8:03:53", "remaining_time": "0:13:49", "throughput": 2610.67, "total_tokens": 75795936} +{"current_steps": 130555, "total_steps": 134280, "loss": 0.7945, "lr": 7.030714573923458e-05, "epoch": 19.445189156985403, "percentage": 97.23, "elapsed_time": "8:03:54", "remaining_time": "0:13:48", "throughput": 2610.68, "total_tokens": 75798848} +{"current_steps": 130560, "total_steps": 134280, "loss": 0.8038, "lr": 7.011872603511549e-05, "epoch": 19.445933869526364, "percentage": 97.23, "elapsed_time": "8:03:55", "remaining_time": "0:13:47", "throughput": 2610.68, "total_tokens": 75801664} +{"current_steps": 130565, "total_steps": 134280, "loss": 0.8189, "lr": 6.993055855616714e-05, "epoch": 19.44667858206732, "percentage": 97.23, "elapsed_time": "8:03:56", "remaining_time": "0:13:46", "throughput": 2610.68, "total_tokens": 75804352} +{"current_steps": 130570, "total_steps": 134280, "loss": 0.8018, "lr": 6.9742643305567e-05, "epoch": 19.44742329460828, "percentage": 97.24, "elapsed_time": "8:03:57", "remaining_time": "0:13:45", "throughput": 2610.69, "total_tokens": 75807328} +{"current_steps": 130575, "total_steps": 134280, "loss": 0.8078, "lr": 6.955498028649088e-05, "epoch": 19.448168007149242, "percentage": 97.24, "elapsed_time": "8:03:58", "remaining_time": "0:13:43", "throughput": 2610.7, "total_tokens": 75810368} +{"current_steps": 130580, "total_steps": 134280, "loss": 0.8038, "lr": 6.936756950210954e-05, "epoch": 19.4489127196902, "percentage": 97.24, "elapsed_time": "8:03:59", "remaining_time": "0:13:42", "throughput": 2610.7, "total_tokens": 75813120} +{"current_steps": 130585, "total_steps": 134280, "loss": 0.8102, "lr": 6.918041095558713e-05, "epoch": 19.44965743223116, "percentage": 97.25, "elapsed_time": "8:04:00", "remaining_time": "0:13:41", "throughput": 2610.7, "total_tokens": 75816096} +{"current_steps": 130590, "total_steps": 134280, "loss": 0.8123, "lr": 6.899350465008613e-05, "epoch": 19.450402144772116, "percentage": 97.25, "elapsed_time": "8:04:01", "remaining_time": "0:13:40", "throughput": 2610.71, "total_tokens": 75819136} +{"current_steps": 130595, "total_steps": 134280, "loss": 0.8016, "lr": 6.880685058876567e-05, "epoch": 19.451146857313077, "percentage": 97.26, "elapsed_time": "8:04:02", "remaining_time": "0:13:39", "throughput": 2610.71, "total_tokens": 75821824} +{"current_steps": 130600, "total_steps": 134280, "loss": 0.7976, "lr": 6.862044877477823e-05, "epoch": 19.451891569854038, "percentage": 97.26, "elapsed_time": "8:04:03", "remaining_time": "0:13:38", "throughput": 2610.71, "total_tokens": 75824576} +{"current_steps": 130605, "total_steps": 134280, "loss": 0.8095, "lr": 6.843429921127298e-05, "epoch": 19.452636282394995, "percentage": 97.26, "elapsed_time": "8:04:04", "remaining_time": "0:13:37", "throughput": 2610.72, "total_tokens": 75827680} +{"current_steps": 130610, "total_steps": 134280, "loss": 0.7837, "lr": 6.824840190139403e-05, "epoch": 19.453380994935955, "percentage": 97.27, "elapsed_time": "8:04:05", "remaining_time": "0:13:36", "throughput": 2610.73, "total_tokens": 75831040} +{"current_steps": 130615, "total_steps": 134280, "loss": 0.794, "lr": 6.806275684828222e-05, "epoch": 19.454125707476916, "percentage": 97.27, "elapsed_time": "8:04:06", "remaining_time": "0:13:35", "throughput": 2610.74, "total_tokens": 75833888} +{"current_steps": 130620, "total_steps": 134280, "loss": 0.8072, "lr": 6.787736405507505e-05, "epoch": 19.454870420017873, "percentage": 97.27, "elapsed_time": "8:04:07", "remaining_time": "0:13:33", "throughput": 2610.74, "total_tokens": 75836864} +{"current_steps": 130625, "total_steps": 134280, "loss": 0.7784, "lr": 6.769222352490167e-05, "epoch": 19.455615132558833, "percentage": 97.28, "elapsed_time": "8:04:09", "remaining_time": "0:13:32", "throughput": 2610.75, "total_tokens": 75839712} +{"current_steps": 130630, "total_steps": 134280, "loss": 0.7981, "lr": 6.750733526089292e-05, "epoch": 19.45635984509979, "percentage": 97.28, "elapsed_time": "8:04:10", "remaining_time": "0:13:31", "throughput": 2610.76, "total_tokens": 75842752} +{"current_steps": 130635, "total_steps": 134280, "loss": 0.8102, "lr": 6.732269926616963e-05, "epoch": 19.45710455764075, "percentage": 97.29, "elapsed_time": "8:04:11", "remaining_time": "0:13:30", "throughput": 2610.77, "total_tokens": 75845952} +{"current_steps": 130640, "total_steps": 134280, "loss": 0.7992, "lr": 6.713831554385429e-05, "epoch": 19.45784927018171, "percentage": 97.29, "elapsed_time": "8:04:12", "remaining_time": "0:13:29", "throughput": 2610.78, "total_tokens": 75849088} +{"current_steps": 130645, "total_steps": 134280, "loss": 0.8351, "lr": 6.695418409705944e-05, "epoch": 19.458593982722668, "percentage": 97.29, "elapsed_time": "8:04:13", "remaining_time": "0:13:28", "throughput": 2610.78, "total_tokens": 75852096} +{"current_steps": 130650, "total_steps": 134280, "loss": 0.795, "lr": 6.677030492889591e-05, "epoch": 19.45933869526363, "percentage": 97.3, "elapsed_time": "8:04:14", "remaining_time": "0:13:27", "throughput": 2610.78, "total_tokens": 75854752} +{"current_steps": 130655, "total_steps": 134280, "loss": 0.8003, "lr": 6.65866780424712e-05, "epoch": 19.46008340780459, "percentage": 97.3, "elapsed_time": "8:04:15", "remaining_time": "0:13:26", "throughput": 2610.79, "total_tokens": 75857888} +{"current_steps": 130660, "total_steps": 134280, "loss": 0.8403, "lr": 6.640330344088618e-05, "epoch": 19.460828120345546, "percentage": 97.3, "elapsed_time": "8:04:16", "remaining_time": "0:13:25", "throughput": 2610.79, "total_tokens": 75860608} +{"current_steps": 130665, "total_steps": 134280, "loss": 0.8192, "lr": 6.622018112724004e-05, "epoch": 19.461572832886507, "percentage": 97.31, "elapsed_time": "8:04:17", "remaining_time": "0:13:23", "throughput": 2610.81, "total_tokens": 75863872} +{"current_steps": 130670, "total_steps": 134280, "loss": 0.7937, "lr": 6.603731110462529e-05, "epoch": 19.462317545427464, "percentage": 97.31, "elapsed_time": "8:04:18", "remaining_time": "0:13:22", "throughput": 2610.81, "total_tokens": 75866848} +{"current_steps": 130675, "total_steps": 134280, "loss": 0.8072, "lr": 6.58546933761328e-05, "epoch": 19.463062257968424, "percentage": 97.32, "elapsed_time": "8:04:19", "remaining_time": "0:13:21", "throughput": 2610.82, "total_tokens": 75869856} +{"current_steps": 130680, "total_steps": 134280, "loss": 0.8098, "lr": 6.567232794484678e-05, "epoch": 19.463806970509385, "percentage": 97.32, "elapsed_time": "8:04:20", "remaining_time": "0:13:20", "throughput": 2610.82, "total_tokens": 75872480} +{"current_steps": 130685, "total_steps": 134280, "loss": 0.8056, "lr": 6.549021481384809e-05, "epoch": 19.464551683050342, "percentage": 97.32, "elapsed_time": "8:04:21", "remaining_time": "0:13:19", "throughput": 2610.83, "total_tokens": 75875680} +{"current_steps": 130690, "total_steps": 134280, "loss": 0.7664, "lr": 6.53083539862126e-05, "epoch": 19.465296395591302, "percentage": 97.33, "elapsed_time": "8:04:22", "remaining_time": "0:13:18", "throughput": 2610.83, "total_tokens": 75878560} +{"current_steps": 130695, "total_steps": 134280, "loss": 0.7905, "lr": 6.51267454650145e-05, "epoch": 19.46604110813226, "percentage": 97.33, "elapsed_time": "8:04:24", "remaining_time": "0:13:17", "throughput": 2610.84, "total_tokens": 75881728} +{"current_steps": 130700, "total_steps": 134280, "loss": 0.7843, "lr": 6.494538925332138e-05, "epoch": 19.46678582067322, "percentage": 97.33, "elapsed_time": "8:04:25", "remaining_time": "0:13:16", "throughput": 2610.85, "total_tokens": 75884896} +{"current_steps": 130705, "total_steps": 134280, "loss": 0.7977, "lr": 6.476428535419576e-05, "epoch": 19.46753053321418, "percentage": 97.34, "elapsed_time": "8:04:26", "remaining_time": "0:13:15", "throughput": 2610.86, "total_tokens": 75887904} +{"current_steps": 130710, "total_steps": 134280, "loss": 0.8199, "lr": 6.458343377069687e-05, "epoch": 19.468275245755137, "percentage": 97.34, "elapsed_time": "8:04:27", "remaining_time": "0:13:13", "throughput": 2610.86, "total_tokens": 75890560} +{"current_steps": 130715, "total_steps": 134280, "loss": 0.7867, "lr": 6.440283450588391e-05, "epoch": 19.469019958296098, "percentage": 97.35, "elapsed_time": "8:04:28", "remaining_time": "0:13:12", "throughput": 2610.86, "total_tokens": 75893280} +{"current_steps": 130720, "total_steps": 134280, "loss": 0.8111, "lr": 6.42224875628028e-05, "epoch": 19.46976467083706, "percentage": 97.35, "elapsed_time": "8:04:29", "remaining_time": "0:13:11", "throughput": 2610.86, "total_tokens": 75896128} +{"current_steps": 130725, "total_steps": 134280, "loss": 0.7974, "lr": 6.404239294450442e-05, "epoch": 19.470509383378015, "percentage": 97.35, "elapsed_time": "8:04:30", "remaining_time": "0:13:10", "throughput": 2610.87, "total_tokens": 75899168} +{"current_steps": 130730, "total_steps": 134280, "loss": 0.8096, "lr": 6.386255065402801e-05, "epoch": 19.471254095918976, "percentage": 97.36, "elapsed_time": "8:04:31", "remaining_time": "0:13:09", "throughput": 2610.88, "total_tokens": 75902272} +{"current_steps": 130735, "total_steps": 134280, "loss": 0.7988, "lr": 6.368296069441447e-05, "epoch": 19.471998808459933, "percentage": 97.36, "elapsed_time": "8:04:32", "remaining_time": "0:13:08", "throughput": 2610.88, "total_tokens": 75905216} +{"current_steps": 130740, "total_steps": 134280, "loss": 0.7925, "lr": 6.350362306869639e-05, "epoch": 19.472743521000893, "percentage": 97.36, "elapsed_time": "8:04:33", "remaining_time": "0:13:07", "throughput": 2610.89, "total_tokens": 75908224} +{"current_steps": 130745, "total_steps": 134280, "loss": 0.7883, "lr": 6.332453777990465e-05, "epoch": 19.473488233541854, "percentage": 97.37, "elapsed_time": "8:04:34", "remaining_time": "0:13:06", "throughput": 2610.89, "total_tokens": 75910880} +{"current_steps": 130750, "total_steps": 134280, "loss": 0.7838, "lr": 6.314570483106352e-05, "epoch": 19.47423294608281, "percentage": 97.37, "elapsed_time": "8:04:35", "remaining_time": "0:13:04", "throughput": 2610.9, "total_tokens": 75913888} +{"current_steps": 130755, "total_steps": 134280, "loss": 0.8097, "lr": 6.29671242251939e-05, "epoch": 19.47497765862377, "percentage": 97.37, "elapsed_time": "8:04:36", "remaining_time": "0:13:03", "throughput": 2610.91, "total_tokens": 75917216} +{"current_steps": 130760, "total_steps": 134280, "loss": 0.796, "lr": 6.278879596531339e-05, "epoch": 19.475722371164732, "percentage": 97.38, "elapsed_time": "8:04:37", "remaining_time": "0:13:02", "throughput": 2610.92, "total_tokens": 75920128} +{"current_steps": 130765, "total_steps": 134280, "loss": 0.8068, "lr": 6.261072005443457e-05, "epoch": 19.47646708370569, "percentage": 97.38, "elapsed_time": "8:04:39", "remaining_time": "0:13:01", "throughput": 2610.93, "total_tokens": 75923296} +{"current_steps": 130770, "total_steps": 134280, "loss": 0.7978, "lr": 6.243289649556671e-05, "epoch": 19.47721179624665, "percentage": 97.39, "elapsed_time": "8:04:40", "remaining_time": "0:13:00", "throughput": 2610.93, "total_tokens": 75926208} +{"current_steps": 130775, "total_steps": 134280, "loss": 0.8065, "lr": 6.22553252917124e-05, "epoch": 19.477956508787607, "percentage": 97.39, "elapsed_time": "8:04:41", "remaining_time": "0:12:59", "throughput": 2610.94, "total_tokens": 75929152} +{"current_steps": 130780, "total_steps": 134280, "loss": 0.7891, "lr": 6.207800644587257e-05, "epoch": 19.478701221328567, "percentage": 97.39, "elapsed_time": "8:04:42", "remaining_time": "0:12:58", "throughput": 2610.94, "total_tokens": 75931968} +{"current_steps": 130785, "total_steps": 134280, "loss": 0.7926, "lr": 6.190093996104318e-05, "epoch": 19.479445933869528, "percentage": 97.4, "elapsed_time": "8:04:43", "remaining_time": "0:12:57", "throughput": 2610.95, "total_tokens": 75935072} +{"current_steps": 130790, "total_steps": 134280, "loss": 0.7696, "lr": 6.172412584021514e-05, "epoch": 19.480190646410485, "percentage": 97.4, "elapsed_time": "8:04:44", "remaining_time": "0:12:56", "throughput": 2610.95, "total_tokens": 75937856} +{"current_steps": 130795, "total_steps": 134280, "loss": 0.8122, "lr": 6.154756408637441e-05, "epoch": 19.480935358951445, "percentage": 97.4, "elapsed_time": "8:04:45", "remaining_time": "0:12:54", "throughput": 2610.96, "total_tokens": 75940864} +{"current_steps": 130800, "total_steps": 134280, "loss": 0.7993, "lr": 6.137125470250525e-05, "epoch": 19.481680071492406, "percentage": 97.41, "elapsed_time": "8:04:46", "remaining_time": "0:12:53", "throughput": 2610.96, "total_tokens": 75943488} +{"current_steps": 130805, "total_steps": 134280, "loss": 0.8019, "lr": 6.119519769158699e-05, "epoch": 19.482424784033363, "percentage": 97.41, "elapsed_time": "8:04:47", "remaining_time": "0:12:52", "throughput": 2610.96, "total_tokens": 75946272} +{"current_steps": 130810, "total_steps": 134280, "loss": 0.7971, "lr": 6.1019393056590544e-05, "epoch": 19.483169496574323, "percentage": 97.42, "elapsed_time": "8:04:48", "remaining_time": "0:12:51", "throughput": 2610.97, "total_tokens": 75949152} +{"current_steps": 130815, "total_steps": 134280, "loss": 0.7886, "lr": 6.084384080049021e-05, "epoch": 19.48391420911528, "percentage": 97.42, "elapsed_time": "8:04:49", "remaining_time": "0:12:50", "throughput": 2610.97, "total_tokens": 75952064} +{"current_steps": 130820, "total_steps": 134280, "loss": 0.803, "lr": 6.066854092624863e-05, "epoch": 19.48465892165624, "percentage": 97.42, "elapsed_time": "8:04:50", "remaining_time": "0:12:49", "throughput": 2610.98, "total_tokens": 75954944} +{"current_steps": 130825, "total_steps": 134280, "loss": 0.8, "lr": 6.0493493436828417e-05, "epoch": 19.4854036341972, "percentage": 97.43, "elapsed_time": "8:04:51", "remaining_time": "0:12:48", "throughput": 2610.97, "total_tokens": 75957536} +{"current_steps": 130830, "total_steps": 134280, "loss": 0.7803, "lr": 6.031869833518555e-05, "epoch": 19.486148346738158, "percentage": 97.43, "elapsed_time": "8:04:52", "remaining_time": "0:12:47", "throughput": 2610.98, "total_tokens": 75960640} +{"current_steps": 130835, "total_steps": 134280, "loss": 0.7958, "lr": 6.0144155624276e-05, "epoch": 19.48689305927912, "percentage": 97.43, "elapsed_time": "8:04:53", "remaining_time": "0:12:46", "throughput": 2610.99, "total_tokens": 75963680} +{"current_steps": 130840, "total_steps": 134280, "loss": 0.7862, "lr": 5.996986530704573e-05, "epoch": 19.487637771820076, "percentage": 97.44, "elapsed_time": "8:04:54", "remaining_time": "0:12:44", "throughput": 2610.99, "total_tokens": 75966496} +{"current_steps": 130845, "total_steps": 134280, "loss": 0.7824, "lr": 5.979582738644073e-05, "epoch": 19.488382484361036, "percentage": 97.44, "elapsed_time": "8:04:55", "remaining_time": "0:12:43", "throughput": 2610.99, "total_tokens": 75969184} +{"current_steps": 130850, "total_steps": 134280, "loss": 0.7917, "lr": 5.9622041865401987e-05, "epoch": 19.489127196901997, "percentage": 97.45, "elapsed_time": "8:04:56", "remaining_time": "0:12:42", "throughput": 2611.0, "total_tokens": 75972288} +{"current_steps": 130855, "total_steps": 134280, "loss": 0.7973, "lr": 5.944850874686213e-05, "epoch": 19.489871909442954, "percentage": 97.45, "elapsed_time": "8:04:58", "remaining_time": "0:12:41", "throughput": 2611.0, "total_tokens": 75974976} +{"current_steps": 130860, "total_steps": 134280, "loss": 0.7929, "lr": 5.927522803375551e-05, "epoch": 19.490616621983914, "percentage": 97.45, "elapsed_time": "8:04:59", "remaining_time": "0:12:40", "throughput": 2611.01, "total_tokens": 75977920} +{"current_steps": 130865, "total_steps": 134280, "loss": 0.7828, "lr": 5.9102199729009764e-05, "epoch": 19.491361334524875, "percentage": 97.46, "elapsed_time": "8:05:00", "remaining_time": "0:12:39", "throughput": 2611.01, "total_tokens": 75980704} +{"current_steps": 130870, "total_steps": 134280, "loss": 0.8, "lr": 5.892942383554589e-05, "epoch": 19.492106047065832, "percentage": 97.46, "elapsed_time": "8:05:01", "remaining_time": "0:12:38", "throughput": 2611.01, "total_tokens": 75983552} +{"current_steps": 130875, "total_steps": 134280, "loss": 0.7986, "lr": 5.875690035628489e-05, "epoch": 19.492850759606792, "percentage": 97.46, "elapsed_time": "8:05:02", "remaining_time": "0:12:37", "throughput": 2611.03, "total_tokens": 75986880} +{"current_steps": 130880, "total_steps": 134280, "loss": 0.8182, "lr": 5.858462929413943e-05, "epoch": 19.49359547214775, "percentage": 97.47, "elapsed_time": "8:05:03", "remaining_time": "0:12:36", "throughput": 2611.03, "total_tokens": 75989760} +{"current_steps": 130885, "total_steps": 134280, "loss": 0.8087, "lr": 5.841261065202052e-05, "epoch": 19.49434018468871, "percentage": 97.47, "elapsed_time": "8:05:04", "remaining_time": "0:12:34", "throughput": 2611.04, "total_tokens": 75992864} +{"current_steps": 130890, "total_steps": 134280, "loss": 0.7886, "lr": 5.8240844432835835e-05, "epoch": 19.49508489722967, "percentage": 97.48, "elapsed_time": "8:05:05", "remaining_time": "0:12:33", "throughput": 2611.04, "total_tokens": 75995744} +{"current_steps": 130895, "total_steps": 134280, "loss": 0.8134, "lr": 5.806933063948638e-05, "epoch": 19.495829609770627, "percentage": 97.48, "elapsed_time": "8:05:06", "remaining_time": "0:12:32", "throughput": 2611.05, "total_tokens": 75998656} +{"current_steps": 130900, "total_steps": 134280, "loss": 0.8107, "lr": 5.789806927486818e-05, "epoch": 19.496574322311588, "percentage": 97.48, "elapsed_time": "8:05:07", "remaining_time": "0:12:31", "throughput": 2611.06, "total_tokens": 76001696} +{"current_steps": 130905, "total_steps": 134280, "loss": 0.792, "lr": 5.772706034187558e-05, "epoch": 19.49731903485255, "percentage": 97.49, "elapsed_time": "8:05:08", "remaining_time": "0:12:30", "throughput": 2611.05, "total_tokens": 76004288} +{"current_steps": 130910, "total_steps": 134280, "loss": 0.7956, "lr": 5.7556303843397934e-05, "epoch": 19.498063747393505, "percentage": 97.49, "elapsed_time": "8:05:09", "remaining_time": "0:12:29", "throughput": 2611.06, "total_tokens": 76007104} +{"current_steps": 130915, "total_steps": 134280, "loss": 0.7916, "lr": 5.738579978231961e-05, "epoch": 19.498808459934466, "percentage": 97.49, "elapsed_time": "8:05:10", "remaining_time": "0:12:28", "throughput": 2611.06, "total_tokens": 76009760} +{"current_steps": 130920, "total_steps": 134280, "loss": 0.7873, "lr": 5.7215548161521634e-05, "epoch": 19.499553172475423, "percentage": 97.5, "elapsed_time": "8:05:11", "remaining_time": "0:12:27", "throughput": 2611.06, "total_tokens": 76012384} +{"current_steps": 130925, "total_steps": 134280, "loss": 0.818, "lr": 5.704554898387837e-05, "epoch": 19.500297885016384, "percentage": 97.5, "elapsed_time": "8:05:12", "remaining_time": "0:12:26", "throughput": 2611.06, "total_tokens": 76015392} +{"current_steps": 130930, "total_steps": 134280, "loss": 0.7819, "lr": 5.687580225226418e-05, "epoch": 19.501042597557344, "percentage": 97.51, "elapsed_time": "8:05:13", "remaining_time": "0:12:24", "throughput": 2611.07, "total_tokens": 76018240} +{"current_steps": 130935, "total_steps": 134280, "loss": 0.8048, "lr": 5.6706307969546785e-05, "epoch": 19.5017873100983, "percentage": 97.51, "elapsed_time": "8:05:14", "remaining_time": "0:12:23", "throughput": 2611.07, "total_tokens": 76021088} +{"current_steps": 130940, "total_steps": 134280, "loss": 0.7852, "lr": 5.6537066138588886e-05, "epoch": 19.50253202263926, "percentage": 97.51, "elapsed_time": "8:05:15", "remaining_time": "0:12:22", "throughput": 2611.08, "total_tokens": 76024000} +{"current_steps": 130945, "total_steps": 134280, "loss": 0.801, "lr": 5.6368076762248196e-05, "epoch": 19.503276735180222, "percentage": 97.52, "elapsed_time": "8:05:17", "remaining_time": "0:12:21", "throughput": 2611.08, "total_tokens": 76027136} +{"current_steps": 130950, "total_steps": 134280, "loss": 0.7963, "lr": 5.619933984338077e-05, "epoch": 19.50402144772118, "percentage": 97.52, "elapsed_time": "8:05:18", "remaining_time": "0:12:20", "throughput": 2611.09, "total_tokens": 76030016} +{"current_steps": 130955, "total_steps": 134280, "loss": 0.7764, "lr": 5.603085538483765e-05, "epoch": 19.50476616026214, "percentage": 97.52, "elapsed_time": "8:05:19", "remaining_time": "0:12:19", "throughput": 2611.09, "total_tokens": 76032800} +{"current_steps": 130960, "total_steps": 134280, "loss": 0.7991, "lr": 5.5862623389463234e-05, "epoch": 19.505510872803097, "percentage": 97.53, "elapsed_time": "8:05:20", "remaining_time": "0:12:18", "throughput": 2611.09, "total_tokens": 76035616} +{"current_steps": 130965, "total_steps": 134280, "loss": 0.793, "lr": 5.5694643860103585e-05, "epoch": 19.506255585344057, "percentage": 97.53, "elapsed_time": "8:05:21", "remaining_time": "0:12:17", "throughput": 2611.1, "total_tokens": 76038432} +{"current_steps": 130970, "total_steps": 134280, "loss": 0.7859, "lr": 5.5526916799593094e-05, "epoch": 19.507000297885018, "percentage": 97.54, "elapsed_time": "8:05:22", "remaining_time": "0:12:16", "throughput": 2611.1, "total_tokens": 76041120} +{"current_steps": 130975, "total_steps": 134280, "loss": 0.7969, "lr": 5.5359442210766163e-05, "epoch": 19.507745010425975, "percentage": 97.54, "elapsed_time": "8:05:23", "remaining_time": "0:12:14", "throughput": 2611.1, "total_tokens": 76043904} +{"current_steps": 130980, "total_steps": 134280, "loss": 0.7967, "lr": 5.5192220096453855e-05, "epoch": 19.508489722966935, "percentage": 97.54, "elapsed_time": "8:05:24", "remaining_time": "0:12:13", "throughput": 2611.11, "total_tokens": 76046880} +{"current_steps": 130985, "total_steps": 134280, "loss": 0.7764, "lr": 5.5025250459478924e-05, "epoch": 19.509234435507892, "percentage": 97.55, "elapsed_time": "8:05:25", "remaining_time": "0:12:12", "throughput": 2611.11, "total_tokens": 76049600} +{"current_steps": 130990, "total_steps": 134280, "loss": 0.7788, "lr": 5.4858533302662436e-05, "epoch": 19.509979148048853, "percentage": 97.55, "elapsed_time": "8:05:26", "remaining_time": "0:12:11", "throughput": 2611.11, "total_tokens": 76052480} +{"current_steps": 130995, "total_steps": 134280, "loss": 0.7893, "lr": 5.469206862882214e-05, "epoch": 19.510723860589813, "percentage": 97.55, "elapsed_time": "8:05:27", "remaining_time": "0:12:10", "throughput": 2611.12, "total_tokens": 76055552} +{"current_steps": 131000, "total_steps": 134280, "loss": 0.8087, "lr": 5.4525856440769124e-05, "epoch": 19.51146857313077, "percentage": 97.56, "elapsed_time": "8:05:28", "remaining_time": "0:12:09", "throughput": 2611.12, "total_tokens": 76058464} +{"current_steps": 131005, "total_steps": 134280, "loss": 0.8263, "lr": 5.4359896741312804e-05, "epoch": 19.51221328567173, "percentage": 97.56, "elapsed_time": "8:05:29", "remaining_time": "0:12:08", "throughput": 2611.13, "total_tokens": 76061408} +{"current_steps": 131010, "total_steps": 134280, "loss": 0.8044, "lr": 5.4194189533254275e-05, "epoch": 19.51295799821269, "percentage": 97.56, "elapsed_time": "8:05:30", "remaining_time": "0:12:07", "throughput": 2611.14, "total_tokens": 76064512} +{"current_steps": 131015, "total_steps": 134280, "loss": 0.7855, "lr": 5.4028734819396295e-05, "epoch": 19.51370271075365, "percentage": 97.57, "elapsed_time": "8:05:31", "remaining_time": "0:12:05", "throughput": 2611.15, "total_tokens": 76067456} +{"current_steps": 131020, "total_steps": 134280, "loss": 0.7743, "lr": 5.3863532602531626e-05, "epoch": 19.51444742329461, "percentage": 97.57, "elapsed_time": "8:05:32", "remaining_time": "0:12:04", "throughput": 2611.15, "total_tokens": 76070144} +{"current_steps": 131025, "total_steps": 134280, "loss": 0.799, "lr": 5.369858288545304e-05, "epoch": 19.515192135835566, "percentage": 97.58, "elapsed_time": "8:05:33", "remaining_time": "0:12:03", "throughput": 2611.14, "total_tokens": 76072576} +{"current_steps": 131030, "total_steps": 134280, "loss": 0.7833, "lr": 5.353388567094497e-05, "epoch": 19.515936848376526, "percentage": 97.58, "elapsed_time": "8:05:34", "remaining_time": "0:12:02", "throughput": 2611.15, "total_tokens": 76075552} +{"current_steps": 131035, "total_steps": 134280, "loss": 0.8025, "lr": 5.336944096179186e-05, "epoch": 19.516681560917487, "percentage": 97.58, "elapsed_time": "8:05:35", "remaining_time": "0:12:01", "throughput": 2611.15, "total_tokens": 76078080} +{"current_steps": 131040, "total_steps": 134280, "loss": 0.7932, "lr": 5.320524876076982e-05, "epoch": 19.517426273458444, "percentage": 97.59, "elapsed_time": "8:05:36", "remaining_time": "0:12:00", "throughput": 2611.16, "total_tokens": 76081152} +{"current_steps": 131045, "total_steps": 134280, "loss": 0.7928, "lr": 5.304130907065496e-05, "epoch": 19.518170985999404, "percentage": 97.59, "elapsed_time": "8:05:38", "remaining_time": "0:11:59", "throughput": 2611.16, "total_tokens": 76084192} +{"current_steps": 131050, "total_steps": 134280, "loss": 0.7981, "lr": 5.2877621894215075e-05, "epoch": 19.518915698540365, "percentage": 97.59, "elapsed_time": "8:05:39", "remaining_time": "0:11:58", "throughput": 2611.18, "total_tokens": 76087776} +{"current_steps": 131055, "total_steps": 134280, "loss": 0.8027, "lr": 5.271418723421628e-05, "epoch": 19.519660411081322, "percentage": 97.6, "elapsed_time": "8:05:40", "remaining_time": "0:11:57", "throughput": 2611.19, "total_tokens": 76090912} +{"current_steps": 131060, "total_steps": 134280, "loss": 0.7871, "lr": 5.2551005093419697e-05, "epoch": 19.520405123622282, "percentage": 97.6, "elapsed_time": "8:05:41", "remaining_time": "0:11:55", "throughput": 2611.2, "total_tokens": 76093824} +{"current_steps": 131065, "total_steps": 134280, "loss": 0.8118, "lr": 5.238807547458146e-05, "epoch": 19.52114983616324, "percentage": 97.61, "elapsed_time": "8:05:42", "remaining_time": "0:11:54", "throughput": 2611.2, "total_tokens": 76096736} +{"current_steps": 131070, "total_steps": 134280, "loss": 0.8319, "lr": 5.2225398380456033e-05, "epoch": 19.5218945487042, "percentage": 97.61, "elapsed_time": "8:05:43", "remaining_time": "0:11:53", "throughput": 2611.2, "total_tokens": 76099552} +{"current_steps": 131075, "total_steps": 134280, "loss": 0.8269, "lr": 5.2062973813789546e-05, "epoch": 19.52263926124516, "percentage": 97.61, "elapsed_time": "8:05:44", "remaining_time": "0:11:52", "throughput": 2611.21, "total_tokens": 76102336} +{"current_steps": 131080, "total_steps": 134280, "loss": 0.801, "lr": 5.190080177732648e-05, "epoch": 19.523383973786117, "percentage": 97.62, "elapsed_time": "8:05:45", "remaining_time": "0:11:51", "throughput": 2611.21, "total_tokens": 76105024} +{"current_steps": 131085, "total_steps": 134280, "loss": 0.7957, "lr": 5.17388822738063e-05, "epoch": 19.524128686327078, "percentage": 97.62, "elapsed_time": "8:05:46", "remaining_time": "0:11:50", "throughput": 2611.21, "total_tokens": 76107840} +{"current_steps": 131090, "total_steps": 134280, "loss": 0.8122, "lr": 5.157721530596515e-05, "epoch": 19.52487339886804, "percentage": 97.62, "elapsed_time": "8:05:47", "remaining_time": "0:11:49", "throughput": 2611.22, "total_tokens": 76110944} +{"current_steps": 131095, "total_steps": 134280, "loss": 0.7871, "lr": 5.1415800876534187e-05, "epoch": 19.525618111408996, "percentage": 97.63, "elapsed_time": "8:05:48", "remaining_time": "0:11:48", "throughput": 2611.23, "total_tokens": 76113824} +{"current_steps": 131100, "total_steps": 134280, "loss": 0.7989, "lr": 5.1254638988241227e-05, "epoch": 19.526362823949956, "percentage": 97.63, "elapsed_time": "8:05:49", "remaining_time": "0:11:47", "throughput": 2611.24, "total_tokens": 76117120} +{"current_steps": 131105, "total_steps": 134280, "loss": 0.7757, "lr": 5.109372964380742e-05, "epoch": 19.527107536490913, "percentage": 97.64, "elapsed_time": "8:05:50", "remaining_time": "0:11:45", "throughput": 2611.24, "total_tokens": 76119840} +{"current_steps": 131110, "total_steps": 134280, "loss": 0.7879, "lr": 5.093307284595061e-05, "epoch": 19.527852249031874, "percentage": 97.64, "elapsed_time": "8:05:51", "remaining_time": "0:11:44", "throughput": 2611.24, "total_tokens": 76122784} +{"current_steps": 131115, "total_steps": 134280, "loss": 0.7931, "lr": 5.0772668597386935e-05, "epoch": 19.528596961572834, "percentage": 97.64, "elapsed_time": "8:05:52", "remaining_time": "0:11:43", "throughput": 2611.24, "total_tokens": 76125408} +{"current_steps": 131120, "total_steps": 134280, "loss": 0.7885, "lr": 5.061251690082424e-05, "epoch": 19.52934167411379, "percentage": 97.65, "elapsed_time": "8:05:53", "remaining_time": "0:11:42", "throughput": 2611.25, "total_tokens": 76128384} +{"current_steps": 131125, "total_steps": 134280, "loss": 0.7954, "lr": 5.045261775897036e-05, "epoch": 19.53008638665475, "percentage": 97.65, "elapsed_time": "8:05:55", "remaining_time": "0:11:41", "throughput": 2611.25, "total_tokens": 76131200} +{"current_steps": 131130, "total_steps": 134280, "loss": 0.8041, "lr": 5.02929711745248e-05, "epoch": 19.530831099195712, "percentage": 97.65, "elapsed_time": "8:05:56", "remaining_time": "0:11:40", "throughput": 2611.26, "total_tokens": 76134112} +{"current_steps": 131135, "total_steps": 134280, "loss": 0.7929, "lr": 5.013357715018707e-05, "epoch": 19.53157581173667, "percentage": 97.66, "elapsed_time": "8:05:57", "remaining_time": "0:11:39", "throughput": 2611.27, "total_tokens": 76137248} +{"current_steps": 131140, "total_steps": 134280, "loss": 0.8057, "lr": 4.997443568864668e-05, "epoch": 19.53232052427763, "percentage": 97.66, "elapsed_time": "8:05:58", "remaining_time": "0:11:38", "throughput": 2611.27, "total_tokens": 76140224} +{"current_steps": 131145, "total_steps": 134280, "loss": 0.791, "lr": 4.981554679259315e-05, "epoch": 19.533065236818587, "percentage": 97.67, "elapsed_time": "8:05:59", "remaining_time": "0:11:37", "throughput": 2611.28, "total_tokens": 76143264} +{"current_steps": 131150, "total_steps": 134280, "loss": 0.7956, "lr": 4.9656910464712656e-05, "epoch": 19.533809949359547, "percentage": 97.67, "elapsed_time": "8:06:00", "remaining_time": "0:11:35", "throughput": 2611.29, "total_tokens": 76146368} +{"current_steps": 131155, "total_steps": 134280, "loss": 0.7954, "lr": 4.949852670768306e-05, "epoch": 19.534554661900508, "percentage": 97.67, "elapsed_time": "8:06:01", "remaining_time": "0:11:34", "throughput": 2611.29, "total_tokens": 76149024} +{"current_steps": 131160, "total_steps": 134280, "loss": 0.8006, "lr": 4.9340395524180565e-05, "epoch": 19.535299374441465, "percentage": 97.68, "elapsed_time": "8:06:02", "remaining_time": "0:11:33", "throughput": 2611.29, "total_tokens": 76151904} +{"current_steps": 131165, "total_steps": 134280, "loss": 0.7687, "lr": 4.918251691687636e-05, "epoch": 19.536044086982425, "percentage": 97.68, "elapsed_time": "8:06:03", "remaining_time": "0:11:32", "throughput": 2611.29, "total_tokens": 76154592} +{"current_steps": 131170, "total_steps": 134280, "loss": 0.8052, "lr": 4.9024890888439975e-05, "epoch": 19.536788799523386, "percentage": 97.68, "elapsed_time": "8:06:04", "remaining_time": "0:11:31", "throughput": 2611.3, "total_tokens": 76157440} +{"current_steps": 131175, "total_steps": 134280, "loss": 0.7823, "lr": 4.8867517441530946e-05, "epoch": 19.537533512064343, "percentage": 97.69, "elapsed_time": "8:06:05", "remaining_time": "0:11:30", "throughput": 2611.3, "total_tokens": 76160192} +{"current_steps": 131180, "total_steps": 134280, "loss": 0.798, "lr": 4.871039657881049e-05, "epoch": 19.538278224605303, "percentage": 97.69, "elapsed_time": "8:06:06", "remaining_time": "0:11:29", "throughput": 2611.31, "total_tokens": 76163264} +{"current_steps": 131185, "total_steps": 134280, "loss": 0.7939, "lr": 4.8553528302931466e-05, "epoch": 19.53902293714626, "percentage": 97.7, "elapsed_time": "8:06:07", "remaining_time": "0:11:28", "throughput": 2611.31, "total_tokens": 76166240} +{"current_steps": 131190, "total_steps": 134280, "loss": 0.7969, "lr": 4.839691261654511e-05, "epoch": 19.53976764968722, "percentage": 97.7, "elapsed_time": "8:06:08", "remaining_time": "0:11:27", "throughput": 2611.31, "total_tokens": 76168992} +{"current_steps": 131195, "total_steps": 134280, "loss": 0.7869, "lr": 4.8240549522295946e-05, "epoch": 19.54051236222818, "percentage": 97.7, "elapsed_time": "8:06:09", "remaining_time": "0:11:25", "throughput": 2611.32, "total_tokens": 76172000} +{"current_steps": 131200, "total_steps": 134280, "loss": 0.8034, "lr": 4.8084439022826884e-05, "epoch": 19.54125707476914, "percentage": 97.71, "elapsed_time": "8:06:10", "remaining_time": "0:11:24", "throughput": 2611.33, "total_tokens": 76174880} +{"current_steps": 131205, "total_steps": 134280, "loss": 0.8132, "lr": 4.79285811207758e-05, "epoch": 19.5420017873101, "percentage": 97.71, "elapsed_time": "8:06:12", "remaining_time": "0:11:23", "throughput": 2611.33, "total_tokens": 76177856} +{"current_steps": 131210, "total_steps": 134280, "loss": 0.7972, "lr": 4.777297581877393e-05, "epoch": 19.542746499851056, "percentage": 97.71, "elapsed_time": "8:06:13", "remaining_time": "0:11:22", "throughput": 2611.34, "total_tokens": 76180896} +{"current_steps": 131215, "total_steps": 134280, "loss": 0.7834, "lr": 4.7617623119450835e-05, "epoch": 19.543491212392016, "percentage": 97.72, "elapsed_time": "8:06:14", "remaining_time": "0:11:21", "throughput": 2611.34, "total_tokens": 76183872} +{"current_steps": 131220, "total_steps": 134280, "loss": 0.7926, "lr": 4.746252302543108e-05, "epoch": 19.544235924932977, "percentage": 97.72, "elapsed_time": "8:06:15", "remaining_time": "0:11:20", "throughput": 2611.35, "total_tokens": 76186656} +{"current_steps": 131225, "total_steps": 134280, "loss": 0.804, "lr": 4.7307675539334236e-05, "epoch": 19.544980637473934, "percentage": 97.72, "elapsed_time": "8:06:16", "remaining_time": "0:11:19", "throughput": 2611.35, "total_tokens": 76189568} +{"current_steps": 131230, "total_steps": 134280, "loss": 0.786, "lr": 4.715308066377821e-05, "epoch": 19.545725350014894, "percentage": 97.73, "elapsed_time": "8:06:17", "remaining_time": "0:11:18", "throughput": 2611.35, "total_tokens": 76192320} +{"current_steps": 131235, "total_steps": 134280, "loss": 0.7877, "lr": 4.6998738401372585e-05, "epoch": 19.546470062555855, "percentage": 97.73, "elapsed_time": "8:06:18", "remaining_time": "0:11:17", "throughput": 2611.35, "total_tokens": 76194880} +{"current_steps": 131240, "total_steps": 134280, "loss": 0.7968, "lr": 4.6844648754726936e-05, "epoch": 19.547214775096812, "percentage": 97.74, "elapsed_time": "8:06:19", "remaining_time": "0:11:15", "throughput": 2611.35, "total_tokens": 76197696} +{"current_steps": 131245, "total_steps": 134280, "loss": 0.8083, "lr": 4.6690811726440847e-05, "epoch": 19.547959487637772, "percentage": 97.74, "elapsed_time": "8:06:20", "remaining_time": "0:11:14", "throughput": 2611.35, "total_tokens": 76200416} +{"current_steps": 131250, "total_steps": 134280, "loss": 0.7999, "lr": 4.653722731911724e-05, "epoch": 19.54870420017873, "percentage": 97.74, "elapsed_time": "8:06:21", "remaining_time": "0:11:13", "throughput": 2611.36, "total_tokens": 76203200} +{"current_steps": 131255, "total_steps": 134280, "loss": 0.7861, "lr": 4.638389553534905e-05, "epoch": 19.54944891271969, "percentage": 97.75, "elapsed_time": "8:06:22", "remaining_time": "0:11:12", "throughput": 2611.36, "total_tokens": 76205984} +{"current_steps": 131260, "total_steps": 134280, "loss": 0.8009, "lr": 4.623081637772752e-05, "epoch": 19.55019362526065, "percentage": 97.75, "elapsed_time": "8:06:23", "remaining_time": "0:11:11", "throughput": 2611.36, "total_tokens": 76208992} +{"current_steps": 131265, "total_steps": 134280, "loss": 0.8239, "lr": 4.607798984883726e-05, "epoch": 19.550938337801608, "percentage": 97.75, "elapsed_time": "8:06:24", "remaining_time": "0:11:10", "throughput": 2611.37, "total_tokens": 76211776} +{"current_steps": 131270, "total_steps": 134280, "loss": 0.7906, "lr": 4.5925415951261205e-05, "epoch": 19.551683050342568, "percentage": 97.76, "elapsed_time": "8:06:25", "remaining_time": "0:11:09", "throughput": 2611.37, "total_tokens": 76214688} +{"current_steps": 131275, "total_steps": 134280, "loss": 0.798, "lr": 4.577309468757729e-05, "epoch": 19.55242776288353, "percentage": 97.76, "elapsed_time": "8:06:26", "remaining_time": "0:11:08", "throughput": 2611.38, "total_tokens": 76217632} +{"current_steps": 131280, "total_steps": 134280, "loss": 0.7962, "lr": 4.562102606035678e-05, "epoch": 19.553172475424486, "percentage": 97.77, "elapsed_time": "8:06:27", "remaining_time": "0:11:06", "throughput": 2611.38, "total_tokens": 76220320} +{"current_steps": 131285, "total_steps": 134280, "loss": 0.8098, "lr": 4.54692100721693e-05, "epoch": 19.553917187965446, "percentage": 97.77, "elapsed_time": "8:06:28", "remaining_time": "0:11:05", "throughput": 2611.38, "total_tokens": 76223456} +{"current_steps": 131290, "total_steps": 134280, "loss": 0.7889, "lr": 4.5317646725581135e-05, "epoch": 19.554661900506403, "percentage": 97.77, "elapsed_time": "8:06:29", "remaining_time": "0:11:04", "throughput": 2611.38, "total_tokens": 76225984} +{"current_steps": 131295, "total_steps": 134280, "loss": 0.8008, "lr": 4.5166336023153564e-05, "epoch": 19.555406613047364, "percentage": 97.78, "elapsed_time": "8:06:30", "remaining_time": "0:11:03", "throughput": 2611.39, "total_tokens": 76228896} +{"current_steps": 131300, "total_steps": 134280, "loss": 0.7854, "lr": 4.5015277967439534e-05, "epoch": 19.556151325588324, "percentage": 97.78, "elapsed_time": "8:06:32", "remaining_time": "0:11:02", "throughput": 2611.38, "total_tokens": 76231488} +{"current_steps": 131305, "total_steps": 134280, "loss": 0.7928, "lr": 4.486447256099368e-05, "epoch": 19.55689603812928, "percentage": 97.78, "elapsed_time": "8:06:33", "remaining_time": "0:11:01", "throughput": 2611.39, "total_tokens": 76234560} +{"current_steps": 131310, "total_steps": 134280, "loss": 0.7985, "lr": 4.4713919806363966e-05, "epoch": 19.55764075067024, "percentage": 97.79, "elapsed_time": "8:06:34", "remaining_time": "0:11:00", "throughput": 2611.4, "total_tokens": 76237760} +{"current_steps": 131315, "total_steps": 134280, "loss": 0.7917, "lr": 4.456361970609002e-05, "epoch": 19.558385463211202, "percentage": 97.79, "elapsed_time": "8:06:35", "remaining_time": "0:10:59", "throughput": 2611.41, "total_tokens": 76240672} +{"current_steps": 131320, "total_steps": 134280, "loss": 0.7884, "lr": 4.4413572262714805e-05, "epoch": 19.55913017575216, "percentage": 97.8, "elapsed_time": "8:06:36", "remaining_time": "0:10:58", "throughput": 2611.41, "total_tokens": 76243616} +{"current_steps": 131325, "total_steps": 134280, "loss": 0.7969, "lr": 4.426377747877297e-05, "epoch": 19.55987488829312, "percentage": 97.8, "elapsed_time": "8:06:37", "remaining_time": "0:10:56", "throughput": 2611.42, "total_tokens": 76246720} +{"current_steps": 131330, "total_steps": 134280, "loss": 0.7839, "lr": 4.411423535679415e-05, "epoch": 19.560619600834077, "percentage": 97.8, "elapsed_time": "8:06:38", "remaining_time": "0:10:55", "throughput": 2611.43, "total_tokens": 76249664} +{"current_steps": 131335, "total_steps": 134280, "loss": 0.7891, "lr": 4.3964945899304665e-05, "epoch": 19.561364313375037, "percentage": 97.81, "elapsed_time": "8:06:39", "remaining_time": "0:10:54", "throughput": 2611.44, "total_tokens": 76252768} +{"current_steps": 131340, "total_steps": 134280, "loss": 0.7818, "lr": 4.3815909108825824e-05, "epoch": 19.562109025915998, "percentage": 97.81, "elapsed_time": "8:06:40", "remaining_time": "0:10:53", "throughput": 2611.44, "total_tokens": 76255552} +{"current_steps": 131345, "total_steps": 134280, "loss": 0.7851, "lr": 4.366712498787728e-05, "epoch": 19.562853738456955, "percentage": 97.81, "elapsed_time": "8:06:41", "remaining_time": "0:10:52", "throughput": 2611.45, "total_tokens": 76258560} +{"current_steps": 131350, "total_steps": 134280, "loss": 0.7849, "lr": 4.3518593538972026e-05, "epoch": 19.563598450997915, "percentage": 97.82, "elapsed_time": "8:06:42", "remaining_time": "0:10:51", "throughput": 2611.45, "total_tokens": 76261408} +{"current_steps": 131355, "total_steps": 134280, "loss": 0.8107, "lr": 4.3370314764618056e-05, "epoch": 19.564343163538872, "percentage": 97.82, "elapsed_time": "8:06:43", "remaining_time": "0:10:50", "throughput": 2611.46, "total_tokens": 76264576} +{"current_steps": 131360, "total_steps": 134280, "loss": 0.7983, "lr": 4.3222288667321695e-05, "epoch": 19.565087876079833, "percentage": 97.83, "elapsed_time": "8:06:44", "remaining_time": "0:10:49", "throughput": 2611.47, "total_tokens": 76267616} +{"current_steps": 131365, "total_steps": 134280, "loss": 0.8085, "lr": 4.307451524958428e-05, "epoch": 19.565832588620793, "percentage": 97.83, "elapsed_time": "8:06:45", "remaining_time": "0:10:48", "throughput": 2611.47, "total_tokens": 76270368} +{"current_steps": 131370, "total_steps": 134280, "loss": 0.8108, "lr": 4.2926994513900474e-05, "epoch": 19.56657730116175, "percentage": 97.83, "elapsed_time": "8:06:46", "remaining_time": "0:10:46", "throughput": 2611.47, "total_tokens": 76273216} +{"current_steps": 131375, "total_steps": 134280, "loss": 0.7927, "lr": 4.277972646276329e-05, "epoch": 19.56732201370271, "percentage": 97.84, "elapsed_time": "8:06:48", "remaining_time": "0:10:45", "throughput": 2611.48, "total_tokens": 76276064} +{"current_steps": 131380, "total_steps": 134280, "loss": 0.7903, "lr": 4.26327110986624e-05, "epoch": 19.56806672624367, "percentage": 97.84, "elapsed_time": "8:06:49", "remaining_time": "0:10:44", "throughput": 2611.47, "total_tokens": 76278688} +{"current_steps": 131385, "total_steps": 134280, "loss": 0.7922, "lr": 4.248594842407749e-05, "epoch": 19.56881143878463, "percentage": 97.84, "elapsed_time": "8:06:50", "remaining_time": "0:10:43", "throughput": 2611.47, "total_tokens": 76281344} +{"current_steps": 131390, "total_steps": 134280, "loss": 0.8094, "lr": 4.233943844149157e-05, "epoch": 19.56955615132559, "percentage": 97.85, "elapsed_time": "8:06:51", "remaining_time": "0:10:42", "throughput": 2611.48, "total_tokens": 76284544} +{"current_steps": 131395, "total_steps": 134280, "loss": 0.8092, "lr": 4.2193181153377666e-05, "epoch": 19.570300863866546, "percentage": 97.85, "elapsed_time": "8:06:52", "remaining_time": "0:10:41", "throughput": 2611.49, "total_tokens": 76287360} +{"current_steps": 131400, "total_steps": 134280, "loss": 0.7939, "lr": 4.2047176562208795e-05, "epoch": 19.571045576407506, "percentage": 97.86, "elapsed_time": "8:06:53", "remaining_time": "0:10:40", "throughput": 2611.49, "total_tokens": 76290144} +{"current_steps": 131405, "total_steps": 134280, "loss": 0.7869, "lr": 4.190142467044966e-05, "epoch": 19.571790288948467, "percentage": 97.86, "elapsed_time": "8:06:54", "remaining_time": "0:10:39", "throughput": 2611.49, "total_tokens": 76293056} +{"current_steps": 131410, "total_steps": 134280, "loss": 0.8099, "lr": 4.175592548056495e-05, "epoch": 19.572535001489424, "percentage": 97.86, "elapsed_time": "8:06:55", "remaining_time": "0:10:38", "throughput": 2611.5, "total_tokens": 76295936} +{"current_steps": 131415, "total_steps": 134280, "loss": 0.7868, "lr": 4.16106789950077e-05, "epoch": 19.573279714030384, "percentage": 97.87, "elapsed_time": "8:06:56", "remaining_time": "0:10:36", "throughput": 2611.5, "total_tokens": 76298592} +{"current_steps": 131420, "total_steps": 134280, "loss": 0.7867, "lr": 4.146568521623761e-05, "epoch": 19.574024426571345, "percentage": 97.87, "elapsed_time": "8:06:57", "remaining_time": "0:10:35", "throughput": 2611.5, "total_tokens": 76301408} +{"current_steps": 131425, "total_steps": 134280, "loss": 0.8055, "lr": 4.1320944146701065e-05, "epoch": 19.574769139112302, "percentage": 97.87, "elapsed_time": "8:06:58", "remaining_time": "0:10:34", "throughput": 2611.5, "total_tokens": 76304224} +{"current_steps": 131430, "total_steps": 134280, "loss": 0.7956, "lr": 4.117645578884277e-05, "epoch": 19.575513851653263, "percentage": 97.88, "elapsed_time": "8:06:59", "remaining_time": "0:10:33", "throughput": 2611.51, "total_tokens": 76307072} +{"current_steps": 131435, "total_steps": 134280, "loss": 0.7854, "lr": 4.103222014510577e-05, "epoch": 19.57625856419422, "percentage": 97.88, "elapsed_time": "8:07:00", "remaining_time": "0:10:32", "throughput": 2611.52, "total_tokens": 76310240} +{"current_steps": 131440, "total_steps": 134280, "loss": 0.8, "lr": 4.088823721792478e-05, "epoch": 19.57700327673518, "percentage": 97.89, "elapsed_time": "8:07:01", "remaining_time": "0:10:31", "throughput": 2611.52, "total_tokens": 76312992} +{"current_steps": 131445, "total_steps": 134280, "loss": 0.8077, "lr": 4.074450700973453e-05, "epoch": 19.57774798927614, "percentage": 97.89, "elapsed_time": "8:07:02", "remaining_time": "0:10:30", "throughput": 2611.53, "total_tokens": 76316032} +{"current_steps": 131450, "total_steps": 134280, "loss": 0.7957, "lr": 4.060102952296141e-05, "epoch": 19.578492701817098, "percentage": 97.89, "elapsed_time": "8:07:03", "remaining_time": "0:10:29", "throughput": 2611.53, "total_tokens": 76318976} +{"current_steps": 131455, "total_steps": 134280, "loss": 0.8013, "lr": 4.0457804760030136e-05, "epoch": 19.579237414358058, "percentage": 97.9, "elapsed_time": "8:07:04", "remaining_time": "0:10:28", "throughput": 2611.53, "total_tokens": 76321728} +{"current_steps": 131460, "total_steps": 134280, "loss": 0.7964, "lr": 4.031483272335878e-05, "epoch": 19.57998212689902, "percentage": 97.9, "elapsed_time": "8:07:05", "remaining_time": "0:10:26", "throughput": 2611.54, "total_tokens": 76324512} +{"current_steps": 131465, "total_steps": 134280, "loss": 0.7896, "lr": 4.017211341536542e-05, "epoch": 19.580726839439976, "percentage": 97.9, "elapsed_time": "8:07:07", "remaining_time": "0:10:25", "throughput": 2611.54, "total_tokens": 76327648} +{"current_steps": 131470, "total_steps": 134280, "loss": 0.7839, "lr": 4.0029646838459774e-05, "epoch": 19.581471551980936, "percentage": 97.91, "elapsed_time": "8:07:08", "remaining_time": "0:10:24", "throughput": 2611.55, "total_tokens": 76330336} +{"current_steps": 131475, "total_steps": 134280, "loss": 0.7937, "lr": 3.988743299504826e-05, "epoch": 19.582216264521893, "percentage": 97.91, "elapsed_time": "8:07:09", "remaining_time": "0:10:23", "throughput": 2611.55, "total_tokens": 76333088} +{"current_steps": 131480, "total_steps": 134280, "loss": 0.786, "lr": 3.9745471887533965e-05, "epoch": 19.582960977062854, "percentage": 97.91, "elapsed_time": "8:07:10", "remaining_time": "0:10:22", "throughput": 2611.56, "total_tokens": 76336288} +{"current_steps": 131485, "total_steps": 134280, "loss": 0.7866, "lr": 3.960376351831329e-05, "epoch": 19.583705689603814, "percentage": 97.92, "elapsed_time": "8:07:11", "remaining_time": "0:10:21", "throughput": 2611.56, "total_tokens": 76339008} +{"current_steps": 131490, "total_steps": 134280, "loss": 0.7968, "lr": 3.946230788978433e-05, "epoch": 19.58445040214477, "percentage": 97.92, "elapsed_time": "8:07:12", "remaining_time": "0:10:20", "throughput": 2611.57, "total_tokens": 76342080} +{"current_steps": 131495, "total_steps": 134280, "loss": 0.7966, "lr": 3.93211050043335e-05, "epoch": 19.58519511468573, "percentage": 97.93, "elapsed_time": "8:07:13", "remaining_time": "0:10:19", "throughput": 2611.57, "total_tokens": 76344800} +{"current_steps": 131500, "total_steps": 134280, "loss": 0.7986, "lr": 3.9180154864347225e-05, "epoch": 19.58593982722669, "percentage": 97.93, "elapsed_time": "8:07:14", "remaining_time": "0:10:18", "throughput": 2611.57, "total_tokens": 76347680} +{"current_steps": 131505, "total_steps": 134280, "loss": 0.8108, "lr": 3.9039457472206936e-05, "epoch": 19.58668453976765, "percentage": 97.93, "elapsed_time": "8:07:15", "remaining_time": "0:10:16", "throughput": 2611.58, "total_tokens": 76350624} +{"current_steps": 131510, "total_steps": 134280, "loss": 0.7849, "lr": 3.8899012830287405e-05, "epoch": 19.58742925230861, "percentage": 97.94, "elapsed_time": "8:07:16", "remaining_time": "0:10:15", "throughput": 2611.59, "total_tokens": 76353664} +{"current_steps": 131515, "total_steps": 134280, "loss": 0.7906, "lr": 3.875882094096505e-05, "epoch": 19.588173964849567, "percentage": 97.94, "elapsed_time": "8:07:17", "remaining_time": "0:10:14", "throughput": 2611.59, "total_tokens": 76356608} +{"current_steps": 131520, "total_steps": 134280, "loss": 0.7754, "lr": 3.8618881806606326e-05, "epoch": 19.588918677390527, "percentage": 97.94, "elapsed_time": "8:07:18", "remaining_time": "0:10:13", "throughput": 2611.59, "total_tokens": 76359328} +{"current_steps": 131525, "total_steps": 134280, "loss": 0.8184, "lr": 3.847919542957601e-05, "epoch": 19.589663389931488, "percentage": 97.95, "elapsed_time": "8:07:19", "remaining_time": "0:10:12", "throughput": 2611.59, "total_tokens": 76362144} +{"current_steps": 131530, "total_steps": 134280, "loss": 0.7985, "lr": 3.833976181223386e-05, "epoch": 19.590408102472445, "percentage": 97.95, "elapsed_time": "8:07:20", "remaining_time": "0:10:11", "throughput": 2611.61, "total_tokens": 76365408} +{"current_steps": 131535, "total_steps": 134280, "loss": 0.788, "lr": 3.820058095693468e-05, "epoch": 19.591152815013405, "percentage": 97.96, "elapsed_time": "8:07:21", "remaining_time": "0:10:10", "throughput": 2611.61, "total_tokens": 76368128} +{"current_steps": 131540, "total_steps": 134280, "loss": 0.8037, "lr": 3.8061652866029915e-05, "epoch": 19.591897527554362, "percentage": 97.96, "elapsed_time": "8:07:22", "remaining_time": "0:10:09", "throughput": 2611.62, "total_tokens": 76371200} +{"current_steps": 131545, "total_steps": 134280, "loss": 0.7891, "lr": 3.792297754186602e-05, "epoch": 19.592642240095323, "percentage": 97.96, "elapsed_time": "8:07:23", "remaining_time": "0:10:08", "throughput": 2611.61, "total_tokens": 76373856} +{"current_steps": 131550, "total_steps": 134280, "loss": 0.8232, "lr": 3.7784554986787785e-05, "epoch": 19.593386952636283, "percentage": 97.97, "elapsed_time": "8:07:24", "remaining_time": "0:10:06", "throughput": 2611.62, "total_tokens": 76376736} +{"current_steps": 131555, "total_steps": 134280, "loss": 0.7996, "lr": 3.764638520313168e-05, "epoch": 19.59413166517724, "percentage": 97.97, "elapsed_time": "8:07:26", "remaining_time": "0:10:05", "throughput": 2611.62, "total_tokens": 76379744} +{"current_steps": 131560, "total_steps": 134280, "loss": 0.791, "lr": 3.750846819323417e-05, "epoch": 19.5948763777182, "percentage": 97.97, "elapsed_time": "8:07:27", "remaining_time": "0:10:04", "throughput": 2611.62, "total_tokens": 76382336} +{"current_steps": 131565, "total_steps": 134280, "loss": 0.7846, "lr": 3.737080395942172e-05, "epoch": 19.59562109025916, "percentage": 97.98, "elapsed_time": "8:07:28", "remaining_time": "0:10:03", "throughput": 2611.63, "total_tokens": 76385216} +{"current_steps": 131570, "total_steps": 134280, "loss": 0.7926, "lr": 3.723339250402413e-05, "epoch": 19.59636580280012, "percentage": 97.98, "elapsed_time": "8:07:29", "remaining_time": "0:10:02", "throughput": 2611.63, "total_tokens": 76387968} +{"current_steps": 131575, "total_steps": 134280, "loss": 0.7984, "lr": 3.709623382936122e-05, "epoch": 19.59711051534108, "percentage": 97.99, "elapsed_time": "8:07:30", "remaining_time": "0:10:01", "throughput": 2611.63, "total_tokens": 76390816} +{"current_steps": 131580, "total_steps": 134280, "loss": 0.7809, "lr": 3.695932793774781e-05, "epoch": 19.597855227882036, "percentage": 97.99, "elapsed_time": "8:07:31", "remaining_time": "0:10:00", "throughput": 2611.64, "total_tokens": 76393696} +{"current_steps": 131585, "total_steps": 134280, "loss": 0.7935, "lr": 3.682267483150037e-05, "epoch": 19.598599940422996, "percentage": 97.99, "elapsed_time": "8:07:32", "remaining_time": "0:09:59", "throughput": 2611.64, "total_tokens": 76396544} +{"current_steps": 131590, "total_steps": 134280, "loss": 0.8054, "lr": 3.6686274512925386e-05, "epoch": 19.599344652963957, "percentage": 98.0, "elapsed_time": "8:07:33", "remaining_time": "0:09:58", "throughput": 2611.65, "total_tokens": 76399456} +{"current_steps": 131595, "total_steps": 134280, "loss": 0.8127, "lr": 3.655012698432769e-05, "epoch": 19.600089365504914, "percentage": 98.0, "elapsed_time": "8:07:34", "remaining_time": "0:09:56", "throughput": 2611.65, "total_tokens": 76402176} +{"current_steps": 131600, "total_steps": 134280, "loss": 0.7859, "lr": 3.641423224800877e-05, "epoch": 19.600834078045875, "percentage": 98.0, "elapsed_time": "8:07:35", "remaining_time": "0:09:55", "throughput": 2611.65, "total_tokens": 76404992} +{"current_steps": 131605, "total_steps": 134280, "loss": 0.804, "lr": 3.627859030626179e-05, "epoch": 19.601578790586835, "percentage": 98.01, "elapsed_time": "8:07:36", "remaining_time": "0:09:54", "throughput": 2611.66, "total_tokens": 76407936} +{"current_steps": 131610, "total_steps": 134280, "loss": 0.7947, "lr": 3.614320116137992e-05, "epoch": 19.602323503127792, "percentage": 98.01, "elapsed_time": "8:07:37", "remaining_time": "0:09:53", "throughput": 2611.65, "total_tokens": 76410528} +{"current_steps": 131615, "total_steps": 134280, "loss": 0.8407, "lr": 3.6008064815649665e-05, "epoch": 19.603068215668753, "percentage": 98.02, "elapsed_time": "8:07:38", "remaining_time": "0:09:52", "throughput": 2611.65, "total_tokens": 76413056} +{"current_steps": 131620, "total_steps": 134280, "loss": 0.8119, "lr": 3.587318127135419e-05, "epoch": 19.60381292820971, "percentage": 98.02, "elapsed_time": "8:07:39", "remaining_time": "0:09:51", "throughput": 2611.65, "total_tokens": 76415776} +{"current_steps": 131625, "total_steps": 134280, "loss": 0.8131, "lr": 3.573855053077335e-05, "epoch": 19.60455764075067, "percentage": 98.02, "elapsed_time": "8:07:40", "remaining_time": "0:09:50", "throughput": 2611.66, "total_tokens": 76418784} +{"current_steps": 131630, "total_steps": 134280, "loss": 0.7986, "lr": 3.5604172596180315e-05, "epoch": 19.60530235329163, "percentage": 98.03, "elapsed_time": "8:07:41", "remaining_time": "0:09:49", "throughput": 2611.67, "total_tokens": 76421888} +{"current_steps": 131635, "total_steps": 134280, "loss": 0.7951, "lr": 3.547004746984495e-05, "epoch": 19.606047065832588, "percentage": 98.03, "elapsed_time": "8:07:42", "remaining_time": "0:09:47", "throughput": 2611.67, "total_tokens": 76424768} +{"current_steps": 131640, "total_steps": 134280, "loss": 0.7853, "lr": 3.533617515403542e-05, "epoch": 19.606791778373548, "percentage": 98.03, "elapsed_time": "8:07:43", "remaining_time": "0:09:46", "throughput": 2611.68, "total_tokens": 76427744} +{"current_steps": 131645, "total_steps": 134280, "loss": 0.7903, "lr": 3.520255565100994e-05, "epoch": 19.60753649091451, "percentage": 98.04, "elapsed_time": "8:07:44", "remaining_time": "0:09:45", "throughput": 2611.68, "total_tokens": 76430496} +{"current_steps": 131650, "total_steps": 134280, "loss": 0.8029, "lr": 3.506918896302835e-05, "epoch": 19.608281203455466, "percentage": 98.04, "elapsed_time": "8:07:45", "remaining_time": "0:09:44", "throughput": 2611.69, "total_tokens": 76433440} +{"current_steps": 131655, "total_steps": 134280, "loss": 0.7863, "lr": 3.493607509234386e-05, "epoch": 19.609025915996426, "percentage": 98.05, "elapsed_time": "8:07:47", "remaining_time": "0:09:43", "throughput": 2611.7, "total_tokens": 76436576} +{"current_steps": 131660, "total_steps": 134280, "loss": 0.7927, "lr": 3.4803214041204674e-05, "epoch": 19.609770628537383, "percentage": 98.05, "elapsed_time": "8:07:48", "remaining_time": "0:09:42", "throughput": 2611.7, "total_tokens": 76439488} +{"current_steps": 131665, "total_steps": 134280, "loss": 0.7802, "lr": 3.4670605811855655e-05, "epoch": 19.610515341078344, "percentage": 98.05, "elapsed_time": "8:07:49", "remaining_time": "0:09:41", "throughput": 2611.71, "total_tokens": 76442464} +{"current_steps": 131670, "total_steps": 134280, "loss": 0.8119, "lr": 3.453825040653502e-05, "epoch": 19.611260053619304, "percentage": 98.06, "elapsed_time": "8:07:50", "remaining_time": "0:09:40", "throughput": 2611.72, "total_tokens": 76445664} +{"current_steps": 131675, "total_steps": 134280, "loss": 0.8031, "lr": 3.440614782748097e-05, "epoch": 19.61200476616026, "percentage": 98.06, "elapsed_time": "8:07:51", "remaining_time": "0:09:39", "throughput": 2611.72, "total_tokens": 76448352} +{"current_steps": 131680, "total_steps": 134280, "loss": 0.7914, "lr": 3.427429807692506e-05, "epoch": 19.61274947870122, "percentage": 98.06, "elapsed_time": "8:07:52", "remaining_time": "0:09:37", "throughput": 2611.72, "total_tokens": 76451200} +{"current_steps": 131685, "total_steps": 134280, "loss": 0.7966, "lr": 3.414270115709383e-05, "epoch": 19.613494191242182, "percentage": 98.07, "elapsed_time": "8:07:53", "remaining_time": "0:09:36", "throughput": 2611.73, "total_tokens": 76454240} +{"current_steps": 131690, "total_steps": 134280, "loss": 0.8088, "lr": 3.401135707021219e-05, "epoch": 19.61423890378314, "percentage": 98.07, "elapsed_time": "8:07:54", "remaining_time": "0:09:35", "throughput": 2611.73, "total_tokens": 76456800} +{"current_steps": 131695, "total_steps": 134280, "loss": 0.7885, "lr": 3.388026581849668e-05, "epoch": 19.6149836163241, "percentage": 98.07, "elapsed_time": "8:07:55", "remaining_time": "0:09:34", "throughput": 2611.73, "total_tokens": 76459808} +{"current_steps": 131700, "total_steps": 134280, "loss": 0.7992, "lr": 3.3749427404163864e-05, "epoch": 19.615728328865057, "percentage": 98.08, "elapsed_time": "8:07:56", "remaining_time": "0:09:33", "throughput": 2611.75, "total_tokens": 76463168} +{"current_steps": 131705, "total_steps": 134280, "loss": 0.8231, "lr": 3.361884182942365e-05, "epoch": 19.616473041406017, "percentage": 98.08, "elapsed_time": "8:07:57", "remaining_time": "0:09:32", "throughput": 2611.76, "total_tokens": 76466144} +{"current_steps": 131710, "total_steps": 134280, "loss": 0.7858, "lr": 3.348850909648093e-05, "epoch": 19.617217753946978, "percentage": 98.09, "elapsed_time": "8:07:58", "remaining_time": "0:09:31", "throughput": 2611.77, "total_tokens": 76469280} +{"current_steps": 131715, "total_steps": 134280, "loss": 0.7995, "lr": 3.335842920754062e-05, "epoch": 19.617962466487935, "percentage": 98.09, "elapsed_time": "8:07:59", "remaining_time": "0:09:30", "throughput": 2611.77, "total_tokens": 76471968} +{"current_steps": 131720, "total_steps": 134280, "loss": 0.7811, "lr": 3.3228602164795946e-05, "epoch": 19.618707179028895, "percentage": 98.09, "elapsed_time": "8:08:00", "remaining_time": "0:09:29", "throughput": 2611.77, "total_tokens": 76474944} +{"current_steps": 131725, "total_steps": 134280, "loss": 0.8109, "lr": 3.30990279704435e-05, "epoch": 19.619451891569852, "percentage": 98.1, "elapsed_time": "8:08:01", "remaining_time": "0:09:27", "throughput": 2611.78, "total_tokens": 76477888} +{"current_steps": 131730, "total_steps": 134280, "loss": 0.8139, "lr": 3.296970662667153e-05, "epoch": 19.620196604110813, "percentage": 98.1, "elapsed_time": "8:08:02", "remaining_time": "0:09:26", "throughput": 2611.78, "total_tokens": 76480672} +{"current_steps": 131735, "total_steps": 134280, "loss": 0.7852, "lr": 3.284063813566495e-05, "epoch": 19.620941316651773, "percentage": 98.1, "elapsed_time": "8:08:04", "remaining_time": "0:09:25", "throughput": 2611.79, "total_tokens": 76483552} +{"current_steps": 131740, "total_steps": 134280, "loss": 0.8014, "lr": 3.271182249960203e-05, "epoch": 19.62168602919273, "percentage": 98.11, "elapsed_time": "8:08:05", "remaining_time": "0:09:24", "throughput": 2611.79, "total_tokens": 76486432} +{"current_steps": 131745, "total_steps": 134280, "loss": 0.8098, "lr": 3.258325972066267e-05, "epoch": 19.62243074173369, "percentage": 98.11, "elapsed_time": "8:08:06", "remaining_time": "0:09:23", "throughput": 2611.8, "total_tokens": 76489504} +{"current_steps": 131750, "total_steps": 134280, "loss": 0.7826, "lr": 3.245494980101515e-05, "epoch": 19.62317545427465, "percentage": 98.12, "elapsed_time": "8:08:07", "remaining_time": "0:09:22", "throughput": 2611.8, "total_tokens": 76492128} +{"current_steps": 131755, "total_steps": 134280, "loss": 0.8096, "lr": 3.232689274283107e-05, "epoch": 19.62392016681561, "percentage": 98.12, "elapsed_time": "8:08:08", "remaining_time": "0:09:21", "throughput": 2611.8, "total_tokens": 76494816} +{"current_steps": 131760, "total_steps": 134280, "loss": 0.8123, "lr": 3.219908854827036e-05, "epoch": 19.62466487935657, "percentage": 98.12, "elapsed_time": "8:08:09", "remaining_time": "0:09:20", "throughput": 2611.81, "total_tokens": 76497888} +{"current_steps": 131765, "total_steps": 134280, "loss": 0.7923, "lr": 3.207153721949296e-05, "epoch": 19.625409591897526, "percentage": 98.13, "elapsed_time": "8:08:10", "remaining_time": "0:09:19", "throughput": 2611.81, "total_tokens": 76500960} +{"current_steps": 131770, "total_steps": 134280, "loss": 0.7903, "lr": 3.194423875865548e-05, "epoch": 19.626154304438487, "percentage": 98.13, "elapsed_time": "8:08:11", "remaining_time": "0:09:17", "throughput": 2611.82, "total_tokens": 76503808} +{"current_steps": 131775, "total_steps": 134280, "loss": 0.792, "lr": 3.181719316790621e-05, "epoch": 19.626899016979447, "percentage": 98.13, "elapsed_time": "8:08:12", "remaining_time": "0:09:16", "throughput": 2611.83, "total_tokens": 76507008} +{"current_steps": 131780, "total_steps": 134280, "loss": 0.8063, "lr": 3.1690400449393416e-05, "epoch": 19.627643729520404, "percentage": 98.14, "elapsed_time": "8:08:13", "remaining_time": "0:09:15", "throughput": 2611.83, "total_tokens": 76510112} +{"current_steps": 131785, "total_steps": 134280, "loss": 0.8045, "lr": 3.1563860605257064e-05, "epoch": 19.628388442061365, "percentage": 98.14, "elapsed_time": "8:08:14", "remaining_time": "0:09:14", "throughput": 2611.84, "total_tokens": 76513312} +{"current_steps": 131790, "total_steps": 134280, "loss": 0.8, "lr": 3.1437573637637104e-05, "epoch": 19.629133154602325, "percentage": 98.15, "elapsed_time": "8:08:15", "remaining_time": "0:09:13", "throughput": 2611.85, "total_tokens": 76516096} +{"current_steps": 131795, "total_steps": 134280, "loss": 0.8193, "lr": 3.1311539548665165e-05, "epoch": 19.629877867143282, "percentage": 98.15, "elapsed_time": "8:08:16", "remaining_time": "0:09:12", "throughput": 2611.85, "total_tokens": 76519008} +{"current_steps": 131800, "total_steps": 134280, "loss": 0.796, "lr": 3.1185758340472876e-05, "epoch": 19.630622579684243, "percentage": 98.15, "elapsed_time": "8:08:17", "remaining_time": "0:09:11", "throughput": 2611.85, "total_tokens": 76521536} +{"current_steps": 131805, "total_steps": 134280, "loss": 0.8027, "lr": 3.106023001518188e-05, "epoch": 19.6313672922252, "percentage": 98.16, "elapsed_time": "8:08:18", "remaining_time": "0:09:10", "throughput": 2611.85, "total_tokens": 76524352} +{"current_steps": 131810, "total_steps": 134280, "loss": 0.7771, "lr": 3.093495457491546e-05, "epoch": 19.63211200476616, "percentage": 98.16, "elapsed_time": "8:08:19", "remaining_time": "0:09:09", "throughput": 2611.86, "total_tokens": 76527232} +{"current_steps": 131815, "total_steps": 134280, "loss": 0.7982, "lr": 3.080993202178861e-05, "epoch": 19.63285671730712, "percentage": 98.16, "elapsed_time": "8:08:21", "remaining_time": "0:09:07", "throughput": 2611.86, "total_tokens": 76530208} +{"current_steps": 131820, "total_steps": 134280, "loss": 0.7977, "lr": 3.0685162357912964e-05, "epoch": 19.633601429848078, "percentage": 98.17, "elapsed_time": "8:08:22", "remaining_time": "0:09:06", "throughput": 2611.87, "total_tokens": 76533056} +{"current_steps": 131825, "total_steps": 134280, "loss": 0.7866, "lr": 3.056064558539851e-05, "epoch": 19.634346142389038, "percentage": 98.17, "elapsed_time": "8:08:23", "remaining_time": "0:09:05", "throughput": 2611.87, "total_tokens": 76536000} +{"current_steps": 131830, "total_steps": 134280, "loss": 0.786, "lr": 3.0436381706348547e-05, "epoch": 19.63509085493, "percentage": 98.18, "elapsed_time": "8:08:24", "remaining_time": "0:09:04", "throughput": 2611.87, "total_tokens": 76538720} +{"current_steps": 131835, "total_steps": 134280, "loss": 0.8057, "lr": 3.031237072285975e-05, "epoch": 19.635835567470956, "percentage": 98.18, "elapsed_time": "8:08:25", "remaining_time": "0:09:03", "throughput": 2611.88, "total_tokens": 76541920} +{"current_steps": 131840, "total_steps": 134280, "loss": 0.8175, "lr": 3.018861263703043e-05, "epoch": 19.636580280011916, "percentage": 98.18, "elapsed_time": "8:08:26", "remaining_time": "0:09:02", "throughput": 2611.89, "total_tokens": 76544992} +{"current_steps": 131845, "total_steps": 134280, "loss": 0.7949, "lr": 3.0065107450948923e-05, "epoch": 19.637324992552873, "percentage": 98.19, "elapsed_time": "8:08:27", "remaining_time": "0:09:01", "throughput": 2611.89, "total_tokens": 76547808} +{"current_steps": 131850, "total_steps": 134280, "loss": 0.8091, "lr": 2.9941855166703557e-05, "epoch": 19.638069705093834, "percentage": 98.19, "elapsed_time": "8:08:28", "remaining_time": "0:09:00", "throughput": 2611.9, "total_tokens": 76550880} +{"current_steps": 131855, "total_steps": 134280, "loss": 0.7755, "lr": 2.981885578637433e-05, "epoch": 19.638814417634794, "percentage": 98.19, "elapsed_time": "8:08:29", "remaining_time": "0:08:59", "throughput": 2611.9, "total_tokens": 76553664} +{"current_steps": 131860, "total_steps": 134280, "loss": 0.779, "lr": 2.9696109312041252e-05, "epoch": 19.63955913017575, "percentage": 98.2, "elapsed_time": "8:08:30", "remaining_time": "0:08:57", "throughput": 2611.91, "total_tokens": 76556512} +{"current_steps": 131865, "total_steps": 134280, "loss": 0.7892, "lr": 2.957361574577766e-05, "epoch": 19.640303842716712, "percentage": 98.2, "elapsed_time": "8:08:31", "remaining_time": "0:08:56", "throughput": 2611.91, "total_tokens": 76559264} +{"current_steps": 131870, "total_steps": 134280, "loss": 0.8174, "lr": 2.9451375089651897e-05, "epoch": 19.64104855525767, "percentage": 98.21, "elapsed_time": "8:08:32", "remaining_time": "0:08:55", "throughput": 2611.92, "total_tokens": 76562272} +{"current_steps": 131875, "total_steps": 134280, "loss": 0.7927, "lr": 2.9329387345730648e-05, "epoch": 19.64179326779863, "percentage": 98.21, "elapsed_time": "8:08:33", "remaining_time": "0:08:54", "throughput": 2611.92, "total_tokens": 76565056} +{"current_steps": 131880, "total_steps": 134280, "loss": 0.8041, "lr": 2.920765251607227e-05, "epoch": 19.64253798033959, "percentage": 98.21, "elapsed_time": "8:08:34", "remaining_time": "0:08:53", "throughput": 2611.92, "total_tokens": 76567776} +{"current_steps": 131885, "total_steps": 134280, "loss": 0.7813, "lr": 2.908617060273677e-05, "epoch": 19.643282692880547, "percentage": 98.22, "elapsed_time": "8:08:35", "remaining_time": "0:08:52", "throughput": 2611.92, "total_tokens": 76570464} +{"current_steps": 131890, "total_steps": 134280, "loss": 0.781, "lr": 2.8964941607774187e-05, "epoch": 19.644027405421507, "percentage": 98.22, "elapsed_time": "8:08:36", "remaining_time": "0:08:51", "throughput": 2611.92, "total_tokens": 76573088} +{"current_steps": 131895, "total_steps": 134280, "loss": 0.7948, "lr": 2.8843965533231206e-05, "epoch": 19.644772117962468, "percentage": 98.22, "elapsed_time": "8:08:37", "remaining_time": "0:08:50", "throughput": 2611.93, "total_tokens": 76576128} +{"current_steps": 131900, "total_steps": 134280, "loss": 0.8216, "lr": 2.8723242381156198e-05, "epoch": 19.645516830503425, "percentage": 98.23, "elapsed_time": "8:08:38", "remaining_time": "0:08:49", "throughput": 2611.93, "total_tokens": 76578976} +{"current_steps": 131905, "total_steps": 134280, "loss": 0.7744, "lr": 2.8602772153584197e-05, "epoch": 19.646261543044385, "percentage": 98.23, "elapsed_time": "8:08:39", "remaining_time": "0:08:47", "throughput": 2611.93, "total_tokens": 76581696} +{"current_steps": 131910, "total_steps": 134280, "loss": 0.7921, "lr": 2.848255485255191e-05, "epoch": 19.647006255585342, "percentage": 98.24, "elapsed_time": "8:08:41", "remaining_time": "0:08:46", "throughput": 2611.94, "total_tokens": 76584704} +{"current_steps": 131915, "total_steps": 134280, "loss": 0.7968, "lr": 2.836259048009271e-05, "epoch": 19.647750968126303, "percentage": 98.24, "elapsed_time": "8:08:42", "remaining_time": "0:08:45", "throughput": 2611.95, "total_tokens": 76587872} +{"current_steps": 131920, "total_steps": 134280, "loss": 0.7907, "lr": 2.8242879038228307e-05, "epoch": 19.648495680667263, "percentage": 98.24, "elapsed_time": "8:08:43", "remaining_time": "0:08:44", "throughput": 2611.95, "total_tokens": 76590784} +{"current_steps": 131925, "total_steps": 134280, "loss": 0.785, "lr": 2.812342052898542e-05, "epoch": 19.64924039320822, "percentage": 98.25, "elapsed_time": "8:08:44", "remaining_time": "0:08:43", "throughput": 2611.95, "total_tokens": 76593632} +{"current_steps": 131930, "total_steps": 134280, "loss": 0.7892, "lr": 2.8004214954380767e-05, "epoch": 19.64998510574918, "percentage": 98.25, "elapsed_time": "8:08:45", "remaining_time": "0:08:42", "throughput": 2611.96, "total_tokens": 76596416} +{"current_steps": 131935, "total_steps": 134280, "loss": 0.8034, "lr": 2.788526231642774e-05, "epoch": 19.65072981829014, "percentage": 98.25, "elapsed_time": "8:08:46", "remaining_time": "0:08:41", "throughput": 2611.97, "total_tokens": 76599648} +{"current_steps": 131940, "total_steps": 134280, "loss": 0.8077, "lr": 2.7766562617134726e-05, "epoch": 19.6514745308311, "percentage": 98.26, "elapsed_time": "8:08:47", "remaining_time": "0:08:40", "throughput": 2611.98, "total_tokens": 76602784} +{"current_steps": 131945, "total_steps": 134280, "loss": 0.7923, "lr": 2.7648115858510123e-05, "epoch": 19.65221924337206, "percentage": 98.26, "elapsed_time": "8:08:48", "remaining_time": "0:08:39", "throughput": 2611.98, "total_tokens": 76605536} +{"current_steps": 131950, "total_steps": 134280, "loss": 0.8042, "lr": 2.7529922042554e-05, "epoch": 19.652963955913016, "percentage": 98.26, "elapsed_time": "8:08:49", "remaining_time": "0:08:37", "throughput": 2611.98, "total_tokens": 76608256} +{"current_steps": 131955, "total_steps": 134280, "loss": 0.7981, "lr": 2.7411981171259758e-05, "epoch": 19.653708668453977, "percentage": 98.27, "elapsed_time": "8:08:50", "remaining_time": "0:08:36", "throughput": 2611.98, "total_tokens": 76611008} +{"current_steps": 131960, "total_steps": 134280, "loss": 0.8045, "lr": 2.72942932466258e-05, "epoch": 19.654453380994937, "percentage": 98.27, "elapsed_time": "8:08:51", "remaining_time": "0:08:35", "throughput": 2611.99, "total_tokens": 76613952} +{"current_steps": 131965, "total_steps": 134280, "loss": 0.7953, "lr": 2.717685827063554e-05, "epoch": 19.655198093535894, "percentage": 98.28, "elapsed_time": "8:08:52", "remaining_time": "0:08:34", "throughput": 2611.99, "total_tokens": 76616960} +{"current_steps": 131970, "total_steps": 134280, "loss": 0.7904, "lr": 2.7059676245274055e-05, "epoch": 19.655942806076855, "percentage": 98.28, "elapsed_time": "8:08:53", "remaining_time": "0:08:33", "throughput": 2612.0, "total_tokens": 76619936} +{"current_steps": 131975, "total_steps": 134280, "loss": 0.7934, "lr": 2.6942747172523095e-05, "epoch": 19.656687518617815, "percentage": 98.28, "elapsed_time": "8:08:54", "remaining_time": "0:08:32", "throughput": 2612.0, "total_tokens": 76622656} +{"current_steps": 131980, "total_steps": 134280, "loss": 0.7876, "lr": 2.6826071054354417e-05, "epoch": 19.657432231158772, "percentage": 98.29, "elapsed_time": "8:08:55", "remaining_time": "0:08:31", "throughput": 2612.01, "total_tokens": 76625536} +{"current_steps": 131985, "total_steps": 134280, "loss": 0.8014, "lr": 2.6709647892743105e-05, "epoch": 19.658176943699733, "percentage": 98.29, "elapsed_time": "8:08:56", "remaining_time": "0:08:30", "throughput": 2612.01, "total_tokens": 76628512} +{"current_steps": 131990, "total_steps": 134280, "loss": 0.8084, "lr": 2.6593477689654255e-05, "epoch": 19.65892165624069, "percentage": 98.29, "elapsed_time": "8:08:58", "remaining_time": "0:08:29", "throughput": 2612.02, "total_tokens": 76631456} +{"current_steps": 131995, "total_steps": 134280, "loss": 0.7869, "lr": 2.647756044704963e-05, "epoch": 19.65966636878165, "percentage": 98.3, "elapsed_time": "8:08:59", "remaining_time": "0:08:27", "throughput": 2612.02, "total_tokens": 76634304} +{"current_steps": 132000, "total_steps": 134280, "loss": 0.8025, "lr": 2.6361896166887664e-05, "epoch": 19.66041108132261, "percentage": 98.3, "elapsed_time": "8:09:00", "remaining_time": "0:08:26", "throughput": 2612.03, "total_tokens": 76637280} +{"current_steps": 132005, "total_steps": 134280, "loss": 0.7931, "lr": 2.6246484851123462e-05, "epoch": 19.661155793863568, "percentage": 98.31, "elapsed_time": "8:09:01", "remaining_time": "0:08:25", "throughput": 2612.03, "total_tokens": 76640160} +{"current_steps": 132010, "total_steps": 134280, "loss": 0.7942, "lr": 2.6131326501705464e-05, "epoch": 19.66190050640453, "percentage": 98.31, "elapsed_time": "8:09:02", "remaining_time": "0:08:24", "throughput": 2612.04, "total_tokens": 76643168} +{"current_steps": 132015, "total_steps": 134280, "loss": 0.8009, "lr": 2.601642112058211e-05, "epoch": 19.662645218945485, "percentage": 98.31, "elapsed_time": "8:09:03", "remaining_time": "0:08:23", "throughput": 2612.04, "total_tokens": 76645888} +{"current_steps": 132020, "total_steps": 134280, "loss": 0.8126, "lr": 2.5901768709690186e-05, "epoch": 19.663389931486446, "percentage": 98.32, "elapsed_time": "8:09:04", "remaining_time": "0:08:22", "throughput": 2612.05, "total_tokens": 76648896} +{"current_steps": 132025, "total_steps": 134280, "loss": 0.7998, "lr": 2.5787369270969806e-05, "epoch": 19.664134644027406, "percentage": 98.32, "elapsed_time": "8:09:05", "remaining_time": "0:08:21", "throughput": 2612.06, "total_tokens": 76652224} +{"current_steps": 132030, "total_steps": 134280, "loss": 0.8021, "lr": 2.5673222806352757e-05, "epoch": 19.664879356568363, "percentage": 98.32, "elapsed_time": "8:09:06", "remaining_time": "0:08:20", "throughput": 2612.06, "total_tokens": 76655008} +{"current_steps": 132035, "total_steps": 134280, "loss": 0.8162, "lr": 2.5559329317767497e-05, "epoch": 19.665624069109324, "percentage": 98.33, "elapsed_time": "8:09:07", "remaining_time": "0:08:18", "throughput": 2612.07, "total_tokens": 76657792} +{"current_steps": 132040, "total_steps": 134280, "loss": 0.8248, "lr": 2.544568880713749e-05, "epoch": 19.666368781650284, "percentage": 98.33, "elapsed_time": "8:09:08", "remaining_time": "0:08:17", "throughput": 2612.07, "total_tokens": 76660512} +{"current_steps": 132045, "total_steps": 134280, "loss": 0.8092, "lr": 2.533230127638286e-05, "epoch": 19.66711349419124, "percentage": 98.34, "elapsed_time": "8:09:09", "remaining_time": "0:08:16", "throughput": 2612.07, "total_tokens": 76663488} +{"current_steps": 132050, "total_steps": 134280, "loss": 0.8225, "lr": 2.5219166727420417e-05, "epoch": 19.667858206732202, "percentage": 98.34, "elapsed_time": "8:09:10", "remaining_time": "0:08:15", "throughput": 2612.07, "total_tokens": 76666144} +{"current_steps": 132055, "total_steps": 134280, "loss": 0.8013, "lr": 2.510628516216029e-05, "epoch": 19.66860291927316, "percentage": 98.34, "elapsed_time": "8:09:11", "remaining_time": "0:08:14", "throughput": 2612.07, "total_tokens": 76668864} +{"current_steps": 132060, "total_steps": 134280, "loss": 0.8133, "lr": 2.499365658250929e-05, "epoch": 19.66934763181412, "percentage": 98.35, "elapsed_time": "8:09:12", "remaining_time": "0:08:13", "throughput": 2612.08, "total_tokens": 76671936} +{"current_steps": 132065, "total_steps": 134280, "loss": 0.8022, "lr": 2.4881280990370902e-05, "epoch": 19.67009234435508, "percentage": 98.35, "elapsed_time": "8:09:13", "remaining_time": "0:08:12", "throughput": 2612.09, "total_tokens": 76674880} +{"current_steps": 132070, "total_steps": 134280, "loss": 0.7997, "lr": 2.476915838764193e-05, "epoch": 19.670837056896037, "percentage": 98.35, "elapsed_time": "8:09:14", "remaining_time": "0:08:11", "throughput": 2612.09, "total_tokens": 76677600} +{"current_steps": 132075, "total_steps": 134280, "loss": 0.8129, "lr": 2.46572887762192e-05, "epoch": 19.671581769436997, "percentage": 98.36, "elapsed_time": "8:09:16", "remaining_time": "0:08:10", "throughput": 2612.1, "total_tokens": 76680768} +{"current_steps": 132080, "total_steps": 134280, "loss": 0.8127, "lr": 2.4545672157991192e-05, "epoch": 19.672326481977958, "percentage": 98.36, "elapsed_time": "8:09:17", "remaining_time": "0:08:08", "throughput": 2612.09, "total_tokens": 76683424} +{"current_steps": 132085, "total_steps": 134280, "loss": 0.798, "lr": 2.4434308534843074e-05, "epoch": 19.673071194518915, "percentage": 98.37, "elapsed_time": "8:09:18", "remaining_time": "0:08:07", "throughput": 2612.1, "total_tokens": 76686432} +{"current_steps": 132090, "total_steps": 134280, "loss": 0.8101, "lr": 2.4323197908658334e-05, "epoch": 19.673815907059875, "percentage": 98.37, "elapsed_time": "8:09:19", "remaining_time": "0:08:06", "throughput": 2612.1, "total_tokens": 76689120} +{"current_steps": 132095, "total_steps": 134280, "loss": 0.794, "lr": 2.421234028131047e-05, "epoch": 19.674560619600832, "percentage": 98.37, "elapsed_time": "8:09:20", "remaining_time": "0:08:05", "throughput": 2612.11, "total_tokens": 76692096} +{"current_steps": 132100, "total_steps": 134280, "loss": 0.7861, "lr": 2.4101735654676324e-05, "epoch": 19.675305332141793, "percentage": 98.38, "elapsed_time": "8:09:21", "remaining_time": "0:08:04", "throughput": 2612.12, "total_tokens": 76695040} +{"current_steps": 132105, "total_steps": 134280, "loss": 0.7856, "lr": 2.3991384030621066e-05, "epoch": 19.676050044682754, "percentage": 98.38, "elapsed_time": "8:09:22", "remaining_time": "0:08:03", "throughput": 2612.12, "total_tokens": 76697952} +{"current_steps": 132110, "total_steps": 134280, "loss": 0.7895, "lr": 2.388128541101153e-05, "epoch": 19.67679475722371, "percentage": 98.38, "elapsed_time": "8:09:23", "remaining_time": "0:08:02", "throughput": 2612.12, "total_tokens": 76700512} +{"current_steps": 132115, "total_steps": 134280, "loss": 0.7897, "lr": 2.377143979770624e-05, "epoch": 19.67753946976467, "percentage": 98.39, "elapsed_time": "8:09:24", "remaining_time": "0:08:01", "throughput": 2612.13, "total_tokens": 76703680} +{"current_steps": 132120, "total_steps": 134280, "loss": 0.7806, "lr": 2.366184719256037e-05, "epoch": 19.67828418230563, "percentage": 98.39, "elapsed_time": "8:09:25", "remaining_time": "0:08:00", "throughput": 2612.13, "total_tokens": 76706400} +{"current_steps": 132125, "total_steps": 134280, "loss": 0.8163, "lr": 2.355250759742744e-05, "epoch": 19.67902889484659, "percentage": 98.4, "elapsed_time": "8:09:26", "remaining_time": "0:07:58", "throughput": 2612.14, "total_tokens": 76709344} +{"current_steps": 132130, "total_steps": 134280, "loss": 0.7931, "lr": 2.3443421014154307e-05, "epoch": 19.67977360738755, "percentage": 98.4, "elapsed_time": "8:09:27", "remaining_time": "0:07:57", "throughput": 2612.14, "total_tokens": 76712352} +{"current_steps": 132135, "total_steps": 134280, "loss": 0.7902, "lr": 2.3334587444581166e-05, "epoch": 19.680518319928506, "percentage": 98.4, "elapsed_time": "8:09:28", "remaining_time": "0:07:56", "throughput": 2612.15, "total_tokens": 76715264} +{"current_steps": 132140, "total_steps": 134280, "loss": 0.8062, "lr": 2.3226006890549875e-05, "epoch": 19.681263032469467, "percentage": 98.41, "elapsed_time": "8:09:29", "remaining_time": "0:07:55", "throughput": 2612.15, "total_tokens": 76718272} +{"current_steps": 132145, "total_steps": 134280, "loss": 0.7842, "lr": 2.3117679353892307e-05, "epoch": 19.682007745010427, "percentage": 98.41, "elapsed_time": "8:09:30", "remaining_time": "0:07:54", "throughput": 2612.16, "total_tokens": 76721408} +{"current_steps": 132150, "total_steps": 134280, "loss": 0.7973, "lr": 2.300960483644032e-05, "epoch": 19.682752457551384, "percentage": 98.41, "elapsed_time": "8:09:31", "remaining_time": "0:07:53", "throughput": 2612.16, "total_tokens": 76724064} +{"current_steps": 132155, "total_steps": 134280, "loss": 0.7914, "lr": 2.2901783340019132e-05, "epoch": 19.683497170092345, "percentage": 98.42, "elapsed_time": "8:09:32", "remaining_time": "0:07:52", "throughput": 2612.17, "total_tokens": 76726880} +{"current_steps": 132160, "total_steps": 134280, "loss": 0.7803, "lr": 2.2794214866450613e-05, "epoch": 19.684241882633305, "percentage": 98.42, "elapsed_time": "8:09:33", "remaining_time": "0:07:51", "throughput": 2612.17, "total_tokens": 76729728} +{"current_steps": 132165, "total_steps": 134280, "loss": 0.8011, "lr": 2.2686899417551642e-05, "epoch": 19.684986595174262, "percentage": 98.42, "elapsed_time": "8:09:34", "remaining_time": "0:07:50", "throughput": 2612.17, "total_tokens": 76732320} +{"current_steps": 132170, "total_steps": 134280, "loss": 0.7909, "lr": 2.257983699513577e-05, "epoch": 19.685731307715223, "percentage": 98.43, "elapsed_time": "8:09:36", "remaining_time": "0:07:48", "throughput": 2612.18, "total_tokens": 76735424} +{"current_steps": 132175, "total_steps": 134280, "loss": 0.8208, "lr": 2.2473027601009887e-05, "epoch": 19.68647602025618, "percentage": 98.43, "elapsed_time": "8:09:37", "remaining_time": "0:07:47", "throughput": 2612.18, "total_tokens": 76738240} +{"current_steps": 132180, "total_steps": 134280, "loss": 0.7886, "lr": 2.2366471236980876e-05, "epoch": 19.68722073279714, "percentage": 98.44, "elapsed_time": "8:09:38", "remaining_time": "0:07:46", "throughput": 2612.19, "total_tokens": 76741216} +{"current_steps": 132185, "total_steps": 134280, "loss": 0.8051, "lr": 2.2260167904847304e-05, "epoch": 19.6879654453381, "percentage": 98.44, "elapsed_time": "8:09:39", "remaining_time": "0:07:45", "throughput": 2612.19, "total_tokens": 76743872} +{"current_steps": 132190, "total_steps": 134280, "loss": 0.7857, "lr": 2.21541176064044e-05, "epoch": 19.688710157879058, "percentage": 98.44, "elapsed_time": "8:09:40", "remaining_time": "0:07:44", "throughput": 2612.19, "total_tokens": 76746752} +{"current_steps": 132195, "total_steps": 134280, "loss": 0.7932, "lr": 2.2048320343445726e-05, "epoch": 19.68945487042002, "percentage": 98.45, "elapsed_time": "8:09:41", "remaining_time": "0:07:43", "throughput": 2612.2, "total_tokens": 76749696} +{"current_steps": 132200, "total_steps": 134280, "loss": 0.7979, "lr": 2.194277611775819e-05, "epoch": 19.69019958296098, "percentage": 98.45, "elapsed_time": "8:09:42", "remaining_time": "0:07:42", "throughput": 2612.21, "total_tokens": 76753024} +{"current_steps": 132205, "total_steps": 134280, "loss": 0.8052, "lr": 2.1837484931123697e-05, "epoch": 19.690944295501936, "percentage": 98.45, "elapsed_time": "8:09:43", "remaining_time": "0:07:41", "throughput": 2612.22, "total_tokens": 76756160} +{"current_steps": 132210, "total_steps": 134280, "loss": 0.7876, "lr": 2.173244678532249e-05, "epoch": 19.691689008042896, "percentage": 98.46, "elapsed_time": "8:09:44", "remaining_time": "0:07:40", "throughput": 2612.22, "total_tokens": 76759168} +{"current_steps": 132215, "total_steps": 134280, "loss": 0.7938, "lr": 2.162766168212815e-05, "epoch": 19.692433720583853, "percentage": 98.46, "elapsed_time": "8:09:45", "remaining_time": "0:07:38", "throughput": 2612.22, "total_tokens": 76761760} +{"current_steps": 132220, "total_steps": 134280, "loss": 0.7989, "lr": 2.1523129623310932e-05, "epoch": 19.693178433124814, "percentage": 98.47, "elapsed_time": "8:09:46", "remaining_time": "0:07:37", "throughput": 2612.23, "total_tokens": 76764672} +{"current_steps": 132225, "total_steps": 134280, "loss": 0.7875, "lr": 2.141885061063775e-05, "epoch": 19.693923145665774, "percentage": 98.47, "elapsed_time": "8:09:47", "remaining_time": "0:07:36", "throughput": 2612.23, "total_tokens": 76767328} +{"current_steps": 132230, "total_steps": 134280, "loss": 0.8013, "lr": 2.1314824645868867e-05, "epoch": 19.69466785820673, "percentage": 98.47, "elapsed_time": "8:09:48", "remaining_time": "0:07:35", "throughput": 2612.23, "total_tokens": 76770016} +{"current_steps": 132235, "total_steps": 134280, "loss": 0.8032, "lr": 2.1211051730762876e-05, "epoch": 19.695412570747692, "percentage": 98.48, "elapsed_time": "8:09:49", "remaining_time": "0:07:34", "throughput": 2612.24, "total_tokens": 76773312} +{"current_steps": 132240, "total_steps": 134280, "loss": 0.8172, "lr": 2.1107531867071703e-05, "epoch": 19.69615728328865, "percentage": 98.48, "elapsed_time": "8:09:50", "remaining_time": "0:07:33", "throughput": 2612.25, "total_tokens": 76776512} +{"current_steps": 132245, "total_steps": 134280, "loss": 0.8071, "lr": 2.100426505654562e-05, "epoch": 19.69690199582961, "percentage": 98.48, "elapsed_time": "8:09:51", "remaining_time": "0:07:32", "throughput": 2612.25, "total_tokens": 76779264} +{"current_steps": 132250, "total_steps": 134280, "loss": 0.7977, "lr": 2.090125130092657e-05, "epoch": 19.69764670837057, "percentage": 98.49, "elapsed_time": "8:09:53", "remaining_time": "0:07:31", "throughput": 2612.26, "total_tokens": 76782240} +{"current_steps": 132255, "total_steps": 134280, "loss": 0.8103, "lr": 2.0798490601958154e-05, "epoch": 19.698391420911527, "percentage": 98.49, "elapsed_time": "8:09:54", "remaining_time": "0:07:30", "throughput": 2612.26, "total_tokens": 76785056} +{"current_steps": 132260, "total_steps": 134280, "loss": 0.7941, "lr": 2.0695982961375646e-05, "epoch": 19.699136133452487, "percentage": 98.5, "elapsed_time": "8:09:55", "remaining_time": "0:07:28", "throughput": 2612.26, "total_tokens": 76787744} +{"current_steps": 132265, "total_steps": 134280, "loss": 0.8014, "lr": 2.0593728380911003e-05, "epoch": 19.699880845993448, "percentage": 98.5, "elapsed_time": "8:09:56", "remaining_time": "0:07:27", "throughput": 2612.27, "total_tokens": 76790976} +{"current_steps": 132270, "total_steps": 134280, "loss": 0.7889, "lr": 2.0491726862289505e-05, "epoch": 19.700625558534405, "percentage": 98.5, "elapsed_time": "8:09:57", "remaining_time": "0:07:26", "throughput": 2612.28, "total_tokens": 76793760} +{"current_steps": 132275, "total_steps": 134280, "loss": 0.8015, "lr": 2.0389978407234775e-05, "epoch": 19.701370271075366, "percentage": 98.51, "elapsed_time": "8:09:58", "remaining_time": "0:07:25", "throughput": 2612.28, "total_tokens": 76796640} +{"current_steps": 132280, "total_steps": 134280, "loss": 0.8146, "lr": 2.028848301746877e-05, "epoch": 19.702114983616323, "percentage": 98.51, "elapsed_time": "8:09:59", "remaining_time": "0:07:24", "throughput": 2612.29, "total_tokens": 76799872} +{"current_steps": 132285, "total_steps": 134280, "loss": 0.8047, "lr": 2.0187240694703455e-05, "epoch": 19.702859696157283, "percentage": 98.51, "elapsed_time": "8:10:00", "remaining_time": "0:07:23", "throughput": 2612.29, "total_tokens": 76802656} +{"current_steps": 132290, "total_steps": 134280, "loss": 0.8068, "lr": 2.0086251440649128e-05, "epoch": 19.703604408698244, "percentage": 98.52, "elapsed_time": "8:10:01", "remaining_time": "0:07:22", "throughput": 2612.3, "total_tokens": 76805568} +{"current_steps": 132295, "total_steps": 134280, "loss": 0.8089, "lr": 1.9985515257012752e-05, "epoch": 19.7043491212392, "percentage": 98.52, "elapsed_time": "8:10:02", "remaining_time": "0:07:21", "throughput": 2612.3, "total_tokens": 76808480} +{"current_steps": 132300, "total_steps": 134280, "loss": 0.8217, "lr": 1.988503214549797e-05, "epoch": 19.70509383378016, "percentage": 98.53, "elapsed_time": "8:10:03", "remaining_time": "0:07:20", "throughput": 2612.31, "total_tokens": 76811328} +{"current_steps": 132305, "total_steps": 134280, "loss": 0.8218, "lr": 1.9784802107798427e-05, "epoch": 19.70583854632112, "percentage": 98.53, "elapsed_time": "8:10:04", "remaining_time": "0:07:18", "throughput": 2612.32, "total_tokens": 76814400} +{"current_steps": 132310, "total_steps": 134280, "loss": 0.8165, "lr": 1.9684825145611096e-05, "epoch": 19.70658325886208, "percentage": 98.53, "elapsed_time": "8:10:05", "remaining_time": "0:07:17", "throughput": 2612.32, "total_tokens": 76817088} +{"current_steps": 132315, "total_steps": 134280, "loss": 0.7985, "lr": 1.9585101260621297e-05, "epoch": 19.70732797140304, "percentage": 98.54, "elapsed_time": "8:10:06", "remaining_time": "0:07:16", "throughput": 2612.32, "total_tokens": 76819840} +{"current_steps": 132320, "total_steps": 134280, "loss": 0.8068, "lr": 1.9485630454517677e-05, "epoch": 19.708072683943996, "percentage": 98.54, "elapsed_time": "8:10:07", "remaining_time": "0:07:15", "throughput": 2612.33, "total_tokens": 76822880} +{"current_steps": 132325, "total_steps": 134280, "loss": 0.7961, "lr": 1.938641272897723e-05, "epoch": 19.708817396484957, "percentage": 98.54, "elapsed_time": "8:10:08", "remaining_time": "0:07:14", "throughput": 2612.34, "total_tokens": 76826176} +{"current_steps": 132330, "total_steps": 134280, "loss": 0.7964, "lr": 1.9287448085678615e-05, "epoch": 19.709562109025917, "percentage": 98.55, "elapsed_time": "8:10:10", "remaining_time": "0:07:13", "throughput": 2612.35, "total_tokens": 76829184} +{"current_steps": 132335, "total_steps": 134280, "loss": 0.795, "lr": 1.9188736526293825e-05, "epoch": 19.710306821566874, "percentage": 98.55, "elapsed_time": "8:10:11", "remaining_time": "0:07:12", "throughput": 2612.35, "total_tokens": 76832064} +{"current_steps": 132340, "total_steps": 134280, "loss": 0.7929, "lr": 1.9090278052488195e-05, "epoch": 19.711051534107835, "percentage": 98.56, "elapsed_time": "8:10:12", "remaining_time": "0:07:11", "throughput": 2612.35, "total_tokens": 76835040} +{"current_steps": 132345, "total_steps": 134280, "loss": 0.7976, "lr": 1.899207266592706e-05, "epoch": 19.711796246648795, "percentage": 98.56, "elapsed_time": "8:10:13", "remaining_time": "0:07:10", "throughput": 2612.36, "total_tokens": 76837856} +{"current_steps": 132350, "total_steps": 134280, "loss": 0.7883, "lr": 1.889412036826743e-05, "epoch": 19.712540959189752, "percentage": 98.56, "elapsed_time": "8:10:14", "remaining_time": "0:07:08", "throughput": 2612.36, "total_tokens": 76840672} +{"current_steps": 132355, "total_steps": 134280, "loss": 0.7955, "lr": 1.879642116116631e-05, "epoch": 19.713285671730713, "percentage": 98.57, "elapsed_time": "8:10:15", "remaining_time": "0:07:07", "throughput": 2612.37, "total_tokens": 76843520} +{"current_steps": 132360, "total_steps": 134280, "loss": 0.7925, "lr": 1.8698975046274047e-05, "epoch": 19.71403038427167, "percentage": 98.57, "elapsed_time": "8:10:16", "remaining_time": "0:07:06", "throughput": 2612.37, "total_tokens": 76846528} +{"current_steps": 132365, "total_steps": 134280, "loss": 0.7984, "lr": 1.860178202523599e-05, "epoch": 19.71477509681263, "percentage": 98.57, "elapsed_time": "8:10:17", "remaining_time": "0:07:05", "throughput": 2612.38, "total_tokens": 76849344} +{"current_steps": 132370, "total_steps": 134280, "loss": 0.807, "lr": 1.8504842099694163e-05, "epoch": 19.71551980935359, "percentage": 98.58, "elapsed_time": "8:10:18", "remaining_time": "0:07:04", "throughput": 2612.39, "total_tokens": 76852704} +{"current_steps": 132375, "total_steps": 134280, "loss": 0.797, "lr": 1.8408155271287253e-05, "epoch": 19.716264521894548, "percentage": 98.58, "elapsed_time": "8:10:19", "remaining_time": "0:07:03", "throughput": 2612.39, "total_tokens": 76855424} +{"current_steps": 132380, "total_steps": 134280, "loss": 0.7989, "lr": 1.8311721541647284e-05, "epoch": 19.71700923443551, "percentage": 98.59, "elapsed_time": "8:10:20", "remaining_time": "0:07:02", "throughput": 2612.4, "total_tokens": 76858496} +{"current_steps": 132385, "total_steps": 134280, "loss": 0.7834, "lr": 1.8215540912404627e-05, "epoch": 19.717753946976465, "percentage": 98.59, "elapsed_time": "8:10:21", "remaining_time": "0:07:01", "throughput": 2612.4, "total_tokens": 76860960} +{"current_steps": 132390, "total_steps": 134280, "loss": 0.7986, "lr": 1.8119613385182975e-05, "epoch": 19.718498659517426, "percentage": 98.59, "elapsed_time": "8:10:22", "remaining_time": "0:07:00", "throughput": 2612.4, "total_tokens": 76863904} +{"current_steps": 132395, "total_steps": 134280, "loss": 0.7848, "lr": 1.8023938961604368e-05, "epoch": 19.719243372058386, "percentage": 98.6, "elapsed_time": "8:10:23", "remaining_time": "0:06:58", "throughput": 2612.4, "total_tokens": 76866688} +{"current_steps": 132400, "total_steps": 134280, "loss": 0.7828, "lr": 1.7928517643282515e-05, "epoch": 19.719988084599343, "percentage": 98.6, "elapsed_time": "8:10:24", "remaining_time": "0:06:57", "throughput": 2612.41, "total_tokens": 76869728} +{"current_steps": 132405, "total_steps": 134280, "loss": 0.7998, "lr": 1.783334943183279e-05, "epoch": 19.720732797140304, "percentage": 98.6, "elapsed_time": "8:10:25", "remaining_time": "0:06:56", "throughput": 2612.42, "total_tokens": 76872864} +{"current_steps": 132410, "total_steps": 134280, "loss": 0.7935, "lr": 1.7738434328860575e-05, "epoch": 19.721477509681264, "percentage": 98.61, "elapsed_time": "8:10:27", "remaining_time": "0:06:55", "throughput": 2612.43, "total_tokens": 76875840} +{"current_steps": 132415, "total_steps": 134280, "loss": 0.8105, "lr": 1.7643772335971253e-05, "epoch": 19.72222222222222, "percentage": 98.61, "elapsed_time": "8:10:28", "remaining_time": "0:06:54", "throughput": 2612.43, "total_tokens": 76878848} +{"current_steps": 132420, "total_steps": 134280, "loss": 0.8126, "lr": 1.754936345476188e-05, "epoch": 19.722966934763182, "percentage": 98.61, "elapsed_time": "8:10:29", "remaining_time": "0:06:53", "throughput": 2612.44, "total_tokens": 76881792} +{"current_steps": 132425, "total_steps": 134280, "loss": 0.795, "lr": 1.745520768682951e-05, "epoch": 19.72371164730414, "percentage": 98.62, "elapsed_time": "8:10:30", "remaining_time": "0:06:52", "throughput": 2612.45, "total_tokens": 76884832} +{"current_steps": 132430, "total_steps": 134280, "loss": 0.78, "lr": 1.736130503376454e-05, "epoch": 19.7244563598451, "percentage": 98.62, "elapsed_time": "8:10:31", "remaining_time": "0:06:51", "throughput": 2612.45, "total_tokens": 76887616} +{"current_steps": 132435, "total_steps": 134280, "loss": 0.7985, "lr": 1.7267655497150702e-05, "epoch": 19.72520107238606, "percentage": 98.63, "elapsed_time": "8:10:32", "remaining_time": "0:06:50", "throughput": 2612.46, "total_tokens": 76890816} +{"current_steps": 132440, "total_steps": 134280, "loss": 0.8014, "lr": 1.7174259078573396e-05, "epoch": 19.725945784927017, "percentage": 98.63, "elapsed_time": "8:10:33", "remaining_time": "0:06:48", "throughput": 2612.47, "total_tokens": 76894112} +{"current_steps": 132445, "total_steps": 134280, "loss": 0.8194, "lr": 1.7081115779608023e-05, "epoch": 19.726690497467978, "percentage": 98.63, "elapsed_time": "8:10:34", "remaining_time": "0:06:47", "throughput": 2612.48, "total_tokens": 76897056} +{"current_steps": 132450, "total_steps": 134280, "loss": 0.7935, "lr": 1.6988225601829997e-05, "epoch": 19.727435210008938, "percentage": 98.64, "elapsed_time": "8:10:35", "remaining_time": "0:06:46", "throughput": 2612.48, "total_tokens": 76899872} +{"current_steps": 132455, "total_steps": 134280, "loss": 0.824, "lr": 1.689558854680806e-05, "epoch": 19.728179922549895, "percentage": 98.64, "elapsed_time": "8:10:36", "remaining_time": "0:06:45", "throughput": 2612.49, "total_tokens": 76902944} +{"current_steps": 132460, "total_steps": 134280, "loss": 0.8126, "lr": 1.6803204616105958e-05, "epoch": 19.728924635090856, "percentage": 98.64, "elapsed_time": "8:10:37", "remaining_time": "0:06:44", "throughput": 2612.49, "total_tokens": 76905504} +{"current_steps": 132465, "total_steps": 134280, "loss": 0.8116, "lr": 1.671107381128578e-05, "epoch": 19.729669347631813, "percentage": 98.65, "elapsed_time": "8:10:38", "remaining_time": "0:06:43", "throughput": 2612.49, "total_tokens": 76908640} +{"current_steps": 132470, "total_steps": 134280, "loss": 0.7993, "lr": 1.661919613390461e-05, "epoch": 19.730414060172773, "percentage": 98.65, "elapsed_time": "8:10:39", "remaining_time": "0:06:42", "throughput": 2612.5, "total_tokens": 76911808} +{"current_steps": 132475, "total_steps": 134280, "loss": 0.7987, "lr": 1.6527571585512878e-05, "epoch": 19.731158772713734, "percentage": 98.66, "elapsed_time": "8:10:40", "remaining_time": "0:06:41", "throughput": 2612.51, "total_tokens": 76914688} +{"current_steps": 132480, "total_steps": 134280, "loss": 0.797, "lr": 1.6436200167659344e-05, "epoch": 19.73190348525469, "percentage": 98.66, "elapsed_time": "8:10:41", "remaining_time": "0:06:40", "throughput": 2612.51, "total_tokens": 76917536} +{"current_steps": 132485, "total_steps": 134280, "loss": 0.7745, "lr": 1.634508188188777e-05, "epoch": 19.73264819779565, "percentage": 98.66, "elapsed_time": "8:10:43", "remaining_time": "0:06:38", "throughput": 2612.51, "total_tokens": 76920320} +{"current_steps": 132490, "total_steps": 134280, "loss": 0.8221, "lr": 1.625421672973859e-05, "epoch": 19.73339291033661, "percentage": 98.67, "elapsed_time": "8:10:44", "remaining_time": "0:06:37", "throughput": 2612.52, "total_tokens": 76923392} +{"current_steps": 132495, "total_steps": 134280, "loss": 0.8115, "lr": 1.6163604712743917e-05, "epoch": 19.73413762287757, "percentage": 98.67, "elapsed_time": "8:10:45", "remaining_time": "0:06:36", "throughput": 2612.52, "total_tokens": 76926112} +{"current_steps": 132500, "total_steps": 134280, "loss": 0.7813, "lr": 1.6073245832435856e-05, "epoch": 19.73488233541853, "percentage": 98.67, "elapsed_time": "8:10:46", "remaining_time": "0:06:35", "throughput": 2612.53, "total_tokens": 76929344} +{"current_steps": 132505, "total_steps": 134280, "loss": 0.8128, "lr": 1.5983140090343185e-05, "epoch": 19.735627047959486, "percentage": 98.68, "elapsed_time": "8:10:47", "remaining_time": "0:06:34", "throughput": 2612.54, "total_tokens": 76932352} +{"current_steps": 132510, "total_steps": 134280, "loss": 0.7942, "lr": 1.5893287487984687e-05, "epoch": 19.736371760500447, "percentage": 98.68, "elapsed_time": "8:10:48", "remaining_time": "0:06:33", "throughput": 2612.54, "total_tokens": 76935040} +{"current_steps": 132515, "total_steps": 134280, "loss": 0.7745, "lr": 1.5803688026880814e-05, "epoch": 19.737116473041407, "percentage": 98.69, "elapsed_time": "8:10:49", "remaining_time": "0:06:32", "throughput": 2612.54, "total_tokens": 76937920} +{"current_steps": 132520, "total_steps": 134280, "loss": 0.7983, "lr": 1.571434170854369e-05, "epoch": 19.737861185582364, "percentage": 98.69, "elapsed_time": "8:10:50", "remaining_time": "0:06:31", "throughput": 2612.54, "total_tokens": 76940544} +{"current_steps": 132525, "total_steps": 134280, "loss": 0.8014, "lr": 1.5625248534483772e-05, "epoch": 19.738605898123325, "percentage": 98.69, "elapsed_time": "8:10:51", "remaining_time": "0:06:30", "throughput": 2612.54, "total_tokens": 76943488} +{"current_steps": 132530, "total_steps": 134280, "loss": 0.7877, "lr": 1.553640850620652e-05, "epoch": 19.73935061066428, "percentage": 98.7, "elapsed_time": "8:10:52", "remaining_time": "0:06:28", "throughput": 2612.54, "total_tokens": 76946048} +{"current_steps": 132535, "total_steps": 134280, "loss": 0.7953, "lr": 1.5447821625210745e-05, "epoch": 19.740095323205242, "percentage": 98.7, "elapsed_time": "8:10:53", "remaining_time": "0:06:27", "throughput": 2612.55, "total_tokens": 76948960} +{"current_steps": 132540, "total_steps": 134280, "loss": 0.8251, "lr": 1.5359487892995237e-05, "epoch": 19.740840035746203, "percentage": 98.7, "elapsed_time": "8:10:54", "remaining_time": "0:06:26", "throughput": 2612.56, "total_tokens": 76952064} +{"current_steps": 132545, "total_steps": 134280, "loss": 0.8091, "lr": 1.527140731105214e-05, "epoch": 19.74158474828716, "percentage": 98.71, "elapsed_time": "8:10:55", "remaining_time": "0:06:25", "throughput": 2612.56, "total_tokens": 76954720} +{"current_steps": 132550, "total_steps": 134280, "loss": 0.8012, "lr": 1.5183579880868602e-05, "epoch": 19.74232946082812, "percentage": 98.71, "elapsed_time": "8:10:56", "remaining_time": "0:06:24", "throughput": 2612.56, "total_tokens": 76957664} +{"current_steps": 132555, "total_steps": 134280, "loss": 0.7874, "lr": 1.5096005603926764e-05, "epoch": 19.74307417336908, "percentage": 98.72, "elapsed_time": "8:10:57", "remaining_time": "0:06:23", "throughput": 2612.57, "total_tokens": 76960704} +{"current_steps": 132560, "total_steps": 134280, "loss": 0.7903, "lr": 1.5008684481710443e-05, "epoch": 19.743818885910038, "percentage": 98.72, "elapsed_time": "8:10:58", "remaining_time": "0:06:22", "throughput": 2612.57, "total_tokens": 76963584} +{"current_steps": 132565, "total_steps": 134280, "loss": 0.8017, "lr": 1.4921616515690128e-05, "epoch": 19.744563598451, "percentage": 98.72, "elapsed_time": "8:10:59", "remaining_time": "0:06:21", "throughput": 2612.57, "total_tokens": 76966336} +{"current_steps": 132570, "total_steps": 134280, "loss": 0.8037, "lr": 1.483480170733964e-05, "epoch": 19.74530831099196, "percentage": 98.73, "elapsed_time": "8:11:01", "remaining_time": "0:06:20", "throughput": 2612.58, "total_tokens": 76969216} +{"current_steps": 132575, "total_steps": 134280, "loss": 0.7893, "lr": 1.4748240058126138e-05, "epoch": 19.746053023532916, "percentage": 98.73, "elapsed_time": "8:11:02", "remaining_time": "0:06:18", "throughput": 2612.6, "total_tokens": 76972640} +{"current_steps": 132580, "total_steps": 134280, "loss": 0.8006, "lr": 1.4661931569510123e-05, "epoch": 19.746797736073876, "percentage": 98.73, "elapsed_time": "8:11:03", "remaining_time": "0:06:17", "throughput": 2612.6, "total_tokens": 76975488} +{"current_steps": 132585, "total_steps": 134280, "loss": 0.7832, "lr": 1.4575876242950425e-05, "epoch": 19.747542448614833, "percentage": 98.74, "elapsed_time": "8:11:04", "remaining_time": "0:06:16", "throughput": 2612.6, "total_tokens": 76978272} +{"current_steps": 132590, "total_steps": 134280, "loss": 0.795, "lr": 1.4490074079899218e-05, "epoch": 19.748287161155794, "percentage": 98.74, "elapsed_time": "8:11:05", "remaining_time": "0:06:15", "throughput": 2612.61, "total_tokens": 76981152} +{"current_steps": 132595, "total_steps": 134280, "loss": 0.7943, "lr": 1.4404525081810338e-05, "epoch": 19.749031873696755, "percentage": 98.75, "elapsed_time": "8:11:06", "remaining_time": "0:06:14", "throughput": 2612.61, "total_tokens": 76983936} +{"current_steps": 132600, "total_steps": 134280, "loss": 0.7965, "lr": 1.4319229250124299e-05, "epoch": 19.74977658623771, "percentage": 98.75, "elapsed_time": "8:11:07", "remaining_time": "0:06:13", "throughput": 2612.61, "total_tokens": 76986944} +{"current_steps": 132605, "total_steps": 134280, "loss": 0.7809, "lr": 1.4234186586284947e-05, "epoch": 19.750521298778672, "percentage": 98.75, "elapsed_time": "8:11:08", "remaining_time": "0:06:12", "throughput": 2612.63, "total_tokens": 76990464} +{"current_steps": 132610, "total_steps": 134280, "loss": 0.7934, "lr": 1.4149397091727799e-05, "epoch": 19.75126601131963, "percentage": 98.76, "elapsed_time": "8:11:09", "remaining_time": "0:06:11", "throughput": 2612.63, "total_tokens": 76993312} +{"current_steps": 132615, "total_steps": 134280, "loss": 0.8022, "lr": 1.4064860767885046e-05, "epoch": 19.75201072386059, "percentage": 98.76, "elapsed_time": "8:11:10", "remaining_time": "0:06:10", "throughput": 2612.63, "total_tokens": 76996032} +{"current_steps": 132620, "total_steps": 134280, "loss": 0.795, "lr": 1.3980577616187206e-05, "epoch": 19.75275543640155, "percentage": 98.76, "elapsed_time": "8:11:11", "remaining_time": "0:06:08", "throughput": 2612.64, "total_tokens": 76998880} +{"current_steps": 132625, "total_steps": 134280, "loss": 0.7852, "lr": 1.3896547638054812e-05, "epoch": 19.753500148942507, "percentage": 98.77, "elapsed_time": "8:11:12", "remaining_time": "0:06:07", "throughput": 2612.65, "total_tokens": 77002016} +{"current_steps": 132630, "total_steps": 134280, "loss": 0.7964, "lr": 1.381277083491006e-05, "epoch": 19.754244861483468, "percentage": 98.77, "elapsed_time": "8:11:13", "remaining_time": "0:06:06", "throughput": 2612.65, "total_tokens": 77004672} +{"current_steps": 132635, "total_steps": 134280, "loss": 0.8281, "lr": 1.3729247208166816e-05, "epoch": 19.754989574024428, "percentage": 98.77, "elapsed_time": "8:11:14", "remaining_time": "0:06:05", "throughput": 2612.65, "total_tokens": 77007584} +{"current_steps": 132640, "total_steps": 134280, "loss": 0.7974, "lr": 1.3645976759235623e-05, "epoch": 19.755734286565385, "percentage": 98.78, "elapsed_time": "8:11:15", "remaining_time": "0:06:04", "throughput": 2612.66, "total_tokens": 77010528} +{"current_steps": 132645, "total_steps": 134280, "loss": 0.8173, "lr": 1.356295948952535e-05, "epoch": 19.756478999106346, "percentage": 98.78, "elapsed_time": "8:11:16", "remaining_time": "0:06:03", "throughput": 2612.66, "total_tokens": 77013440} +{"current_steps": 132650, "total_steps": 134280, "loss": 0.7838, "lr": 1.3480195400436545e-05, "epoch": 19.757223711647303, "percentage": 98.79, "elapsed_time": "8:11:18", "remaining_time": "0:06:02", "throughput": 2612.67, "total_tokens": 77016320} +{"current_steps": 132655, "total_steps": 134280, "loss": 0.7925, "lr": 1.3397684493369754e-05, "epoch": 19.757968424188263, "percentage": 98.79, "elapsed_time": "8:11:19", "remaining_time": "0:06:01", "throughput": 2612.67, "total_tokens": 77019328} +{"current_steps": 132660, "total_steps": 134280, "loss": 0.7894, "lr": 1.3315426769715532e-05, "epoch": 19.758713136729224, "percentage": 98.79, "elapsed_time": "8:11:20", "remaining_time": "0:06:00", "throughput": 2612.68, "total_tokens": 77022368} +{"current_steps": 132665, "total_steps": 134280, "loss": 0.7892, "lr": 1.3233422230867764e-05, "epoch": 19.75945784927018, "percentage": 98.8, "elapsed_time": "8:11:21", "remaining_time": "0:05:58", "throughput": 2612.69, "total_tokens": 77025600} +{"current_steps": 132670, "total_steps": 134280, "loss": 0.7915, "lr": 1.315167087820701e-05, "epoch": 19.76020256181114, "percentage": 98.8, "elapsed_time": "8:11:22", "remaining_time": "0:05:57", "throughput": 2612.69, "total_tokens": 77028384} +{"current_steps": 132675, "total_steps": 134280, "loss": 0.7995, "lr": 1.3070172713118833e-05, "epoch": 19.7609472743521, "percentage": 98.8, "elapsed_time": "8:11:23", "remaining_time": "0:05:56", "throughput": 2612.69, "total_tokens": 77030944} +{"current_steps": 132680, "total_steps": 134280, "loss": 0.8098, "lr": 1.2988927736977129e-05, "epoch": 19.76169198689306, "percentage": 98.81, "elapsed_time": "8:11:24", "remaining_time": "0:05:55", "throughput": 2612.69, "total_tokens": 77033696} +{"current_steps": 132685, "total_steps": 134280, "loss": 0.7901, "lr": 1.2907935951154136e-05, "epoch": 19.76243669943402, "percentage": 98.81, "elapsed_time": "8:11:25", "remaining_time": "0:05:54", "throughput": 2612.69, "total_tokens": 77036576} +{"current_steps": 132690, "total_steps": 134280, "loss": 0.7947, "lr": 1.2827197357020425e-05, "epoch": 19.763181411974976, "percentage": 98.82, "elapsed_time": "8:11:26", "remaining_time": "0:05:53", "throughput": 2612.7, "total_tokens": 77039584} +{"current_steps": 132695, "total_steps": 134280, "loss": 0.7844, "lr": 1.2746711955939905e-05, "epoch": 19.763926124515937, "percentage": 98.82, "elapsed_time": "8:11:27", "remaining_time": "0:05:52", "throughput": 2612.71, "total_tokens": 77042560} +{"current_steps": 132700, "total_steps": 134280, "loss": 0.7794, "lr": 1.2666479749269821e-05, "epoch": 19.764670837056897, "percentage": 98.82, "elapsed_time": "8:11:28", "remaining_time": "0:05:51", "throughput": 2612.71, "total_tokens": 77045440} +{"current_steps": 132705, "total_steps": 134280, "loss": 0.832, "lr": 1.2586500738367423e-05, "epoch": 19.765415549597854, "percentage": 98.83, "elapsed_time": "8:11:29", "remaining_time": "0:05:49", "throughput": 2612.71, "total_tokens": 77048192} +{"current_steps": 132710, "total_steps": 134280, "loss": 0.7791, "lr": 1.2506774924583297e-05, "epoch": 19.766160262138815, "percentage": 98.83, "elapsed_time": "8:11:30", "remaining_time": "0:05:48", "throughput": 2612.72, "total_tokens": 77051072} +{"current_steps": 132715, "total_steps": 134280, "loss": 0.8311, "lr": 1.2427302309266363e-05, "epoch": 19.766904974679775, "percentage": 98.83, "elapsed_time": "8:11:31", "remaining_time": "0:05:47", "throughput": 2612.72, "total_tokens": 77053888} +{"current_steps": 132720, "total_steps": 134280, "loss": 0.7698, "lr": 1.2348082893755551e-05, "epoch": 19.767649687220732, "percentage": 98.84, "elapsed_time": "8:11:32", "remaining_time": "0:05:46", "throughput": 2612.73, "total_tokens": 77056800} +{"current_steps": 132725, "total_steps": 134280, "loss": 0.7986, "lr": 1.2269116679391455e-05, "epoch": 19.768394399761693, "percentage": 98.84, "elapsed_time": "8:11:33", "remaining_time": "0:05:45", "throughput": 2612.73, "total_tokens": 77059744} +{"current_steps": 132730, "total_steps": 134280, "loss": 0.7904, "lr": 1.2190403667509675e-05, "epoch": 19.76913911230265, "percentage": 98.85, "elapsed_time": "8:11:35", "remaining_time": "0:05:44", "throughput": 2612.74, "total_tokens": 77062720} +{"current_steps": 132735, "total_steps": 134280, "loss": 0.7792, "lr": 1.2111943859435815e-05, "epoch": 19.76988382484361, "percentage": 98.85, "elapsed_time": "8:11:36", "remaining_time": "0:05:43", "throughput": 2612.74, "total_tokens": 77065632} +{"current_steps": 132740, "total_steps": 134280, "loss": 0.8013, "lr": 1.2033737256498811e-05, "epoch": 19.77062853738457, "percentage": 98.85, "elapsed_time": "8:11:37", "remaining_time": "0:05:42", "throughput": 2612.74, "total_tokens": 77068416} +{"current_steps": 132745, "total_steps": 134280, "loss": 0.7965, "lr": 1.195578386001761e-05, "epoch": 19.771373249925528, "percentage": 98.86, "elapsed_time": "8:11:38", "remaining_time": "0:05:41", "throughput": 2612.75, "total_tokens": 77071424} +{"current_steps": 132750, "total_steps": 134280, "loss": 0.7998, "lr": 1.1878083671311157e-05, "epoch": 19.77211796246649, "percentage": 98.86, "elapsed_time": "8:11:39", "remaining_time": "0:05:39", "throughput": 2612.76, "total_tokens": 77074336} +{"current_steps": 132755, "total_steps": 134280, "loss": 0.8012, "lr": 1.1800636691691735e-05, "epoch": 19.772862675007445, "percentage": 98.86, "elapsed_time": "8:11:40", "remaining_time": "0:05:38", "throughput": 2612.76, "total_tokens": 77077376} +{"current_steps": 132760, "total_steps": 134280, "loss": 0.8114, "lr": 1.172344292246663e-05, "epoch": 19.773607387548406, "percentage": 98.87, "elapsed_time": "8:11:41", "remaining_time": "0:05:37", "throughput": 2612.76, "total_tokens": 77080032} +{"current_steps": 132765, "total_steps": 134280, "loss": 0.7954, "lr": 1.1646502364939803e-05, "epoch": 19.774352100089367, "percentage": 98.87, "elapsed_time": "8:11:42", "remaining_time": "0:05:36", "throughput": 2612.76, "total_tokens": 77082720} +{"current_steps": 132770, "total_steps": 134280, "loss": 0.7888, "lr": 1.1569815020411878e-05, "epoch": 19.775096812630323, "percentage": 98.88, "elapsed_time": "8:11:43", "remaining_time": "0:05:35", "throughput": 2612.77, "total_tokens": 77085888} +{"current_steps": 132775, "total_steps": 134280, "loss": 0.8131, "lr": 1.149338089018015e-05, "epoch": 19.775841525171284, "percentage": 98.88, "elapsed_time": "8:11:44", "remaining_time": "0:05:34", "throughput": 2612.78, "total_tokens": 77088960} +{"current_steps": 132780, "total_steps": 134280, "loss": 0.8213, "lr": 1.1417199975531922e-05, "epoch": 19.776586237712245, "percentage": 98.88, "elapsed_time": "8:11:45", "remaining_time": "0:05:33", "throughput": 2612.79, "total_tokens": 77092064} +{"current_steps": 132785, "total_steps": 134280, "loss": 0.7941, "lr": 1.134127227775783e-05, "epoch": 19.7773309502532, "percentage": 98.89, "elapsed_time": "8:11:46", "remaining_time": "0:05:32", "throughput": 2612.79, "total_tokens": 77094880} +{"current_steps": 132790, "total_steps": 134280, "loss": 0.8025, "lr": 1.1265597798138515e-05, "epoch": 19.778075662794162, "percentage": 98.89, "elapsed_time": "8:11:47", "remaining_time": "0:05:31", "throughput": 2612.79, "total_tokens": 77097568} +{"current_steps": 132795, "total_steps": 134280, "loss": 0.792, "lr": 1.119017653795462e-05, "epoch": 19.77882037533512, "percentage": 98.89, "elapsed_time": "8:11:48", "remaining_time": "0:05:29", "throughput": 2612.8, "total_tokens": 77100416} +{"current_steps": 132800, "total_steps": 134280, "loss": 0.7817, "lr": 1.1115008498476797e-05, "epoch": 19.77956508787608, "percentage": 98.9, "elapsed_time": "8:11:49", "remaining_time": "0:05:28", "throughput": 2612.8, "total_tokens": 77103360} +{"current_steps": 132805, "total_steps": 134280, "loss": 0.7977, "lr": 1.1040093680977358e-05, "epoch": 19.78030980041704, "percentage": 98.9, "elapsed_time": "8:11:50", "remaining_time": "0:05:27", "throughput": 2612.81, "total_tokens": 77106272} +{"current_steps": 132810, "total_steps": 134280, "loss": 0.7774, "lr": 1.096543208672196e-05, "epoch": 19.781054512957997, "percentage": 98.91, "elapsed_time": "8:11:51", "remaining_time": "0:05:26", "throughput": 2612.81, "total_tokens": 77109024} +{"current_steps": 132815, "total_steps": 134280, "loss": 0.7912, "lr": 1.089102371697126e-05, "epoch": 19.781799225498958, "percentage": 98.91, "elapsed_time": "8:11:52", "remaining_time": "0:05:25", "throughput": 2612.81, "total_tokens": 77111808} +{"current_steps": 132820, "total_steps": 134280, "loss": 0.8034, "lr": 1.081686857298092e-05, "epoch": 19.782543938039918, "percentage": 98.91, "elapsed_time": "8:11:54", "remaining_time": "0:05:24", "throughput": 2612.82, "total_tokens": 77114816} +{"current_steps": 132825, "total_steps": 134280, "loss": 0.788, "lr": 1.0742966656006603e-05, "epoch": 19.783288650580875, "percentage": 98.92, "elapsed_time": "8:11:55", "remaining_time": "0:05:23", "throughput": 2612.82, "total_tokens": 77117728} +{"current_steps": 132830, "total_steps": 134280, "loss": 0.7847, "lr": 1.0669317967295643e-05, "epoch": 19.784033363121836, "percentage": 98.92, "elapsed_time": "8:11:56", "remaining_time": "0:05:22", "throughput": 2612.82, "total_tokens": 77120416} +{"current_steps": 132835, "total_steps": 134280, "loss": 0.7831, "lr": 1.0595922508092047e-05, "epoch": 19.784778075662793, "percentage": 98.92, "elapsed_time": "8:11:57", "remaining_time": "0:05:21", "throughput": 2612.83, "total_tokens": 77123648} +{"current_steps": 132840, "total_steps": 134280, "loss": 0.8007, "lr": 1.052278027963649e-05, "epoch": 19.785522788203753, "percentage": 98.93, "elapsed_time": "8:11:58", "remaining_time": "0:05:19", "throughput": 2612.83, "total_tokens": 77126464} +{"current_steps": 132845, "total_steps": 134280, "loss": 0.7916, "lr": 1.0449891283162982e-05, "epoch": 19.786267500744714, "percentage": 98.93, "elapsed_time": "8:11:59", "remaining_time": "0:05:18", "throughput": 2612.84, "total_tokens": 77129312} +{"current_steps": 132850, "total_steps": 134280, "loss": 0.7927, "lr": 1.0377255519903871e-05, "epoch": 19.78701221328567, "percentage": 98.94, "elapsed_time": "8:12:00", "remaining_time": "0:05:17", "throughput": 2612.84, "total_tokens": 77132032} +{"current_steps": 132855, "total_steps": 134280, "loss": 0.7899, "lr": 1.0304872991086511e-05, "epoch": 19.78775692582663, "percentage": 98.94, "elapsed_time": "8:12:01", "remaining_time": "0:05:16", "throughput": 2612.84, "total_tokens": 77134880} +{"current_steps": 132860, "total_steps": 134280, "loss": 0.7937, "lr": 1.0232743697933255e-05, "epoch": 19.788501638367592, "percentage": 98.94, "elapsed_time": "8:12:02", "remaining_time": "0:05:15", "throughput": 2612.84, "total_tokens": 77137472} +{"current_steps": 132865, "total_steps": 134280, "loss": 0.8061, "lr": 1.0160867641663129e-05, "epoch": 19.78924635090855, "percentage": 98.95, "elapsed_time": "8:12:03", "remaining_time": "0:05:14", "throughput": 2612.84, "total_tokens": 77140320} +{"current_steps": 132870, "total_steps": 134280, "loss": 0.7952, "lr": 1.0089244823490161e-05, "epoch": 19.78999106344951, "percentage": 98.95, "elapsed_time": "8:12:04", "remaining_time": "0:05:13", "throughput": 2612.84, "total_tokens": 77143104} +{"current_steps": 132875, "total_steps": 134280, "loss": 0.7957, "lr": 1.0017875244623386e-05, "epoch": 19.790735775990466, "percentage": 98.95, "elapsed_time": "8:12:05", "remaining_time": "0:05:12", "throughput": 2612.85, "total_tokens": 77146240} +{"current_steps": 132880, "total_steps": 134280, "loss": 0.8091, "lr": 9.94675890627017e-06, "epoch": 19.791480488531427, "percentage": 98.96, "elapsed_time": "8:12:06", "remaining_time": "0:05:11", "throughput": 2612.86, "total_tokens": 77149344} +{"current_steps": 132885, "total_steps": 134280, "loss": 0.793, "lr": 9.87589580963122e-06, "epoch": 19.792225201072387, "percentage": 98.96, "elapsed_time": "8:12:07", "remaining_time": "0:05:09", "throughput": 2612.87, "total_tokens": 77152352} +{"current_steps": 132890, "total_steps": 134280, "loss": 0.7913, "lr": 9.805285955903908e-06, "epoch": 19.792969913613344, "percentage": 98.96, "elapsed_time": "8:12:08", "remaining_time": "0:05:08", "throughput": 2612.87, "total_tokens": 77155168} +{"current_steps": 132895, "total_steps": 134280, "loss": 0.798, "lr": 9.734929346280618e-06, "epoch": 19.793714626154305, "percentage": 98.97, "elapsed_time": "8:12:09", "remaining_time": "0:05:07", "throughput": 2612.87, "total_tokens": 77157920} +{"current_steps": 132900, "total_steps": 134280, "loss": 0.7885, "lr": 9.664825981950398e-06, "epoch": 19.794459338695262, "percentage": 98.97, "elapsed_time": "8:12:10", "remaining_time": "0:05:06", "throughput": 2612.88, "total_tokens": 77160896} +{"current_steps": 132905, "total_steps": 134280, "loss": 0.7921, "lr": 9.594975864097299e-06, "epoch": 19.795204051236222, "percentage": 98.98, "elapsed_time": "8:12:12", "remaining_time": "0:05:05", "throughput": 2612.89, "total_tokens": 77163904} +{"current_steps": 132910, "total_steps": 134280, "loss": 0.7833, "lr": 9.525378993902045e-06, "epoch": 19.795948763777183, "percentage": 98.98, "elapsed_time": "8:12:13", "remaining_time": "0:05:04", "throughput": 2612.89, "total_tokens": 77166688} +{"current_steps": 132915, "total_steps": 134280, "loss": 0.7916, "lr": 9.45603537254036e-06, "epoch": 19.79669347631814, "percentage": 98.98, "elapsed_time": "8:12:14", "remaining_time": "0:05:03", "throughput": 2612.9, "total_tokens": 77169760} +{"current_steps": 132920, "total_steps": 134280, "loss": 0.797, "lr": 9.386945001181312e-06, "epoch": 19.7974381888591, "percentage": 98.99, "elapsed_time": "8:12:15", "remaining_time": "0:05:02", "throughput": 2612.9, "total_tokens": 77172704} +{"current_steps": 132925, "total_steps": 134280, "loss": 0.801, "lr": 9.31810788099563e-06, "epoch": 19.79818290140006, "percentage": 98.99, "elapsed_time": "8:12:16", "remaining_time": "0:05:01", "throughput": 2612.91, "total_tokens": 77175680} +{"current_steps": 132930, "total_steps": 134280, "loss": 0.8083, "lr": 9.24952401314405e-06, "epoch": 19.798927613941018, "percentage": 98.99, "elapsed_time": "8:12:17", "remaining_time": "0:04:59", "throughput": 2612.91, "total_tokens": 77178784} +{"current_steps": 132935, "total_steps": 134280, "loss": 0.809, "lr": 9.181193398787313e-06, "epoch": 19.79967232648198, "percentage": 99.0, "elapsed_time": "8:12:18", "remaining_time": "0:04:58", "throughput": 2612.92, "total_tokens": 77181536} +{"current_steps": 132940, "total_steps": 134280, "loss": 0.7916, "lr": 9.113116039076164e-06, "epoch": 19.800417039022935, "percentage": 99.0, "elapsed_time": "8:12:19", "remaining_time": "0:04:57", "throughput": 2612.92, "total_tokens": 77184512} +{"current_steps": 132945, "total_steps": 134280, "loss": 0.8111, "lr": 9.045291935164679e-06, "epoch": 19.801161751563896, "percentage": 99.01, "elapsed_time": "8:12:20", "remaining_time": "0:04:56", "throughput": 2612.92, "total_tokens": 77187200} +{"current_steps": 132950, "total_steps": 134280, "loss": 0.7867, "lr": 8.977721088195277e-06, "epoch": 19.801906464104857, "percentage": 99.01, "elapsed_time": "8:12:21", "remaining_time": "0:04:55", "throughput": 2612.92, "total_tokens": 77189952} +{"current_steps": 132955, "total_steps": 134280, "loss": 0.7985, "lr": 8.910403499312046e-06, "epoch": 19.802651176645814, "percentage": 99.01, "elapsed_time": "8:12:22", "remaining_time": "0:04:54", "throughput": 2612.93, "total_tokens": 77192896} +{"current_steps": 132960, "total_steps": 134280, "loss": 0.7884, "lr": 8.843339169650744e-06, "epoch": 19.803395889186774, "percentage": 99.02, "elapsed_time": "8:12:23", "remaining_time": "0:04:53", "throughput": 2612.93, "total_tokens": 77195872} +{"current_steps": 132965, "total_steps": 134280, "loss": 0.8095, "lr": 8.77652810034546e-06, "epoch": 19.804140601727735, "percentage": 99.02, "elapsed_time": "8:12:24", "remaining_time": "0:04:52", "throughput": 2612.94, "total_tokens": 77198752} +{"current_steps": 132970, "total_steps": 134280, "loss": 0.7838, "lr": 8.709970292523627e-06, "epoch": 19.80488531426869, "percentage": 99.02, "elapsed_time": "8:12:25", "remaining_time": "0:04:51", "throughput": 2612.94, "total_tokens": 77201600} +{"current_steps": 132975, "total_steps": 134280, "loss": 0.7999, "lr": 8.643665747311014e-06, "epoch": 19.805630026809652, "percentage": 99.03, "elapsed_time": "8:12:26", "remaining_time": "0:04:49", "throughput": 2612.95, "total_tokens": 77204512} +{"current_steps": 132980, "total_steps": 134280, "loss": 0.8013, "lr": 8.577614465826722e-06, "epoch": 19.80637473935061, "percentage": 99.03, "elapsed_time": "8:12:27", "remaining_time": "0:04:48", "throughput": 2612.95, "total_tokens": 77207136} +{"current_steps": 132985, "total_steps": 134280, "loss": 0.7742, "lr": 8.511816449186526e-06, "epoch": 19.80711945189157, "percentage": 99.04, "elapsed_time": "8:12:28", "remaining_time": "0:04:47", "throughput": 2612.95, "total_tokens": 77210112} +{"current_steps": 132990, "total_steps": 134280, "loss": 0.7891, "lr": 8.446271698504537e-06, "epoch": 19.80786416443253, "percentage": 99.04, "elapsed_time": "8:12:30", "remaining_time": "0:04:46", "throughput": 2612.96, "total_tokens": 77213088} +{"current_steps": 132995, "total_steps": 134280, "loss": 0.8008, "lr": 8.380980214883204e-06, "epoch": 19.808608876973487, "percentage": 99.04, "elapsed_time": "8:12:31", "remaining_time": "0:04:45", "throughput": 2612.96, "total_tokens": 77215968} +{"current_steps": 133000, "total_steps": 134280, "loss": 0.8189, "lr": 8.315941999429977e-06, "epoch": 19.809353589514448, "percentage": 99.05, "elapsed_time": "8:12:32", "remaining_time": "0:04:44", "throughput": 2612.97, "total_tokens": 77218912} +{"current_steps": 133005, "total_steps": 134280, "loss": 0.8062, "lr": 8.251157053242308e-06, "epoch": 19.81009830205541, "percentage": 99.05, "elapsed_time": "8:12:33", "remaining_time": "0:04:43", "throughput": 2612.97, "total_tokens": 77221760} +{"current_steps": 133010, "total_steps": 134280, "loss": 0.7995, "lr": 8.186625377414324e-06, "epoch": 19.810843014596365, "percentage": 99.05, "elapsed_time": "8:12:34", "remaining_time": "0:04:42", "throughput": 2612.98, "total_tokens": 77224672} +{"current_steps": 133015, "total_steps": 134280, "loss": 0.789, "lr": 8.12234697303682e-06, "epoch": 19.811587727137326, "percentage": 99.06, "elapsed_time": "8:12:35", "remaining_time": "0:04:41", "throughput": 2612.99, "total_tokens": 77227712} +{"current_steps": 133020, "total_steps": 134280, "loss": 0.8123, "lr": 8.058321841193927e-06, "epoch": 19.812332439678283, "percentage": 99.06, "elapsed_time": "8:12:36", "remaining_time": "0:04:39", "throughput": 2612.99, "total_tokens": 77230528} +{"current_steps": 133025, "total_steps": 134280, "loss": 0.8023, "lr": 7.994549982968113e-06, "epoch": 19.813077152219243, "percentage": 99.07, "elapsed_time": "8:12:37", "remaining_time": "0:04:38", "throughput": 2612.99, "total_tokens": 77233344} +{"current_steps": 133030, "total_steps": 134280, "loss": 0.8015, "lr": 7.931031399438514e-06, "epoch": 19.813821864760204, "percentage": 99.07, "elapsed_time": "8:12:38", "remaining_time": "0:04:37", "throughput": 2613.0, "total_tokens": 77236384} +{"current_steps": 133035, "total_steps": 134280, "loss": 0.8002, "lr": 7.867766091677608e-06, "epoch": 19.81456657730116, "percentage": 99.07, "elapsed_time": "8:12:39", "remaining_time": "0:04:36", "throughput": 2613.01, "total_tokens": 77239520} +{"current_steps": 133040, "total_steps": 134280, "loss": 0.7945, "lr": 7.804754060751206e-06, "epoch": 19.81531128984212, "percentage": 99.08, "elapsed_time": "8:12:40", "remaining_time": "0:04:35", "throughput": 2613.01, "total_tokens": 77242432} +{"current_steps": 133045, "total_steps": 134280, "loss": 0.7995, "lr": 7.741995307728455e-06, "epoch": 19.816056002383082, "percentage": 99.08, "elapsed_time": "8:12:41", "remaining_time": "0:04:34", "throughput": 2613.02, "total_tokens": 77245280} +{"current_steps": 133050, "total_steps": 134280, "loss": 0.8007, "lr": 7.679489833665176e-06, "epoch": 19.81680071492404, "percentage": 99.08, "elapsed_time": "8:12:42", "remaining_time": "0:04:33", "throughput": 2613.02, "total_tokens": 77248320} +{"current_steps": 133055, "total_steps": 134280, "loss": 0.7891, "lr": 7.6172376396205215e-06, "epoch": 19.817545427465, "percentage": 99.09, "elapsed_time": "8:12:43", "remaining_time": "0:04:32", "throughput": 2613.03, "total_tokens": 77251424} +{"current_steps": 133060, "total_steps": 134280, "loss": 0.8031, "lr": 7.555238726645319e-06, "epoch": 19.818290140005956, "percentage": 99.09, "elapsed_time": "8:12:44", "remaining_time": "0:04:31", "throughput": 2613.04, "total_tokens": 77254432} +{"current_steps": 133065, "total_steps": 134280, "loss": 0.7738, "lr": 7.493493095785397e-06, "epoch": 19.819034852546917, "percentage": 99.1, "elapsed_time": "8:12:46", "remaining_time": "0:04:29", "throughput": 2613.05, "total_tokens": 77257600} +{"current_steps": 133070, "total_steps": 134280, "loss": 0.7967, "lr": 7.432000748086586e-06, "epoch": 19.819779565087877, "percentage": 99.1, "elapsed_time": "8:12:47", "remaining_time": "0:04:28", "throughput": 2613.05, "total_tokens": 77260512} +{"current_steps": 133075, "total_steps": 134280, "loss": 0.7935, "lr": 7.370761684584726e-06, "epoch": 19.820524277628834, "percentage": 99.1, "elapsed_time": "8:12:48", "remaining_time": "0:04:27", "throughput": 2613.07, "total_tokens": 77263840} +{"current_steps": 133080, "total_steps": 134280, "loss": 0.7974, "lr": 7.309775906317317e-06, "epoch": 19.821268990169795, "percentage": 99.11, "elapsed_time": "8:12:49", "remaining_time": "0:04:26", "throughput": 2613.07, "total_tokens": 77266752} +{"current_steps": 133085, "total_steps": 134280, "loss": 0.8106, "lr": 7.249043414313538e-06, "epoch": 19.822013702710755, "percentage": 99.11, "elapsed_time": "8:12:50", "remaining_time": "0:04:25", "throughput": 2613.07, "total_tokens": 77269568} +{"current_steps": 133090, "total_steps": 134280, "loss": 0.8006, "lr": 7.188564209599235e-06, "epoch": 19.822758415251712, "percentage": 99.11, "elapsed_time": "8:12:51", "remaining_time": "0:04:24", "throughput": 2613.08, "total_tokens": 77272416} +{"current_steps": 133095, "total_steps": 134280, "loss": 0.784, "lr": 7.128338293195257e-06, "epoch": 19.823503127792673, "percentage": 99.12, "elapsed_time": "8:12:52", "remaining_time": "0:04:23", "throughput": 2613.07, "total_tokens": 77274912} +{"current_steps": 133100, "total_steps": 134280, "loss": 0.8047, "lr": 7.06836566612079e-06, "epoch": 19.82424784033363, "percentage": 99.12, "elapsed_time": "8:12:53", "remaining_time": "0:04:22", "throughput": 2613.07, "total_tokens": 77277632} +{"current_steps": 133105, "total_steps": 134280, "loss": 0.7671, "lr": 7.008646329386692e-06, "epoch": 19.82499255287459, "percentage": 99.12, "elapsed_time": "8:12:54", "remaining_time": "0:04:21", "throughput": 2613.08, "total_tokens": 77280864} +{"current_steps": 133110, "total_steps": 134280, "loss": 0.7903, "lr": 6.949180284005485e-06, "epoch": 19.82573726541555, "percentage": 99.13, "elapsed_time": "8:12:55", "remaining_time": "0:04:19", "throughput": 2613.09, "total_tokens": 77283680} +{"current_steps": 133115, "total_steps": 134280, "loss": 0.8127, "lr": 6.889967530978036e-06, "epoch": 19.826481977956508, "percentage": 99.13, "elapsed_time": "8:12:56", "remaining_time": "0:04:18", "throughput": 2613.09, "total_tokens": 77286752} +{"current_steps": 133120, "total_steps": 134280, "loss": 0.7749, "lr": 6.831008071306876e-06, "epoch": 19.82722669049747, "percentage": 99.14, "elapsed_time": "8:12:57", "remaining_time": "0:04:17", "throughput": 2613.1, "total_tokens": 77289632} +{"current_steps": 133125, "total_steps": 134280, "loss": 0.8339, "lr": 6.772301905987876e-06, "epoch": 19.827971403038426, "percentage": 99.14, "elapsed_time": "8:12:58", "remaining_time": "0:04:16", "throughput": 2613.1, "total_tokens": 77292512} +{"current_steps": 133130, "total_steps": 134280, "loss": 0.7903, "lr": 6.71384903601191e-06, "epoch": 19.828716115579386, "percentage": 99.14, "elapsed_time": "8:12:59", "remaining_time": "0:04:15", "throughput": 2613.1, "total_tokens": 77295232} +{"current_steps": 133135, "total_steps": 134280, "loss": 0.7957, "lr": 6.655649462366519e-06, "epoch": 19.829460828120347, "percentage": 99.15, "elapsed_time": "8:13:00", "remaining_time": "0:04:14", "throughput": 2613.11, "total_tokens": 77298112} +{"current_steps": 133140, "total_steps": 134280, "loss": 0.7986, "lr": 6.597703186035919e-06, "epoch": 19.830205540661304, "percentage": 99.15, "elapsed_time": "8:13:02", "remaining_time": "0:04:13", "throughput": 2613.12, "total_tokens": 77301248} +{"current_steps": 133145, "total_steps": 134280, "loss": 0.8137, "lr": 6.5400102079976595e-06, "epoch": 19.830950253202264, "percentage": 99.15, "elapsed_time": "8:13:03", "remaining_time": "0:04:12", "throughput": 2613.12, "total_tokens": 77304096} +{"current_steps": 133150, "total_steps": 134280, "loss": 0.7789, "lr": 6.482570529227627e-06, "epoch": 19.831694965743225, "percentage": 99.16, "elapsed_time": "8:13:04", "remaining_time": "0:04:11", "throughput": 2613.12, "total_tokens": 77306880} +{"current_steps": 133155, "total_steps": 134280, "loss": 0.7903, "lr": 6.425384150696711e-06, "epoch": 19.83243967828418, "percentage": 99.16, "elapsed_time": "8:13:05", "remaining_time": "0:04:09", "throughput": 2613.12, "total_tokens": 77309664} +{"current_steps": 133160, "total_steps": 134280, "loss": 0.7803, "lr": 6.368451073369141e-06, "epoch": 19.833184390825142, "percentage": 99.17, "elapsed_time": "8:13:06", "remaining_time": "0:04:08", "throughput": 2613.13, "total_tokens": 77312800} +{"current_steps": 133165, "total_steps": 134280, "loss": 0.7858, "lr": 6.311771298209145e-06, "epoch": 19.8339291033661, "percentage": 99.17, "elapsed_time": "8:13:07", "remaining_time": "0:04:07", "throughput": 2613.14, "total_tokens": 77315648} +{"current_steps": 133170, "total_steps": 134280, "loss": 0.7869, "lr": 6.255344826170961e-06, "epoch": 19.83467381590706, "percentage": 99.17, "elapsed_time": "8:13:08", "remaining_time": "0:04:06", "throughput": 2613.14, "total_tokens": 77318688} +{"current_steps": 133175, "total_steps": 134280, "loss": 0.8196, "lr": 6.1991716582104896e-06, "epoch": 19.83541852844802, "percentage": 99.18, "elapsed_time": "8:13:09", "remaining_time": "0:04:05", "throughput": 2613.15, "total_tokens": 77321472} +{"current_steps": 133180, "total_steps": 134280, "loss": 0.8144, "lr": 6.143251795276971e-06, "epoch": 19.836163240988977, "percentage": 99.18, "elapsed_time": "8:13:10", "remaining_time": "0:04:04", "throughput": 2613.15, "total_tokens": 77324384} +{"current_steps": 133185, "total_steps": 134280, "loss": 0.7957, "lr": 6.087585238312986e-06, "epoch": 19.836907953529938, "percentage": 99.18, "elapsed_time": "8:13:11", "remaining_time": "0:04:03", "throughput": 2613.15, "total_tokens": 77327264} +{"current_steps": 133190, "total_steps": 134280, "loss": 0.7954, "lr": 6.032171988261114e-06, "epoch": 19.8376526660709, "percentage": 99.19, "elapsed_time": "8:13:12", "remaining_time": "0:04:02", "throughput": 2613.16, "total_tokens": 77330272} +{"current_steps": 133195, "total_steps": 134280, "loss": 0.803, "lr": 5.977012046055607e-06, "epoch": 19.838397378611855, "percentage": 99.19, "elapsed_time": "8:13:13", "remaining_time": "0:04:01", "throughput": 2613.17, "total_tokens": 77333216} +{"current_steps": 133200, "total_steps": 134280, "loss": 0.8105, "lr": 5.9221054126290526e-06, "epoch": 19.839142091152816, "percentage": 99.2, "elapsed_time": "8:13:14", "remaining_time": "0:03:59", "throughput": 2613.17, "total_tokens": 77335840} +{"current_steps": 133205, "total_steps": 134280, "loss": 0.7732, "lr": 5.867452088910707e-06, "epoch": 19.839886803693773, "percentage": 99.2, "elapsed_time": "8:13:15", "remaining_time": "0:03:58", "throughput": 2613.17, "total_tokens": 77338528} +{"current_steps": 133210, "total_steps": 134280, "loss": 0.8061, "lr": 5.813052075821501e-06, "epoch": 19.840631516234733, "percentage": 99.2, "elapsed_time": "8:13:16", "remaining_time": "0:03:57", "throughput": 2613.17, "total_tokens": 77341472} +{"current_steps": 133215, "total_steps": 134280, "loss": 0.8085, "lr": 5.7589053742806985e-06, "epoch": 19.841376228775694, "percentage": 99.21, "elapsed_time": "8:13:17", "remaining_time": "0:03:56", "throughput": 2613.17, "total_tokens": 77344320} +{"current_steps": 133220, "total_steps": 134280, "loss": 0.7971, "lr": 5.705011985204233e-06, "epoch": 19.84212094131665, "percentage": 99.21, "elapsed_time": "8:13:18", "remaining_time": "0:03:55", "throughput": 2613.18, "total_tokens": 77347200} +{"current_steps": 133225, "total_steps": 134280, "loss": 0.7889, "lr": 5.651371909501379e-06, "epoch": 19.84286565385761, "percentage": 99.21, "elapsed_time": "8:13:19", "remaining_time": "0:03:54", "throughput": 2613.18, "total_tokens": 77349856} +{"current_steps": 133230, "total_steps": 134280, "loss": 0.801, "lr": 5.597985148079743e-06, "epoch": 19.843610366398572, "percentage": 99.22, "elapsed_time": "8:13:20", "remaining_time": "0:03:53", "throughput": 2613.18, "total_tokens": 77352480} +{"current_steps": 133235, "total_steps": 134280, "loss": 0.7975, "lr": 5.544851701841935e-06, "epoch": 19.84435507893953, "percentage": 99.22, "elapsed_time": "8:13:21", "remaining_time": "0:03:52", "throughput": 2613.18, "total_tokens": 77355168} +{"current_steps": 133240, "total_steps": 134280, "loss": 0.7769, "lr": 5.491971571682241e-06, "epoch": 19.84509979148049, "percentage": 99.23, "elapsed_time": "8:13:23", "remaining_time": "0:03:51", "throughput": 2613.18, "total_tokens": 77358240} +{"current_steps": 133245, "total_steps": 134280, "loss": 0.802, "lr": 5.439344758496611e-06, "epoch": 19.845844504021446, "percentage": 99.23, "elapsed_time": "8:13:24", "remaining_time": "0:03:49", "throughput": 2613.19, "total_tokens": 77361120} +{"current_steps": 133250, "total_steps": 134280, "loss": 0.7851, "lr": 5.386971263172668e-06, "epoch": 19.846589216562407, "percentage": 99.23, "elapsed_time": "8:13:25", "remaining_time": "0:03:48", "throughput": 2613.19, "total_tokens": 77364000} +{"current_steps": 133255, "total_steps": 134280, "loss": 0.8137, "lr": 5.334851086596371e-06, "epoch": 19.847333929103367, "percentage": 99.24, "elapsed_time": "8:13:26", "remaining_time": "0:03:47", "throughput": 2613.19, "total_tokens": 77366752} +{"current_steps": 133260, "total_steps": 134280, "loss": 0.8088, "lr": 5.282984229648679e-06, "epoch": 19.848078641644324, "percentage": 99.24, "elapsed_time": "8:13:27", "remaining_time": "0:03:46", "throughput": 2613.2, "total_tokens": 77369728} +{"current_steps": 133265, "total_steps": 134280, "loss": 0.8094, "lr": 5.231370693203896e-06, "epoch": 19.848823354185285, "percentage": 99.24, "elapsed_time": "8:13:28", "remaining_time": "0:03:45", "throughput": 2613.21, "total_tokens": 77372896} +{"current_steps": 133270, "total_steps": 134280, "loss": 0.7803, "lr": 5.180010478136321e-06, "epoch": 19.849568066726242, "percentage": 99.25, "elapsed_time": "8:13:29", "remaining_time": "0:03:44", "throughput": 2613.22, "total_tokens": 77375840} +{"current_steps": 133275, "total_steps": 134280, "loss": 0.7895, "lr": 5.128903585311927e-06, "epoch": 19.850312779267203, "percentage": 99.25, "elapsed_time": "8:13:30", "remaining_time": "0:03:43", "throughput": 2613.22, "total_tokens": 77378688} +{"current_steps": 133280, "total_steps": 134280, "loss": 0.8288, "lr": 5.078050015595026e-06, "epoch": 19.851057491808163, "percentage": 99.26, "elapsed_time": "8:13:31", "remaining_time": "0:03:42", "throughput": 2613.23, "total_tokens": 77381760} +{"current_steps": 133285, "total_steps": 134280, "loss": 0.7944, "lr": 5.027449769843262e-06, "epoch": 19.85180220434912, "percentage": 99.26, "elapsed_time": "8:13:32", "remaining_time": "0:03:41", "throughput": 2613.23, "total_tokens": 77384352} +{"current_steps": 133290, "total_steps": 134280, "loss": 0.8058, "lr": 4.977102848912617e-06, "epoch": 19.85254691689008, "percentage": 99.26, "elapsed_time": "8:13:33", "remaining_time": "0:03:39", "throughput": 2613.23, "total_tokens": 77387264} +{"current_steps": 133295, "total_steps": 134280, "loss": 0.7952, "lr": 4.92700925365408e-06, "epoch": 19.85329162943104, "percentage": 99.27, "elapsed_time": "8:13:34", "remaining_time": "0:03:38", "throughput": 2613.23, "total_tokens": 77389888} +{"current_steps": 133300, "total_steps": 134280, "loss": 0.8003, "lr": 4.8771689849136375e-06, "epoch": 19.854036341971998, "percentage": 99.27, "elapsed_time": "8:13:35", "remaining_time": "0:03:37", "throughput": 2613.24, "total_tokens": 77392928} +{"current_steps": 133305, "total_steps": 134280, "loss": 0.7923, "lr": 4.827582043532286e-06, "epoch": 19.85478105451296, "percentage": 99.27, "elapsed_time": "8:13:36", "remaining_time": "0:03:36", "throughput": 2613.25, "total_tokens": 77395936} +{"current_steps": 133310, "total_steps": 134280, "loss": 0.8104, "lr": 4.778248430349352e-06, "epoch": 19.855525767053916, "percentage": 99.28, "elapsed_time": "8:13:37", "remaining_time": "0:03:35", "throughput": 2613.25, "total_tokens": 77398848} +{"current_steps": 133315, "total_steps": 134280, "loss": 0.7907, "lr": 4.729168146197504e-06, "epoch": 19.856270479594876, "percentage": 99.28, "elapsed_time": "8:13:38", "remaining_time": "0:03:34", "throughput": 2613.25, "total_tokens": 77401664} +{"current_steps": 133320, "total_steps": 134280, "loss": 0.8159, "lr": 4.680341191904413e-06, "epoch": 19.857015192135837, "percentage": 99.29, "elapsed_time": "8:13:39", "remaining_time": "0:03:33", "throughput": 2613.26, "total_tokens": 77404608} +{"current_steps": 133325, "total_steps": 134280, "loss": 0.7935, "lr": 4.631767568297751e-06, "epoch": 19.857759904676794, "percentage": 99.29, "elapsed_time": "8:13:41", "remaining_time": "0:03:32", "throughput": 2613.26, "total_tokens": 77407552} +{"current_steps": 133330, "total_steps": 134280, "loss": 0.7761, "lr": 4.5834472761968615e-06, "epoch": 19.858504617217754, "percentage": 99.29, "elapsed_time": "8:13:42", "remaining_time": "0:03:31", "throughput": 2613.27, "total_tokens": 77410624} +{"current_steps": 133335, "total_steps": 134280, "loss": 0.8052, "lr": 4.535380316417758e-06, "epoch": 19.859249329758715, "percentage": 99.3, "elapsed_time": "8:13:43", "remaining_time": "0:03:29", "throughput": 2613.27, "total_tokens": 77413344} +{"current_steps": 133340, "total_steps": 134280, "loss": 0.7839, "lr": 4.4875666897714605e-06, "epoch": 19.85999404229967, "percentage": 99.3, "elapsed_time": "8:13:44", "remaining_time": "0:03:28", "throughput": 2613.27, "total_tokens": 77415936} +{"current_steps": 133345, "total_steps": 134280, "loss": 0.7902, "lr": 4.440006397068985e-06, "epoch": 19.860738754840632, "percentage": 99.3, "elapsed_time": "8:13:45", "remaining_time": "0:03:27", "throughput": 2613.27, "total_tokens": 77418944} +{"current_steps": 133350, "total_steps": 134280, "loss": 0.7902, "lr": 4.392699439109693e-06, "epoch": 19.86148346738159, "percentage": 99.31, "elapsed_time": "8:13:46", "remaining_time": "0:03:26", "throughput": 2613.28, "total_tokens": 77422016} +{"current_steps": 133355, "total_steps": 134280, "loss": 0.7973, "lr": 4.345645816696275e-06, "epoch": 19.86222817992255, "percentage": 99.31, "elapsed_time": "8:13:47", "remaining_time": "0:03:25", "throughput": 2613.28, "total_tokens": 77424672} +{"current_steps": 133360, "total_steps": 134280, "loss": 0.7786, "lr": 4.298845530623096e-06, "epoch": 19.86297289246351, "percentage": 99.31, "elapsed_time": "8:13:48", "remaining_time": "0:03:24", "throughput": 2613.29, "total_tokens": 77427616} +{"current_steps": 133365, "total_steps": 134280, "loss": 0.7882, "lr": 4.25229858167786e-06, "epoch": 19.863717605004467, "percentage": 99.32, "elapsed_time": "8:13:49", "remaining_time": "0:03:23", "throughput": 2613.29, "total_tokens": 77430368} +{"current_steps": 133370, "total_steps": 134280, "loss": 0.7972, "lr": 4.206004970649934e-06, "epoch": 19.864462317545428, "percentage": 99.32, "elapsed_time": "8:13:50", "remaining_time": "0:03:22", "throughput": 2613.29, "total_tokens": 77433312} +{"current_steps": 133375, "total_steps": 134280, "loss": 0.7941, "lr": 4.159964698320362e-06, "epoch": 19.86520703008639, "percentage": 99.33, "elapsed_time": "8:13:51", "remaining_time": "0:03:21", "throughput": 2613.3, "total_tokens": 77436128} +{"current_steps": 133380, "total_steps": 134280, "loss": 0.8006, "lr": 4.1141777654685185e-06, "epoch": 19.865951742627345, "percentage": 99.33, "elapsed_time": "8:13:52", "remaining_time": "0:03:19", "throughput": 2613.3, "total_tokens": 77438944} +{"current_steps": 133385, "total_steps": 134280, "loss": 0.7883, "lr": 4.068644172865454e-06, "epoch": 19.866696455168306, "percentage": 99.33, "elapsed_time": "8:13:53", "remaining_time": "0:03:18", "throughput": 2613.31, "total_tokens": 77441824} +{"current_steps": 133390, "total_steps": 134280, "loss": 0.7825, "lr": 4.023363921280554e-06, "epoch": 19.867441167709263, "percentage": 99.34, "elapsed_time": "8:13:54", "remaining_time": "0:03:17", "throughput": 2613.31, "total_tokens": 77444576} +{"current_steps": 133395, "total_steps": 134280, "loss": 0.7748, "lr": 3.978337011479871e-06, "epoch": 19.868185880250223, "percentage": 99.34, "elapsed_time": "8:13:55", "remaining_time": "0:03:16", "throughput": 2613.32, "total_tokens": 77447872} +{"current_steps": 133400, "total_steps": 134280, "loss": 0.8046, "lr": 3.933563444224464e-06, "epoch": 19.868930592791184, "percentage": 99.34, "elapsed_time": "8:13:56", "remaining_time": "0:03:15", "throughput": 2613.33, "total_tokens": 77450976} +{"current_steps": 133405, "total_steps": 134280, "loss": 0.8025, "lr": 3.889043220270394e-06, "epoch": 19.86967530533214, "percentage": 99.35, "elapsed_time": "8:13:57", "remaining_time": "0:03:14", "throughput": 2613.33, "total_tokens": 77453856} +{"current_steps": 133410, "total_steps": 134280, "loss": 0.7879, "lr": 3.8447763403703924e-06, "epoch": 19.8704200178731, "percentage": 99.35, "elapsed_time": "8:13:59", "remaining_time": "0:03:13", "throughput": 2613.34, "total_tokens": 77456736} +{"current_steps": 133415, "total_steps": 134280, "loss": 0.8064, "lr": 3.80076280527053e-06, "epoch": 19.87116473041406, "percentage": 99.36, "elapsed_time": "8:14:00", "remaining_time": "0:03:12", "throughput": 2613.34, "total_tokens": 77459488} +{"current_steps": 133420, "total_steps": 134280, "loss": 0.7985, "lr": 3.75700261571521e-06, "epoch": 19.87190944295502, "percentage": 99.36, "elapsed_time": "8:14:01", "remaining_time": "0:03:11", "throughput": 2613.34, "total_tokens": 77462464} +{"current_steps": 133425, "total_steps": 134280, "loss": 0.783, "lr": 3.713495772443842e-06, "epoch": 19.87265415549598, "percentage": 99.36, "elapsed_time": "8:14:02", "remaining_time": "0:03:09", "throughput": 2613.35, "total_tokens": 77465280} +{"current_steps": 133430, "total_steps": 134280, "loss": 0.8052, "lr": 3.670242276190838e-06, "epoch": 19.873398868036936, "percentage": 99.37, "elapsed_time": "8:14:03", "remaining_time": "0:03:08", "throughput": 2613.35, "total_tokens": 77467936} +{"current_steps": 133435, "total_steps": 134280, "loss": 0.7802, "lr": 3.6272421276889455e-06, "epoch": 19.874143580577897, "percentage": 99.37, "elapsed_time": "8:14:04", "remaining_time": "0:03:07", "throughput": 2613.35, "total_tokens": 77470816} +{"current_steps": 133440, "total_steps": 134280, "loss": 0.8064, "lr": 3.5844953276609193e-06, "epoch": 19.874888293118858, "percentage": 99.37, "elapsed_time": "8:14:05", "remaining_time": "0:03:06", "throughput": 2613.35, "total_tokens": 77473472} +{"current_steps": 133445, "total_steps": 134280, "loss": 0.8578, "lr": 3.5420018768328453e-06, "epoch": 19.875633005659815, "percentage": 99.38, "elapsed_time": "8:14:06", "remaining_time": "0:03:05", "throughput": 2613.36, "total_tokens": 77476864} +{"current_steps": 133450, "total_steps": 134280, "loss": 0.8129, "lr": 3.4997617759208174e-06, "epoch": 19.876377718200775, "percentage": 99.38, "elapsed_time": "8:14:07", "remaining_time": "0:03:04", "throughput": 2613.37, "total_tokens": 77479744} +{"current_steps": 133455, "total_steps": 134280, "loss": 0.8076, "lr": 3.4577750256392648e-06, "epoch": 19.877122430741732, "percentage": 99.39, "elapsed_time": "8:14:08", "remaining_time": "0:03:03", "throughput": 2613.37, "total_tokens": 77482400} +{"current_steps": 133460, "total_steps": 134280, "loss": 0.7845, "lr": 3.4160416266959536e-06, "epoch": 19.877867143282693, "percentage": 99.39, "elapsed_time": "8:14:09", "remaining_time": "0:03:02", "throughput": 2613.38, "total_tokens": 77485600} +{"current_steps": 133465, "total_steps": 134280, "loss": 0.792, "lr": 3.3745615797969863e-06, "epoch": 19.878611855823653, "percentage": 99.39, "elapsed_time": "8:14:10", "remaining_time": "0:03:01", "throughput": 2613.38, "total_tokens": 77488544} +{"current_steps": 133470, "total_steps": 134280, "loss": 0.8049, "lr": 3.333334885641803e-06, "epoch": 19.87935656836461, "percentage": 99.4, "elapsed_time": "8:14:11", "remaining_time": "0:02:59", "throughput": 2613.39, "total_tokens": 77491360} +{"current_steps": 133475, "total_steps": 134280, "loss": 0.8291, "lr": 3.2923615449298447e-06, "epoch": 19.88010128090557, "percentage": 99.4, "elapsed_time": "8:14:12", "remaining_time": "0:02:58", "throughput": 2613.39, "total_tokens": 77494112} +{"current_steps": 133480, "total_steps": 134280, "loss": 0.8075, "lr": 3.2516415583505595e-06, "epoch": 19.88084599344653, "percentage": 99.4, "elapsed_time": "8:14:13", "remaining_time": "0:02:57", "throughput": 2613.39, "total_tokens": 77497120} +{"current_steps": 133485, "total_steps": 134280, "loss": 0.804, "lr": 3.211174926591731e-06, "epoch": 19.881590705987488, "percentage": 99.41, "elapsed_time": "8:14:14", "remaining_time": "0:02:56", "throughput": 2613.4, "total_tokens": 77500000} +{"current_steps": 133490, "total_steps": 134280, "loss": 0.7872, "lr": 3.1709616503394766e-06, "epoch": 19.88233541852845, "percentage": 99.41, "elapsed_time": "8:14:15", "remaining_time": "0:02:55", "throughput": 2613.4, "total_tokens": 77502688} +{"current_steps": 133495, "total_steps": 134280, "loss": 0.7859, "lr": 3.1310017302715875e-06, "epoch": 19.883080131069406, "percentage": 99.42, "elapsed_time": "8:14:16", "remaining_time": "0:02:54", "throughput": 2613.4, "total_tokens": 77505312} +{"current_steps": 133500, "total_steps": 134280, "loss": 0.7942, "lr": 3.0912951670625245e-06, "epoch": 19.883824843610366, "percentage": 99.42, "elapsed_time": "8:14:18", "remaining_time": "0:02:53", "throughput": 2613.4, "total_tokens": 77508352} +{"current_steps": 133505, "total_steps": 134280, "loss": 0.7944, "lr": 3.051841961385082e-06, "epoch": 19.884569556151327, "percentage": 99.42, "elapsed_time": "8:14:19", "remaining_time": "0:02:52", "throughput": 2613.42, "total_tokens": 77511584} +{"current_steps": 133510, "total_steps": 134280, "loss": 0.8159, "lr": 3.0126421139037295e-06, "epoch": 19.885314268692284, "percentage": 99.43, "elapsed_time": "8:14:20", "remaining_time": "0:02:51", "throughput": 2613.42, "total_tokens": 77514592} +{"current_steps": 133515, "total_steps": 134280, "loss": 0.803, "lr": 2.9736956252812697e-06, "epoch": 19.886058981233244, "percentage": 99.43, "elapsed_time": "8:14:21", "remaining_time": "0:02:49", "throughput": 2613.42, "total_tokens": 77517408} +{"current_steps": 133520, "total_steps": 134280, "loss": 0.8085, "lr": 2.9350024961755095e-06, "epoch": 19.886803693774205, "percentage": 99.43, "elapsed_time": "8:14:22", "remaining_time": "0:02:48", "throughput": 2613.43, "total_tokens": 77520256} +{"current_steps": 133525, "total_steps": 134280, "loss": 0.7915, "lr": 2.8965627272425906e-06, "epoch": 19.88754840631516, "percentage": 99.44, "elapsed_time": "8:14:23", "remaining_time": "0:02:47", "throughput": 2613.44, "total_tokens": 77523360} +{"current_steps": 133530, "total_steps": 134280, "loss": 0.7953, "lr": 2.8583763191269984e-06, "epoch": 19.888293118856122, "percentage": 99.44, "elapsed_time": "8:14:24", "remaining_time": "0:02:46", "throughput": 2613.44, "total_tokens": 77526016} +{"current_steps": 133535, "total_steps": 134280, "loss": 0.7945, "lr": 2.8204432724798776e-06, "epoch": 19.88903783139708, "percentage": 99.45, "elapsed_time": "8:14:25", "remaining_time": "0:02:45", "throughput": 2613.45, "total_tokens": 77529248} +{"current_steps": 133540, "total_steps": 134280, "loss": 0.7898, "lr": 2.7827635879357215e-06, "epoch": 19.88978254393804, "percentage": 99.45, "elapsed_time": "8:14:26", "remaining_time": "0:02:44", "throughput": 2613.45, "total_tokens": 77532096} +{"current_steps": 133545, "total_steps": 134280, "loss": 0.7835, "lr": 2.7453372661373486e-06, "epoch": 19.890527256479, "percentage": 99.45, "elapsed_time": "8:14:27", "remaining_time": "0:02:43", "throughput": 2613.45, "total_tokens": 77534720} +{"current_steps": 133550, "total_steps": 134280, "loss": 0.7729, "lr": 2.7081643077125906e-06, "epoch": 19.891271969019957, "percentage": 99.46, "elapsed_time": "8:14:28", "remaining_time": "0:02:42", "throughput": 2613.45, "total_tokens": 77537536} +{"current_steps": 133555, "total_steps": 134280, "loss": 0.7942, "lr": 2.671244713289278e-06, "epoch": 19.892016681560918, "percentage": 99.46, "elapsed_time": "8:14:29", "remaining_time": "0:02:41", "throughput": 2613.46, "total_tokens": 77540608} +{"current_steps": 133560, "total_steps": 134280, "loss": 0.7992, "lr": 2.634578483495242e-06, "epoch": 19.89276139410188, "percentage": 99.46, "elapsed_time": "8:14:30", "remaining_time": "0:02:39", "throughput": 2613.46, "total_tokens": 77543360} +{"current_steps": 133565, "total_steps": 134280, "loss": 0.7803, "lr": 2.598165618946657e-06, "epoch": 19.893506106642835, "percentage": 99.47, "elapsed_time": "8:14:31", "remaining_time": "0:02:38", "throughput": 2613.47, "total_tokens": 77546464} +{"current_steps": 133570, "total_steps": 134280, "loss": 0.8122, "lr": 2.562006120258031e-06, "epoch": 19.894250819183796, "percentage": 99.47, "elapsed_time": "8:14:32", "remaining_time": "0:02:37", "throughput": 2613.47, "total_tokens": 77549376} +{"current_steps": 133575, "total_steps": 134280, "loss": 0.7947, "lr": 2.5260999880422074e-06, "epoch": 19.894995531724753, "percentage": 99.47, "elapsed_time": "8:14:33", "remaining_time": "0:02:36", "throughput": 2613.47, "total_tokens": 77552128} +{"current_steps": 133580, "total_steps": 134280, "loss": 0.8036, "lr": 2.4904472229053676e-06, "epoch": 19.895740244265713, "percentage": 99.48, "elapsed_time": "8:14:35", "remaining_time": "0:02:35", "throughput": 2613.48, "total_tokens": 77555104} +{"current_steps": 133585, "total_steps": 134280, "loss": 0.7935, "lr": 2.4550478254503627e-06, "epoch": 19.896484956806674, "percentage": 99.48, "elapsed_time": "8:14:36", "remaining_time": "0:02:34", "throughput": 2613.48, "total_tokens": 77557920} +{"current_steps": 133590, "total_steps": 134280, "loss": 0.7992, "lr": 2.4199017962750478e-06, "epoch": 19.89722966934763, "percentage": 99.49, "elapsed_time": "8:14:37", "remaining_time": "0:02:33", "throughput": 2613.49, "total_tokens": 77560992} +{"current_steps": 133595, "total_steps": 134280, "loss": 0.8029, "lr": 2.385009135970617e-06, "epoch": 19.89797438188859, "percentage": 99.49, "elapsed_time": "8:14:38", "remaining_time": "0:02:32", "throughput": 2613.5, "total_tokens": 77564032} +{"current_steps": 133600, "total_steps": 134280, "loss": 0.7891, "lr": 2.350369845129929e-06, "epoch": 19.898719094429552, "percentage": 99.49, "elapsed_time": "8:14:39", "remaining_time": "0:02:31", "throughput": 2613.51, "total_tokens": 77567296} +{"current_steps": 133605, "total_steps": 134280, "loss": 0.7932, "lr": 2.3159839243358516e-06, "epoch": 19.89946380697051, "percentage": 99.5, "elapsed_time": "8:14:40", "remaining_time": "0:02:29", "throughput": 2613.51, "total_tokens": 77570112} +{"current_steps": 133610, "total_steps": 134280, "loss": 0.8027, "lr": 2.2818513741712507e-06, "epoch": 19.90020851951147, "percentage": 99.5, "elapsed_time": "8:14:41", "remaining_time": "0:02:28", "throughput": 2613.52, "total_tokens": 77572928} +{"current_steps": 133615, "total_steps": 134280, "loss": 0.8028, "lr": 2.247972195210668e-06, "epoch": 19.900953232052427, "percentage": 99.5, "elapsed_time": "8:14:42", "remaining_time": "0:02:27", "throughput": 2613.52, "total_tokens": 77575520} +{"current_steps": 133620, "total_steps": 134280, "loss": 0.7899, "lr": 2.2143463880286427e-06, "epoch": 19.901697944593387, "percentage": 99.51, "elapsed_time": "8:14:43", "remaining_time": "0:02:26", "throughput": 2613.52, "total_tokens": 77578272} +{"current_steps": 133625, "total_steps": 134280, "loss": 0.8015, "lr": 2.1809739531913894e-06, "epoch": 19.902442657134348, "percentage": 99.51, "elapsed_time": "8:14:44", "remaining_time": "0:02:25", "throughput": 2613.53, "total_tokens": 77581344} +{"current_steps": 133630, "total_steps": 134280, "loss": 0.8172, "lr": 2.1478548912634566e-06, "epoch": 19.903187369675305, "percentage": 99.52, "elapsed_time": "8:14:45", "remaining_time": "0:02:24", "throughput": 2613.53, "total_tokens": 77584352} +{"current_steps": 133635, "total_steps": 134280, "loss": 0.8096, "lr": 2.114989202806061e-06, "epoch": 19.903932082216265, "percentage": 99.52, "elapsed_time": "8:14:46", "remaining_time": "0:02:23", "throughput": 2613.54, "total_tokens": 77587264} +{"current_steps": 133640, "total_steps": 134280, "loss": 0.79, "lr": 2.0823768883704297e-06, "epoch": 19.904676794757222, "percentage": 99.52, "elapsed_time": "8:14:47", "remaining_time": "0:02:22", "throughput": 2613.54, "total_tokens": 77590112} +{"current_steps": 133645, "total_steps": 134280, "loss": 0.7912, "lr": 2.050017948511118e-06, "epoch": 19.905421507298183, "percentage": 99.53, "elapsed_time": "8:14:48", "remaining_time": "0:02:21", "throughput": 2613.54, "total_tokens": 77592800} +{"current_steps": 133650, "total_steps": 134280, "loss": 0.7753, "lr": 2.017912383772691e-06, "epoch": 19.906166219839143, "percentage": 99.53, "elapsed_time": "8:14:49", "remaining_time": "0:02:19", "throughput": 2613.55, "total_tokens": 77595840} +{"current_steps": 133655, "total_steps": 134280, "loss": 0.794, "lr": 1.9860601946997125e-06, "epoch": 19.9069109323801, "percentage": 99.53, "elapsed_time": "8:14:50", "remaining_time": "0:02:18", "throughput": 2613.55, "total_tokens": 77598752} +{"current_steps": 133660, "total_steps": 134280, "loss": 0.7807, "lr": 1.9544613818284207e-06, "epoch": 19.90765564492106, "percentage": 99.54, "elapsed_time": "8:14:51", "remaining_time": "0:02:17", "throughput": 2613.56, "total_tokens": 77601632} +{"current_steps": 133665, "total_steps": 134280, "loss": 0.8026, "lr": 1.9231159456917222e-06, "epoch": 19.90840035746202, "percentage": 99.54, "elapsed_time": "8:14:52", "remaining_time": "0:02:16", "throughput": 2613.56, "total_tokens": 77604320} +{"current_steps": 133670, "total_steps": 134280, "loss": 0.8069, "lr": 1.8920238868225248e-06, "epoch": 19.909145070002978, "percentage": 99.55, "elapsed_time": "8:14:54", "remaining_time": "0:02:15", "throughput": 2613.56, "total_tokens": 77607040} +{"current_steps": 133675, "total_steps": 134280, "loss": 0.8105, "lr": 1.8611852057437427e-06, "epoch": 19.90988978254394, "percentage": 99.55, "elapsed_time": "8:14:55", "remaining_time": "0:02:14", "throughput": 2613.56, "total_tokens": 77609856} +{"current_steps": 133680, "total_steps": 134280, "loss": 0.8026, "lr": 1.8305999029766262e-06, "epoch": 19.910634495084896, "percentage": 99.55, "elapsed_time": "8:14:56", "remaining_time": "0:02:13", "throughput": 2613.56, "total_tokens": 77612608} +{"current_steps": 133685, "total_steps": 134280, "loss": 0.8042, "lr": 1.8002679790374286e-06, "epoch": 19.911379207625856, "percentage": 99.56, "elapsed_time": "8:14:57", "remaining_time": "0:02:12", "throughput": 2613.57, "total_tokens": 77615584} +{"current_steps": 133690, "total_steps": 134280, "loss": 0.8014, "lr": 1.7701894344390733e-06, "epoch": 19.912123920166817, "percentage": 99.56, "elapsed_time": "8:14:58", "remaining_time": "0:02:11", "throughput": 2613.57, "total_tokens": 77618272} +{"current_steps": 133695, "total_steps": 134280, "loss": 0.8065, "lr": 1.7403642696911524e-06, "epoch": 19.912868632707774, "percentage": 99.56, "elapsed_time": "8:14:59", "remaining_time": "0:02:09", "throughput": 2613.58, "total_tokens": 77621504} +{"current_steps": 133700, "total_steps": 134280, "loss": 0.7958, "lr": 1.7107924852949317e-06, "epoch": 19.913613345248734, "percentage": 99.57, "elapsed_time": "8:15:00", "remaining_time": "0:02:08", "throughput": 2613.58, "total_tokens": 77624064} +{"current_steps": 133705, "total_steps": 134280, "loss": 0.7867, "lr": 1.681474081751677e-06, "epoch": 19.914358057789695, "percentage": 99.57, "elapsed_time": "8:15:01", "remaining_time": "0:02:07", "throughput": 2613.59, "total_tokens": 77627168} +{"current_steps": 133710, "total_steps": 134280, "loss": 0.8044, "lr": 1.6524090595576579e-06, "epoch": 19.915102770330652, "percentage": 99.58, "elapsed_time": "8:15:02", "remaining_time": "0:02:06", "throughput": 2613.59, "total_tokens": 77630048} +{"current_steps": 133715, "total_steps": 134280, "loss": 0.8056, "lr": 1.6235974192008174e-06, "epoch": 19.915847482871612, "percentage": 99.58, "elapsed_time": "8:15:03", "remaining_time": "0:02:05", "throughput": 2613.59, "total_tokens": 77632768} +{"current_steps": 133720, "total_steps": 134280, "loss": 0.8162, "lr": 1.5950391611707636e-06, "epoch": 19.91659219541257, "percentage": 99.58, "elapsed_time": "8:15:04", "remaining_time": "0:02:04", "throughput": 2613.6, "total_tokens": 77635968} +{"current_steps": 133725, "total_steps": 134280, "loss": 0.799, "lr": 1.5667342859487787e-06, "epoch": 19.91733690795353, "percentage": 99.59, "elapsed_time": "8:15:05", "remaining_time": "0:02:03", "throughput": 2613.6, "total_tokens": 77638752} +{"current_steps": 133730, "total_steps": 134280, "loss": 0.804, "lr": 1.5386827940128133e-06, "epoch": 19.91808162049449, "percentage": 99.59, "elapsed_time": "8:15:06", "remaining_time": "0:02:02", "throughput": 2613.61, "total_tokens": 77641728} +{"current_steps": 133735, "total_steps": 134280, "loss": 0.794, "lr": 1.5108846858358227e-06, "epoch": 19.918826333035447, "percentage": 99.59, "elapsed_time": "8:15:07", "remaining_time": "0:02:01", "throughput": 2613.62, "total_tokens": 77644672} +{"current_steps": 133740, "total_steps": 134280, "loss": 0.7974, "lr": 1.4833399618907617e-06, "epoch": 19.919571045576408, "percentage": 99.6, "elapsed_time": "8:15:08", "remaining_time": "0:01:59", "throughput": 2613.63, "total_tokens": 77647808} +{"current_steps": 133745, "total_steps": 134280, "loss": 0.7914, "lr": 1.4560486226389279e-06, "epoch": 19.92031575811737, "percentage": 99.6, "elapsed_time": "8:15:09", "remaining_time": "0:01:58", "throughput": 2613.64, "total_tokens": 77650848} +{"current_steps": 133750, "total_steps": 134280, "loss": 0.7939, "lr": 1.4290106685449498e-06, "epoch": 19.921060470658325, "percentage": 99.61, "elapsed_time": "8:15:10", "remaining_time": "0:01:57", "throughput": 2613.64, "total_tokens": 77653664} +{"current_steps": 133755, "total_steps": 134280, "loss": 0.8008, "lr": 1.4022261000617986e-06, "epoch": 19.921805183199286, "percentage": 99.61, "elapsed_time": "8:15:11", "remaining_time": "0:01:56", "throughput": 2613.64, "total_tokens": 77656352} +{"current_steps": 133760, "total_steps": 134280, "loss": 0.8131, "lr": 1.3756949176457755e-06, "epoch": 19.922549895740243, "percentage": 99.61, "elapsed_time": "8:15:13", "remaining_time": "0:01:55", "throughput": 2613.64, "total_tokens": 77659264} +{"current_steps": 133765, "total_steps": 134280, "loss": 0.7999, "lr": 1.3494171217431904e-06, "epoch": 19.923294608281203, "percentage": 99.62, "elapsed_time": "8:15:14", "remaining_time": "0:01:54", "throughput": 2613.65, "total_tokens": 77662144} +{"current_steps": 133770, "total_steps": 134280, "loss": 0.797, "lr": 1.3233927127986876e-06, "epoch": 19.924039320822164, "percentage": 99.62, "elapsed_time": "8:15:15", "remaining_time": "0:01:53", "throughput": 2613.65, "total_tokens": 77664960} +{"current_steps": 133775, "total_steps": 134280, "loss": 0.7787, "lr": 1.2976216912519155e-06, "epoch": 19.92478403336312, "percentage": 99.62, "elapsed_time": "8:15:16", "remaining_time": "0:01:52", "throughput": 2613.66, "total_tokens": 77667936} +{"current_steps": 133780, "total_steps": 134280, "loss": 0.7894, "lr": 1.272104057535861e-06, "epoch": 19.92552874590408, "percentage": 99.63, "elapsed_time": "8:15:17", "remaining_time": "0:01:51", "throughput": 2613.66, "total_tokens": 77670816} +{"current_steps": 133785, "total_steps": 134280, "loss": 0.7892, "lr": 1.2468398120851764e-06, "epoch": 19.92627345844504, "percentage": 99.63, "elapsed_time": "8:15:18", "remaining_time": "0:01:49", "throughput": 2613.66, "total_tokens": 77673696} +{"current_steps": 133790, "total_steps": 134280, "loss": 0.7809, "lr": 1.221828955324522e-06, "epoch": 19.927018170986, "percentage": 99.64, "elapsed_time": "8:15:19", "remaining_time": "0:01:48", "throughput": 2613.67, "total_tokens": 77676608} +{"current_steps": 133795, "total_steps": 134280, "loss": 0.8027, "lr": 1.1970714876768928e-06, "epoch": 19.92776288352696, "percentage": 99.64, "elapsed_time": "8:15:20", "remaining_time": "0:01:47", "throughput": 2613.67, "total_tokens": 77679392} +{"current_steps": 133800, "total_steps": 134280, "loss": 0.7993, "lr": 1.172567409561953e-06, "epoch": 19.928507596067917, "percentage": 99.64, "elapsed_time": "8:15:21", "remaining_time": "0:01:46", "throughput": 2613.67, "total_tokens": 77682176} +{"current_steps": 133805, "total_steps": 134280, "loss": 0.7929, "lr": 1.1483167213910405e-06, "epoch": 19.929252308608877, "percentage": 99.65, "elapsed_time": "8:15:22", "remaining_time": "0:01:45", "throughput": 2613.67, "total_tokens": 77684736} +{"current_steps": 133810, "total_steps": 134280, "loss": 0.7978, "lr": 1.1243194235754926e-06, "epoch": 19.929997021149838, "percentage": 99.65, "elapsed_time": "8:15:23", "remaining_time": "0:01:44", "throughput": 2613.67, "total_tokens": 77687584} +{"current_steps": 133815, "total_steps": 134280, "loss": 0.8087, "lr": 1.100575516519986e-06, "epoch": 19.930741733690795, "percentage": 99.65, "elapsed_time": "8:15:24", "remaining_time": "0:01:43", "throughput": 2613.68, "total_tokens": 77690336} +{"current_steps": 133820, "total_steps": 134280, "loss": 0.7733, "lr": 1.077085000625866e-06, "epoch": 19.931486446231755, "percentage": 99.66, "elapsed_time": "8:15:25", "remaining_time": "0:01:42", "throughput": 2613.68, "total_tokens": 77693280} +{"current_steps": 133825, "total_steps": 134280, "loss": 0.7958, "lr": 1.0538478762911475e-06, "epoch": 19.932231158772712, "percentage": 99.66, "elapsed_time": "8:15:26", "remaining_time": "0:01:41", "throughput": 2613.68, "total_tokens": 77696096} +{"current_steps": 133830, "total_steps": 134280, "loss": 0.8035, "lr": 1.0308641439071841e-06, "epoch": 19.932975871313673, "percentage": 99.66, "elapsed_time": "8:15:27", "remaining_time": "0:01:39", "throughput": 2613.69, "total_tokens": 77698912} +{"current_steps": 133835, "total_steps": 134280, "loss": 0.7822, "lr": 1.008133803861999e-06, "epoch": 19.933720583854633, "percentage": 99.67, "elapsed_time": "8:15:28", "remaining_time": "0:01:38", "throughput": 2613.69, "total_tokens": 77701600} +{"current_steps": 133840, "total_steps": 134280, "loss": 0.8144, "lr": 9.856568565402845e-07, "epoch": 19.93446529639559, "percentage": 99.67, "elapsed_time": "8:15:29", "remaining_time": "0:01:37", "throughput": 2613.69, "total_tokens": 77704448} +{"current_steps": 133845, "total_steps": 134280, "loss": 0.7913, "lr": 9.634333023217366e-07, "epoch": 19.93521000893655, "percentage": 99.68, "elapsed_time": "8:15:30", "remaining_time": "0:01:36", "throughput": 2613.7, "total_tokens": 77707424} +{"current_steps": 133850, "total_steps": 134280, "loss": 0.7898, "lr": 9.414631415810559e-07, "epoch": 19.93595472147751, "percentage": 99.68, "elapsed_time": "8:15:31", "remaining_time": "0:01:35", "throughput": 2613.7, "total_tokens": 77710112} +{"current_steps": 133855, "total_steps": 134280, "loss": 0.8033, "lr": 9.197463746912771e-07, "epoch": 19.93669943401847, "percentage": 99.68, "elapsed_time": "8:15:32", "remaining_time": "0:01:34", "throughput": 2613.7, "total_tokens": 77712992} +{"current_steps": 133860, "total_steps": 134280, "loss": 0.7878, "lr": 8.982830020171084e-07, "epoch": 19.93744414655943, "percentage": 99.69, "elapsed_time": "8:15:34", "remaining_time": "0:01:33", "throughput": 2613.71, "total_tokens": 77715936} +{"current_steps": 133865, "total_steps": 134280, "loss": 0.7996, "lr": 8.770730239215929e-07, "epoch": 19.938188859100386, "percentage": 99.69, "elapsed_time": "8:15:35", "remaining_time": "0:01:32", "throughput": 2613.71, "total_tokens": 77718880} +{"current_steps": 133870, "total_steps": 134280, "loss": 0.8063, "lr": 8.561164407644428e-07, "epoch": 19.938933571641346, "percentage": 99.69, "elapsed_time": "8:15:36", "remaining_time": "0:01:31", "throughput": 2613.72, "total_tokens": 77721952} +{"current_steps": 133875, "total_steps": 134280, "loss": 0.7995, "lr": 8.35413252898709e-07, "epoch": 19.939678284182307, "percentage": 99.7, "elapsed_time": "8:15:37", "remaining_time": "0:01:29", "throughput": 2613.72, "total_tokens": 77724736} +{"current_steps": 133880, "total_steps": 134280, "loss": 0.8197, "lr": 8.149634606741119e-07, "epoch": 19.940422996723264, "percentage": 99.7, "elapsed_time": "8:15:38", "remaining_time": "0:01:28", "throughput": 2613.72, "total_tokens": 77727648} +{"current_steps": 133885, "total_steps": 134280, "loss": 0.7888, "lr": 7.947670644353754e-07, "epoch": 19.941167709264224, "percentage": 99.71, "elapsed_time": "8:15:39", "remaining_time": "0:01:27", "throughput": 2613.73, "total_tokens": 77730688} +{"current_steps": 133890, "total_steps": 134280, "loss": 0.7872, "lr": 7.748240645255589e-07, "epoch": 19.941912421805185, "percentage": 99.71, "elapsed_time": "8:15:40", "remaining_time": "0:01:26", "throughput": 2613.73, "total_tokens": 77733472} +{"current_steps": 133895, "total_steps": 134280, "loss": 0.7917, "lr": 7.551344612793942e-07, "epoch": 19.942657134346142, "percentage": 99.71, "elapsed_time": "8:15:41", "remaining_time": "0:01:25", "throughput": 2613.74, "total_tokens": 77736416} +{"current_steps": 133900, "total_steps": 134280, "loss": 0.8016, "lr": 7.356982550316137e-07, "epoch": 19.943401846887102, "percentage": 99.72, "elapsed_time": "8:15:42", "remaining_time": "0:01:24", "throughput": 2613.74, "total_tokens": 77739104} +{"current_steps": 133905, "total_steps": 134280, "loss": 0.7889, "lr": 7.165154461102885e-07, "epoch": 19.94414655942806, "percentage": 99.72, "elapsed_time": "8:15:43", "remaining_time": "0:01:23", "throughput": 2613.74, "total_tokens": 77741952} +{"current_steps": 133910, "total_steps": 134280, "loss": 0.7958, "lr": 6.975860348368278e-07, "epoch": 19.94489127196902, "percentage": 99.72, "elapsed_time": "8:15:44", "remaining_time": "0:01:22", "throughput": 2613.75, "total_tokens": 77744832} +{"current_steps": 133915, "total_steps": 134280, "loss": 0.8002, "lr": 6.789100215343069e-07, "epoch": 19.94563598450998, "percentage": 99.73, "elapsed_time": "8:15:45", "remaining_time": "0:01:21", "throughput": 2613.75, "total_tokens": 77747552} +{"current_steps": 133920, "total_steps": 134280, "loss": 0.8337, "lr": 6.604874065174737e-07, "epoch": 19.946380697050937, "percentage": 99.73, "elapsed_time": "8:15:46", "remaining_time": "0:01:19", "throughput": 2613.75, "total_tokens": 77750432} +{"current_steps": 133925, "total_steps": 134280, "loss": 0.8061, "lr": 6.423181900960805e-07, "epoch": 19.947125409591898, "percentage": 99.74, "elapsed_time": "8:15:47", "remaining_time": "0:01:18", "throughput": 2613.76, "total_tokens": 77753344} +{"current_steps": 133930, "total_steps": 134280, "loss": 0.7879, "lr": 6.244023725782144e-07, "epoch": 19.947870122132855, "percentage": 99.74, "elapsed_time": "8:15:48", "remaining_time": "0:01:17", "throughput": 2613.76, "total_tokens": 77756224} +{"current_steps": 133935, "total_steps": 134280, "loss": 0.775, "lr": 6.06739954266966e-07, "epoch": 19.948614834673815, "percentage": 99.74, "elapsed_time": "8:15:49", "remaining_time": "0:01:16", "throughput": 2613.76, "total_tokens": 77758944} +{"current_steps": 133940, "total_steps": 134280, "loss": 0.791, "lr": 5.893309354604304e-07, "epoch": 19.949359547214776, "percentage": 99.75, "elapsed_time": "8:15:50", "remaining_time": "0:01:15", "throughput": 2613.76, "total_tokens": 77761824} +{"current_steps": 133945, "total_steps": 134280, "loss": 0.7898, "lr": 5.721753164517063e-07, "epoch": 19.950104259755733, "percentage": 99.75, "elapsed_time": "8:15:51", "remaining_time": "0:01:14", "throughput": 2613.77, "total_tokens": 77764672} +{"current_steps": 133950, "total_steps": 134280, "loss": 0.7974, "lr": 5.55273097530562e-07, "epoch": 19.950848972296694, "percentage": 99.75, "elapsed_time": "8:15:53", "remaining_time": "0:01:13", "throughput": 2613.78, "total_tokens": 77767776} +{"current_steps": 133955, "total_steps": 134280, "loss": 0.7885, "lr": 5.386242789851004e-07, "epoch": 19.951593684837654, "percentage": 99.76, "elapsed_time": "8:15:54", "remaining_time": "0:01:12", "throughput": 2613.78, "total_tokens": 77770720} +{"current_steps": 133960, "total_steps": 134280, "loss": 0.818, "lr": 5.222288610934322e-07, "epoch": 19.95233839737861, "percentage": 99.76, "elapsed_time": "8:15:55", "remaining_time": "0:01:11", "throughput": 2613.78, "total_tokens": 77773504} +{"current_steps": 133965, "total_steps": 134280, "loss": 0.774, "lr": 5.060868441336685e-07, "epoch": 19.95308310991957, "percentage": 99.77, "elapsed_time": "8:15:56", "remaining_time": "0:01:09", "throughput": 2613.79, "total_tokens": 77776800} +{"current_steps": 133970, "total_steps": 134280, "loss": 0.8278, "lr": 4.901982283805895e-07, "epoch": 19.95382782246053, "percentage": 99.77, "elapsed_time": "8:15:57", "remaining_time": "0:01:08", "throughput": 2613.8, "total_tokens": 77779776} +{"current_steps": 133975, "total_steps": 134280, "loss": 0.821, "lr": 4.7456301409898317e-07, "epoch": 19.95457253500149, "percentage": 99.77, "elapsed_time": "8:15:58", "remaining_time": "0:01:07", "throughput": 2613.81, "total_tokens": 77782720} +{"current_steps": 133980, "total_steps": 134280, "loss": 0.8058, "lr": 4.591812015553032e-07, "epoch": 19.95531724754245, "percentage": 99.78, "elapsed_time": "8:15:59", "remaining_time": "0:01:06", "throughput": 2613.81, "total_tokens": 77785600} +{"current_steps": 133985, "total_steps": 134280, "loss": 0.774, "lr": 4.440527910093417e-07, "epoch": 19.956061960083407, "percentage": 99.78, "elapsed_time": "8:16:00", "remaining_time": "0:01:05", "throughput": 2613.82, "total_tokens": 77788832} +{"current_steps": 133990, "total_steps": 134280, "loss": 0.8118, "lr": 4.2917778271589487e-07, "epoch": 19.956806672624367, "percentage": 99.78, "elapsed_time": "8:16:01", "remaining_time": "0:01:04", "throughput": 2613.82, "total_tokens": 77791776} +{"current_steps": 133995, "total_steps": 134280, "loss": 0.7913, "lr": 4.145561769264283e-07, "epoch": 19.957551385165328, "percentage": 99.79, "elapsed_time": "8:16:02", "remaining_time": "0:01:03", "throughput": 2613.83, "total_tokens": 77794720} +{"current_steps": 134000, "total_steps": 134280, "loss": 0.8092, "lr": 4.001879738890768e-07, "epoch": 19.958296097706285, "percentage": 99.79, "elapsed_time": "8:16:03", "remaining_time": "0:01:02", "throughput": 2613.84, "total_tokens": 77797728} +{"current_steps": 134005, "total_steps": 134280, "loss": 0.7951, "lr": 3.8607317384531377e-07, "epoch": 19.959040810247245, "percentage": 99.8, "elapsed_time": "8:16:04", "remaining_time": "0:01:01", "throughput": 2613.84, "total_tokens": 77800512} +{"current_steps": 134010, "total_steps": 134280, "loss": 0.8184, "lr": 3.722117770332822e-07, "epoch": 19.959785522788202, "percentage": 99.8, "elapsed_time": "8:16:05", "remaining_time": "0:00:59", "throughput": 2613.84, "total_tokens": 77803136} +{"current_steps": 134015, "total_steps": 134280, "loss": 0.8001, "lr": 3.586037836877942e-07, "epoch": 19.960530235329163, "percentage": 99.8, "elapsed_time": "8:16:06", "remaining_time": "0:00:58", "throughput": 2613.84, "total_tokens": 77806112} +{"current_steps": 134020, "total_steps": 134280, "loss": 0.8042, "lr": 3.4524919403866593e-07, "epoch": 19.961274947870123, "percentage": 99.81, "elapsed_time": "8:16:08", "remaining_time": "0:00:57", "throughput": 2613.85, "total_tokens": 77808960} +{"current_steps": 134025, "total_steps": 134280, "loss": 0.789, "lr": 3.321480083123829e-07, "epoch": 19.96201966041108, "percentage": 99.81, "elapsed_time": "8:16:09", "remaining_time": "0:00:56", "throughput": 2613.85, "total_tokens": 77811744} +{"current_steps": 134030, "total_steps": 134280, "loss": 0.802, "lr": 3.1930022672876923e-07, "epoch": 19.96276437295204, "percentage": 99.81, "elapsed_time": "8:16:10", "remaining_time": "0:00:55", "throughput": 2613.86, "total_tokens": 77814848} +{"current_steps": 134035, "total_steps": 134280, "loss": 0.808, "lr": 3.0670584950598376e-07, "epoch": 19.963509085493, "percentage": 99.82, "elapsed_time": "8:16:11", "remaining_time": "0:00:54", "throughput": 2613.86, "total_tokens": 77817952} +{"current_steps": 134040, "total_steps": 134280, "loss": 0.794, "lr": 2.9436487685718935e-07, "epoch": 19.96425379803396, "percentage": 99.82, "elapsed_time": "8:16:12", "remaining_time": "0:00:53", "throughput": 2613.87, "total_tokens": 77820832} +{"current_steps": 134045, "total_steps": 134280, "loss": 0.8008, "lr": 2.8227730898888745e-07, "epoch": 19.96499851057492, "percentage": 99.82, "elapsed_time": "8:16:13", "remaining_time": "0:00:52", "throughput": 2613.88, "total_tokens": 77823936} +{"current_steps": 134050, "total_steps": 134280, "loss": 0.7845, "lr": 2.704431461059142e-07, "epoch": 19.965743223115876, "percentage": 99.83, "elapsed_time": "8:16:14", "remaining_time": "0:00:51", "throughput": 2613.88, "total_tokens": 77826912} +{"current_steps": 134055, "total_steps": 134280, "loss": 0.8049, "lr": 2.588623884097751e-07, "epoch": 19.966487935656836, "percentage": 99.83, "elapsed_time": "8:16:15", "remaining_time": "0:00:49", "throughput": 2613.89, "total_tokens": 77829888} +{"current_steps": 134060, "total_steps": 134280, "loss": 0.788, "lr": 2.4753503609531434e-07, "epoch": 19.967232648197797, "percentage": 99.84, "elapsed_time": "8:16:16", "remaining_time": "0:00:48", "throughput": 2613.89, "total_tokens": 77832704} +{"current_steps": 134065, "total_steps": 134280, "loss": 0.8117, "lr": 2.364610893540453e-07, "epoch": 19.967977360738754, "percentage": 99.84, "elapsed_time": "8:16:17", "remaining_time": "0:00:47", "throughput": 2613.9, "total_tokens": 77835648} +{"current_steps": 134070, "total_steps": 134280, "loss": 0.8061, "lr": 2.2564054837082015e-07, "epoch": 19.968722073279714, "percentage": 99.84, "elapsed_time": "8:16:18", "remaining_time": "0:00:46", "throughput": 2613.9, "total_tokens": 77838688} +{"current_steps": 134075, "total_steps": 134280, "loss": 0.7868, "lr": 2.1507341333215635e-07, "epoch": 19.969466785820675, "percentage": 99.85, "elapsed_time": "8:16:19", "remaining_time": "0:00:45", "throughput": 2613.91, "total_tokens": 77841632} +{"current_steps": 134080, "total_steps": 134280, "loss": 0.7998, "lr": 2.0475968441291404e-07, "epoch": 19.970211498361632, "percentage": 99.85, "elapsed_time": "8:16:20", "remaining_time": "0:00:44", "throughput": 2613.91, "total_tokens": 77844544} +{"current_steps": 134085, "total_steps": 134280, "loss": 0.7966, "lr": 1.94699361791284e-07, "epoch": 19.970956210902592, "percentage": 99.85, "elapsed_time": "8:16:21", "remaining_time": "0:00:43", "throughput": 2613.92, "total_tokens": 77847648} +{"current_steps": 134090, "total_steps": 134280, "loss": 0.7938, "lr": 1.848924456337997e-07, "epoch": 19.97170092344355, "percentage": 99.86, "elapsed_time": "8:16:22", "remaining_time": "0:00:42", "throughput": 2613.92, "total_tokens": 77850432} +{"current_steps": 134095, "total_steps": 134280, "loss": 0.7942, "lr": 1.7533893610699457e-07, "epoch": 19.97244563598451, "percentage": 99.86, "elapsed_time": "8:16:24", "remaining_time": "0:00:41", "throughput": 2613.93, "total_tokens": 77853440} +{"current_steps": 134100, "total_steps": 134280, "loss": 0.7989, "lr": 1.6603883337407143e-07, "epoch": 19.97319034852547, "percentage": 99.87, "elapsed_time": "8:16:25", "remaining_time": "0:00:39", "throughput": 2613.93, "total_tokens": 77856192} +{"current_steps": 134105, "total_steps": 134280, "loss": 0.7751, "lr": 1.5699213758990638e-07, "epoch": 19.973935061066427, "percentage": 99.87, "elapsed_time": "8:16:26", "remaining_time": "0:00:38", "throughput": 2613.94, "total_tokens": 77859392} +{"current_steps": 134110, "total_steps": 134280, "loss": 0.8192, "lr": 1.4819884890771017e-07, "epoch": 19.974679773607388, "percentage": 99.87, "elapsed_time": "8:16:27", "remaining_time": "0:00:37", "throughput": 2613.95, "total_tokens": 77862304} +{"current_steps": 134115, "total_steps": 134280, "loss": 0.8138, "lr": 1.3965896747736295e-07, "epoch": 19.97542448614835, "percentage": 99.88, "elapsed_time": "8:16:28", "remaining_time": "0:00:36", "throughput": 2613.95, "total_tokens": 77865344} +{"current_steps": 134120, "total_steps": 134280, "loss": 0.7975, "lr": 1.3137249344208344e-07, "epoch": 19.976169198689306, "percentage": 99.88, "elapsed_time": "8:16:29", "remaining_time": "0:00:35", "throughput": 2613.96, "total_tokens": 77868320} +{"current_steps": 134125, "total_steps": 134280, "loss": 0.7987, "lr": 1.2333942694175982e-07, "epoch": 19.976913911230266, "percentage": 99.88, "elapsed_time": "8:16:30", "remaining_time": "0:00:34", "throughput": 2613.97, "total_tokens": 77871456} +{"current_steps": 134130, "total_steps": 134280, "loss": 0.802, "lr": 1.1555976811294942e-07, "epoch": 19.977658623771223, "percentage": 99.89, "elapsed_time": "8:16:31", "remaining_time": "0:00:33", "throughput": 2613.98, "total_tokens": 77874656} +{"current_steps": 134135, "total_steps": 134280, "loss": 0.8094, "lr": 1.0803351708721375e-07, "epoch": 19.978403336312184, "percentage": 99.89, "elapsed_time": "8:16:32", "remaining_time": "0:00:32", "throughput": 2613.98, "total_tokens": 77877536} +{"current_steps": 134140, "total_steps": 134280, "loss": 0.8023, "lr": 1.0076067398945287e-07, "epoch": 19.979148048853144, "percentage": 99.9, "elapsed_time": "8:16:33", "remaining_time": "0:00:31", "throughput": 2613.99, "total_tokens": 77880704} +{"current_steps": 134145, "total_steps": 134280, "loss": 0.7932, "lr": 9.37412389462322e-08, "epoch": 19.9798927613941, "percentage": 99.9, "elapsed_time": "8:16:34", "remaining_time": "0:00:29", "throughput": 2614.0, "total_tokens": 77883840} +{"current_steps": 134150, "total_steps": 134280, "loss": 0.7978, "lr": 8.697521207245984e-08, "epoch": 19.98063747393506, "percentage": 99.9, "elapsed_time": "8:16:35", "remaining_time": "0:00:28", "throughput": 2614.0, "total_tokens": 77886720} +{"current_steps": 134155, "total_steps": 134280, "loss": 0.7722, "lr": 8.046259348304385e-08, "epoch": 19.98138218647602, "percentage": 99.91, "elapsed_time": "8:16:37", "remaining_time": "0:00:27", "throughput": 2614.01, "total_tokens": 77889664} +{"current_steps": 134160, "total_steps": 134280, "loss": 0.7916, "lr": 7.420338329122699e-08, "epoch": 19.98212689901698, "percentage": 99.91, "elapsed_time": "8:16:38", "remaining_time": "0:00:26", "throughput": 2614.01, "total_tokens": 77892448} +{"current_steps": 134165, "total_steps": 134280, "loss": 0.7972, "lr": 6.819758159859468e-08, "epoch": 19.98287161155794, "percentage": 99.91, "elapsed_time": "8:16:39", "remaining_time": "0:00:25", "throughput": 2614.01, "total_tokens": 77895072} +{"current_steps": 134170, "total_steps": 134280, "loss": 0.8127, "lr": 6.244518851006297e-08, "epoch": 19.983616324098897, "percentage": 99.92, "elapsed_time": "8:16:40", "remaining_time": "0:00:24", "throughput": 2614.01, "total_tokens": 77897792} +{"current_steps": 134175, "total_steps": 134280, "loss": 0.8112, "lr": 5.6946204120555954e-08, "epoch": 19.984361036639857, "percentage": 99.92, "elapsed_time": "8:16:41", "remaining_time": "0:00:23", "throughput": 2614.01, "total_tokens": 77900672} +{"current_steps": 134180, "total_steps": 134280, "loss": 0.8235, "lr": 5.1700628523332346e-08, "epoch": 19.985105749180818, "percentage": 99.93, "elapsed_time": "8:16:42", "remaining_time": "0:00:22", "throughput": 2614.02, "total_tokens": 77903488} +{"current_steps": 134185, "total_steps": 134280, "loss": 0.7935, "lr": 4.670846180832022e-08, "epoch": 19.985850461721775, "percentage": 99.93, "elapsed_time": "8:16:43", "remaining_time": "0:00:21", "throughput": 2614.02, "total_tokens": 77906336} +{"current_steps": 134190, "total_steps": 134280, "loss": 0.8051, "lr": 4.1969704057120967e-08, "epoch": 19.986595174262735, "percentage": 99.93, "elapsed_time": "8:16:44", "remaining_time": "0:00:19", "throughput": 2614.02, "total_tokens": 77908960} +{"current_steps": 134195, "total_steps": 134280, "loss": 0.8039, "lr": 3.7484355353001316e-08, "epoch": 19.987339886803692, "percentage": 99.94, "elapsed_time": "8:16:45", "remaining_time": "0:00:18", "throughput": 2614.02, "total_tokens": 77911872} +{"current_steps": 134200, "total_steps": 134280, "loss": 0.8109, "lr": 3.3252415770901324e-08, "epoch": 19.988084599344653, "percentage": 99.94, "elapsed_time": "8:16:46", "remaining_time": "0:00:17", "throughput": 2614.02, "total_tokens": 77914496} +{"current_steps": 134205, "total_steps": 134280, "loss": 0.7852, "lr": 2.9273885380765028e-08, "epoch": 19.988829311885613, "percentage": 99.94, "elapsed_time": "8:16:47", "remaining_time": "0:00:16", "throughput": 2614.03, "total_tokens": 77917472} +{"current_steps": 134210, "total_steps": 134280, "loss": 0.8004, "lr": 2.5548764250871158e-08, "epoch": 19.98957402442657, "percentage": 99.95, "elapsed_time": "8:16:48", "remaining_time": "0:00:15", "throughput": 2614.03, "total_tokens": 77920352} +{"current_steps": 134215, "total_steps": 134280, "loss": 0.785, "lr": 2.2077052442837086e-08, "epoch": 19.99031873696753, "percentage": 99.95, "elapsed_time": "8:16:49", "remaining_time": "0:00:14", "throughput": 2614.04, "total_tokens": 77923168} +{"current_steps": 134220, "total_steps": 134280, "loss": 0.803, "lr": 1.885875001828019e-08, "epoch": 19.99106344950849, "percentage": 99.96, "elapsed_time": "8:16:50", "remaining_time": "0:00:13", "throughput": 2614.05, "total_tokens": 77926368} +{"current_steps": 134225, "total_steps": 134280, "loss": 0.8026, "lr": 1.5893857028825842e-08, "epoch": 19.99180816204945, "percentage": 99.96, "elapsed_time": "8:16:51", "remaining_time": "0:00:12", "throughput": 2614.06, "total_tokens": 77929440} +{"current_steps": 134230, "total_steps": 134280, "loss": 0.8162, "lr": 1.3182373526099411e-08, "epoch": 19.99255287459041, "percentage": 99.96, "elapsed_time": "8:16:52", "remaining_time": "0:00:11", "throughput": 2614.06, "total_tokens": 77932192} +{"current_steps": 134235, "total_steps": 134280, "loss": 0.7904, "lr": 1.072429955506493e-08, "epoch": 19.993297587131366, "percentage": 99.97, "elapsed_time": "8:16:53", "remaining_time": "0:00:09", "throughput": 2614.06, "total_tokens": 77935136} +{"current_steps": 134240, "total_steps": 134280, "loss": 0.81, "lr": 8.519635157355765e-09, "epoch": 19.994042299672326, "percentage": 99.97, "elapsed_time": "8:16:54", "remaining_time": "0:00:08", "throughput": 2614.07, "total_tokens": 77938048} +{"current_steps": 134245, "total_steps": 134280, "loss": 0.8076, "lr": 6.5683803712746065e-09, "epoch": 19.994787012213287, "percentage": 99.97, "elapsed_time": "8:16:55", "remaining_time": "0:00:07", "throughput": 2614.07, "total_tokens": 77940864} +{"current_steps": 134250, "total_steps": 134280, "loss": 0.7787, "lr": 4.8705352284628135e-09, "epoch": 19.995531724754244, "percentage": 99.98, "elapsed_time": "8:16:56", "remaining_time": "0:00:06", "throughput": 2614.08, "total_tokens": 77943904} +{"current_steps": 134255, "total_steps": 134280, "loss": 0.8164, "lr": 3.4260997572310714e-09, "epoch": 19.996276437295204, "percentage": 99.98, "elapsed_time": "8:16:58", "remaining_time": "0:00:05", "throughput": 2614.09, "total_tokens": 77946912} +{"current_steps": 134260, "total_steps": 134280, "loss": 0.7934, "lr": 2.2350739842247333e-09, "epoch": 19.997021149836165, "percentage": 99.99, "elapsed_time": "8:16:59", "remaining_time": "0:00:04", "throughput": 2614.09, "total_tokens": 77949824} +{"current_steps": 134265, "total_steps": 134280, "loss": 0.7855, "lr": 1.2974579277624798e-09, "epoch": 19.997765862377122, "percentage": 99.99, "elapsed_time": "8:17:00", "remaining_time": "0:00:03", "throughput": 2614.1, "total_tokens": 77953024} +{"current_steps": 134270, "total_steps": 134280, "loss": 0.8183, "lr": 6.132516028323209e-10, "epoch": 19.998510574918082, "percentage": 99.99, "elapsed_time": "8:17:01", "remaining_time": "0:00:02", "throughput": 2614.11, "total_tokens": 77956032} +{"current_steps": 134275, "total_steps": 134280, "loss": 0.7991, "lr": 1.8245502275693325e-10, "epoch": 19.99925528745904, "percentage": 100.0, "elapsed_time": "8:17:02", "remaining_time": "0:00:01", "throughput": 2614.12, "total_tokens": 77959072} +{"current_steps": 134280, "total_steps": 134280, "loss": 0.8063, "lr": 5.068195862989455e-12, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "8:17:03", "remaining_time": "0:00:00", "throughput": 2614.11, "total_tokens": 77961608} +{"current_steps": 134280, "total_steps": 134280, "eval_loss": 0.7992360591888428, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "8:18:13", "remaining_time": "0:00:00", "throughput": 2607.94, "total_tokens": 77961608} +{"current_steps": 134280, "total_steps": 134280, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "8:18:15", "remaining_time": "0:00:00", "throughput": 2607.82, "total_tokens": 77961608}