{"current_steps": 1, "total_steps": 9134, "loss": 0.6712, "learning_rate": 4.99999985212739e-05, "epoch": 0.00010947207093790197, "percentage": 0.01, "elapsed_time": "0:01:15", "remaining_time": "7 days, 23:50:35", "throughput": 2654.12, "total_tokens": 200704} {"current_steps": 2, "total_steps": 9134, "loss": 0.6784, "learning_rate": 4.9999994085095755e-05, "epoch": 0.00021894414187580393, "percentage": 0.02, "elapsed_time": "0:02:28", "remaining_time": "7 days, 20:14:11", "throughput": 2605.06, "total_tokens": 386624} {"current_steps": 3, "total_steps": 9134, "loss": 0.802, "learning_rate": 4.9999986691466115e-05, "epoch": 0.0003284162128137059, "percentage": 0.03, "elapsed_time": "0:03:40", "remaining_time": "7 days, 18:35:03", "throughput": 2682.65, "total_tokens": 592032} {"current_steps": 4, "total_steps": 9134, "loss": 0.6541, "learning_rate": 4.999997634038584e-05, "epoch": 0.00043788828375160787, "percentage": 0.04, "elapsed_time": "0:04:46", "remaining_time": "7 days, 13:53:57", "throughput": 2665.56, "total_tokens": 764736} {"current_steps": 5, "total_steps": 9134, "loss": 0.5063, "learning_rate": 4.9999963031856145e-05, "epoch": 0.0005473603546895098, "percentage": 0.05, "elapsed_time": "0:05:55", "remaining_time": "7 days, 12:18:52", "throughput": 2618.45, "total_tokens": 930944} {"current_steps": 6, "total_steps": 9134, "loss": 0.7316, "learning_rate": 4.999994676587863e-05, "epoch": 0.0006568324256274118, "percentage": 0.07, "elapsed_time": "0:07:03", "remaining_time": "7 days, 11:06:44", "throughput": 2676.85, "total_tokens": 1134560} {"current_steps": 7, "total_steps": 9134, "loss": 0.5013, "learning_rate": 4.9999927542455196e-05, "epoch": 0.0007663044965653138, "percentage": 0.08, "elapsed_time": "0:08:11", "remaining_time": "7 days, 9:51:13", "throughput": 2699.98, "total_tokens": 1325856} {"current_steps": 8, "total_steps": 9134, "loss": 0.4773, "learning_rate": 4.9999905361588115e-05, "epoch": 0.0008757765675032157, "percentage": 0.09, "elapsed_time": "0:09:19", "remaining_time": "7 days, 9:21:52", "throughput": 2722.91, "total_tokens": 1524096} {"current_steps": 9, "total_steps": 9134, "loss": 0.6527, "learning_rate": 4.999988022328004e-05, "epoch": 0.0009852486384411177, "percentage": 0.1, "elapsed_time": "0:10:26", "remaining_time": "7 days, 8:27:51", "throughput": 2694.14, "total_tokens": 1688064} {"current_steps": 10, "total_steps": 9134, "loss": 0.6857, "learning_rate": 4.999985212753391e-05, "epoch": 0.0010947207093790197, "percentage": 0.11, "elapsed_time": "0:11:34", "remaining_time": "7 days, 7:57:10", "throughput": 2680.91, "total_tokens": 1861216} {"current_steps": 11, "total_steps": 9134, "loss": 0.729, "learning_rate": 4.999982107435308e-05, "epoch": 0.0012041927803169217, "percentage": 0.12, "elapsed_time": "0:12:44", "remaining_time": "7 days, 8:11:28", "throughput": 2665.01, "total_tokens": 2038176} {"current_steps": 12, "total_steps": 9134, "loss": 0.7044, "learning_rate": 4.99997870637412e-05, "epoch": 0.0013136648512548236, "percentage": 0.13, "elapsed_time": "0:13:49", "remaining_time": "7 days, 7:14:16", "throughput": 2667.03, "total_tokens": 2213344} {"current_steps": 13, "total_steps": 9134, "loss": 0.6114, "learning_rate": 4.99997500957023e-05, "epoch": 0.0014231369221927256, "percentage": 0.14, "elapsed_time": "0:14:56", "remaining_time": "7 days, 6:44:40", "throughput": 2662.66, "total_tokens": 2387392} {"current_steps": 14, "total_steps": 9134, "loss": 0.9107, "learning_rate": 4.999971017024076e-05, "epoch": 0.0015326089931306276, "percentage": 0.15, "elapsed_time": "0:16:03", "remaining_time": "7 days, 6:25:59", "throughput": 2654.15, "total_tokens": 2558528} {"current_steps": 15, "total_steps": 9134, "loss": 0.7237, "learning_rate": 4.99996672873613e-05, "epoch": 0.0016420810640685294, "percentage": 0.16, "elapsed_time": "0:17:12", "remaining_time": "7 days, 6:23:05", "throughput": 2657.45, "total_tokens": 2744224} {"current_steps": 16, "total_steps": 9134, "loss": 0.6368, "learning_rate": 4.999962144706898e-05, "epoch": 0.0017515531350064315, "percentage": 0.18, "elapsed_time": "0:18:21", "remaining_time": "7 days, 6:20:50", "throughput": 2668.96, "total_tokens": 2939552} {"current_steps": 17, "total_steps": 9134, "loss": 0.7459, "learning_rate": 4.999957264936925e-05, "epoch": 0.0018610252059443335, "percentage": 0.19, "elapsed_time": "0:19:27", "remaining_time": "7 days, 5:58:40", "throughput": 2670.85, "total_tokens": 3119200} {"current_steps": 18, "total_steps": 9134, "loss": 0.5144, "learning_rate": 4.999952089426785e-05, "epoch": 0.0019704972768822353, "percentage": 0.2, "elapsed_time": "0:20:32", "remaining_time": "7 days, 5:26:05", "throughput": 2667.09, "total_tokens": 3288096} {"current_steps": 19, "total_steps": 9134, "loss": 0.7758, "learning_rate": 4.9999466181770934e-05, "epoch": 0.0020799693478201374, "percentage": 0.21, "elapsed_time": "0:21:43", "remaining_time": "7 days, 5:38:22", "throughput": 2683.68, "total_tokens": 3496864} {"current_steps": 20, "total_steps": 9134, "loss": 0.9462, "learning_rate": 4.999940851188495e-05, "epoch": 0.0021894414187580394, "percentage": 0.22, "elapsed_time": "0:22:53", "remaining_time": "7 days, 5:49:35", "throughput": 2702.09, "total_tokens": 3710560} {"current_steps": 21, "total_steps": 9134, "loss": 0.8865, "learning_rate": 4.999934788461673e-05, "epoch": 0.0022989134896959414, "percentage": 0.23, "elapsed_time": "0:24:00", "remaining_time": "7 days, 5:39:52", "throughput": 2702.88, "total_tokens": 3894016} {"current_steps": 22, "total_steps": 9134, "loss": 0.5197, "learning_rate": 4.9999284299973456e-05, "epoch": 0.0024083855606338435, "percentage": 0.24, "elapsed_time": "0:25:08", "remaining_time": "7 days, 5:31:50", "throughput": 2693.55, "total_tokens": 4062688} {"current_steps": 23, "total_steps": 9134, "loss": 0.6756, "learning_rate": 4.999921775796263e-05, "epoch": 0.002517857631571745, "percentage": 0.25, "elapsed_time": "0:26:15", "remaining_time": "7 days, 5:24:36", "throughput": 2691.24, "total_tokens": 4241216} {"current_steps": 24, "total_steps": 9134, "loss": 0.6375, "learning_rate": 4.999914825859214e-05, "epoch": 0.002627329702509647, "percentage": 0.26, "elapsed_time": "0:27:23", "remaining_time": "7 days, 5:17:40", "throughput": 2686.71, "total_tokens": 4415712} {"current_steps": 25, "total_steps": 9134, "loss": 0.8339, "learning_rate": 4.999907580187019e-05, "epoch": 0.002736801773447549, "percentage": 0.27, "elapsed_time": "0:28:33", "remaining_time": "7 days, 5:27:27", "throughput": 2698.21, "total_tokens": 4624256} {"current_steps": 26, "total_steps": 9134, "loss": 0.6684, "learning_rate": 4.9999000387805375e-05, "epoch": 0.002846273844385451, "percentage": 0.28, "elapsed_time": "0:29:42", "remaining_time": "7 days, 5:28:42", "throughput": 2691.47, "total_tokens": 4798304} {"current_steps": 27, "total_steps": 9134, "loss": 0.6474, "learning_rate": 4.99989220164066e-05, "epoch": 0.002955745915323353, "percentage": 0.3, "elapsed_time": "0:30:50", "remaining_time": "7 days, 5:25:12", "throughput": 2690.4, "total_tokens": 4979744} {"current_steps": 28, "total_steps": 9134, "loss": 0.7383, "learning_rate": 4.9998840687683135e-05, "epoch": 0.0030652179862612552, "percentage": 0.31, "elapsed_time": "0:31:57", "remaining_time": "7 days, 5:12:30", "throughput": 2680.26, "total_tokens": 5139008} {"current_steps": 29, "total_steps": 9134, "loss": 0.8955, "learning_rate": 4.999875640164461e-05, "epoch": 0.0031746900571991573, "percentage": 0.32, "elapsed_time": "0:33:03", "remaining_time": "7 days, 5:00:43", "throughput": 2682.41, "total_tokens": 5321344} {"current_steps": 30, "total_steps": 9134, "loss": 0.737, "learning_rate": 4.9998669158301e-05, "epoch": 0.003284162128137059, "percentage": 0.33, "elapsed_time": "0:34:13", "remaining_time": "7 days, 5:07:19", "throughput": 2685.62, "total_tokens": 5515552} {"current_steps": 31, "total_steps": 9134, "loss": 0.8718, "learning_rate": 4.999857895766261e-05, "epoch": 0.003393634199074961, "percentage": 0.34, "elapsed_time": "0:35:23", "remaining_time": "7 days, 5:15:02", "throughput": 2693.06, "total_tokens": 5720064} {"current_steps": 32, "total_steps": 9134, "loss": 0.851, "learning_rate": 4.999848579974012e-05, "epoch": 0.003503106270012863, "percentage": 0.35, "elapsed_time": "0:36:33", "remaining_time": "7 days, 5:20:14", "throughput": 2699.1, "total_tokens": 5921440} {"current_steps": 33, "total_steps": 9134, "loss": 0.7081, "learning_rate": 4.9998389684544546e-05, "epoch": 0.003612578340950765, "percentage": 0.36, "elapsed_time": "0:37:41", "remaining_time": "7 days, 5:16:15", "throughput": 2702.8, "total_tokens": 6113184} {"current_steps": 34, "total_steps": 9134, "loss": 0.5156, "learning_rate": 4.999829061208726e-05, "epoch": 0.003722050411888667, "percentage": 0.37, "elapsed_time": "0:38:48", "remaining_time": "7 days, 5:08:43", "throughput": 2698.12, "total_tokens": 6283648} {"current_steps": 35, "total_steps": 9134, "loss": 0.6898, "learning_rate": 4.999818858237999e-05, "epoch": 0.003831522482826569, "percentage": 0.38, "elapsed_time": "0:39:59", "remaining_time": "7 days, 5:15:38", "throughput": 2696.21, "total_tokens": 6468896} {"current_steps": 36, "total_steps": 9134, "loss": 0.6718, "learning_rate": 4.99980835954348e-05, "epoch": 0.003940994553764471, "percentage": 0.39, "elapsed_time": "0:41:05", "remaining_time": "7 days, 5:06:46", "throughput": 2701.29, "total_tokens": 6661312} {"current_steps": 37, "total_steps": 9134, "loss": 0.6001, "learning_rate": 4.999797565126411e-05, "epoch": 0.004050466624702373, "percentage": 0.41, "elapsed_time": "0:42:13", "remaining_time": "7 days, 5:02:37", "throughput": 2699.51, "total_tokens": 6839840} {"current_steps": 38, "total_steps": 9134, "loss": 0.5177, "learning_rate": 4.999786474988067e-05, "epoch": 0.004159938695640275, "percentage": 0.42, "elapsed_time": "0:43:19", "remaining_time": "7 days, 4:49:37", "throughput": 2701.1, "total_tokens": 7020832} {"current_steps": 39, "total_steps": 9134, "loss": 0.634, "learning_rate": 4.9997750891297636e-05, "epoch": 0.004269410766578176, "percentage": 0.43, "elapsed_time": "0:44:27", "remaining_time": "7 days, 4:48:37", "throughput": 2705.95, "total_tokens": 7218624} {"current_steps": 40, "total_steps": 9134, "loss": 0.6785, "learning_rate": 4.9997634075528454e-05, "epoch": 0.004378882837516079, "percentage": 0.44, "elapsed_time": "0:45:37", "remaining_time": "7 days, 4:51:22", "throughput": 2701.72, "total_tokens": 7394912} {"current_steps": 41, "total_steps": 9134, "loss": 0.6915, "learning_rate": 4.999751430258695e-05, "epoch": 0.00448835490845398, "percentage": 0.45, "elapsed_time": "0:46:46", "remaining_time": "7 days, 4:55:32", "throughput": 2698.24, "total_tokens": 7573888} {"current_steps": 42, "total_steps": 9134, "loss": 0.6931, "learning_rate": 4.999739157248729e-05, "epoch": 0.004597826979391883, "percentage": 0.46, "elapsed_time": "0:47:55", "remaining_time": "7 days, 4:55:43", "throughput": 2701.89, "total_tokens": 7770112} {"current_steps": 43, "total_steps": 9134, "loss": 0.7323, "learning_rate": 4.9997265885243993e-05, "epoch": 0.0047072990503297845, "percentage": 0.47, "elapsed_time": "0:49:06", "remaining_time": "7 days, 5:01:13", "throughput": 2710.96, "total_tokens": 7986944} {"current_steps": 44, "total_steps": 9134, "loss": 0.8218, "learning_rate": 4.999713724087193e-05, "epoch": 0.004816771121267687, "percentage": 0.48, "elapsed_time": "0:50:13", "remaining_time": "7 days, 4:57:09", "throughput": 2717.36, "total_tokens": 8189664} {"current_steps": 45, "total_steps": 9134, "loss": 0.9619, "learning_rate": 4.999700563938632e-05, "epoch": 0.0049262431922055885, "percentage": 0.49, "elapsed_time": "0:51:23", "remaining_time": "7 days, 5:00:18", "throughput": 2718.71, "total_tokens": 8383424} {"current_steps": 46, "total_steps": 9134, "loss": 0.6285, "learning_rate": 4.999687108080272e-05, "epoch": 0.00503571526314349, "percentage": 0.5, "elapsed_time": "0:52:33", "remaining_time": "7 days, 5:02:51", "throughput": 2720.04, "total_tokens": 8576960} {"current_steps": 47, "total_steps": 9134, "loss": 0.6056, "learning_rate": 4.999673356513707e-05, "epoch": 0.005145187334081393, "percentage": 0.51, "elapsed_time": "0:53:36", "remaining_time": "7 days, 4:44:58", "throughput": 2716.47, "total_tokens": 8737792} {"current_steps": 48, "total_steps": 9134, "loss": 0.6865, "learning_rate": 4.999659309240561e-05, "epoch": 0.005254659405019294, "percentage": 0.53, "elapsed_time": "0:54:43", "remaining_time": "7 days, 4:38:32", "throughput": 2714.86, "total_tokens": 8913856} {"current_steps": 49, "total_steps": 9134, "loss": 0.6112, "learning_rate": 4.9996449662624986e-05, "epoch": 0.005364131475957197, "percentage": 0.54, "elapsed_time": "0:55:51", "remaining_time": "7 days, 4:35:36", "throughput": 2709.91, "total_tokens": 9081408} {"current_steps": 50, "total_steps": 9134, "loss": 0.6682, "learning_rate": 4.999630327581214e-05, "epoch": 0.005473603546895098, "percentage": 0.55, "elapsed_time": "0:56:59", "remaining_time": "7 days, 4:33:18", "throughput": 2707.5, "total_tokens": 9257472} {"current_steps": 51, "total_steps": 9134, "loss": 0.8365, "learning_rate": 4.9996153931984415e-05, "epoch": 0.005583075617833001, "percentage": 0.56, "elapsed_time": "0:58:03", "remaining_time": "7 days, 4:20:21", "throughput": 2704.0, "total_tokens": 9419648} {"current_steps": 52, "total_steps": 9134, "loss": 0.7045, "learning_rate": 4.999600163115945e-05, "epoch": 0.005692547688770902, "percentage": 0.57, "elapsed_time": "0:59:09", "remaining_time": "7 days, 4:13:25", "throughput": 2703.28, "total_tokens": 9596384} {"current_steps": 53, "total_steps": 9134, "loss": 0.7067, "learning_rate": 4.999584637335529e-05, "epoch": 0.005802019759708804, "percentage": 0.58, "elapsed_time": "1:00:16", "remaining_time": "7 days, 4:06:19", "throughput": 2701.81, "total_tokens": 9769984} {"current_steps": 54, "total_steps": 9134, "loss": 0.7084, "learning_rate": 4.9995688158590284e-05, "epoch": 0.005911491830646706, "percentage": 0.59, "elapsed_time": "1:01:26", "remaining_time": "7 days, 4:10:42", "throughput": 2708.76, "total_tokens": 9985248} {"current_steps": 55, "total_steps": 9134, "loss": 0.7537, "learning_rate": 4.9995526986883146e-05, "epoch": 0.006020963901584608, "percentage": 0.6, "elapsed_time": "1:02:33", "remaining_time": "7 days, 4:07:07", "throughput": 2713.3, "total_tokens": 10184832} {"current_steps": 56, "total_steps": 9134, "loss": 0.8001, "learning_rate": 4.999536285825295e-05, "epoch": 0.0061304359725225105, "percentage": 0.61, "elapsed_time": "1:03:36", "remaining_time": "7 days, 3:52:17", "throughput": 2707.53, "total_tokens": 10334240} {"current_steps": 57, "total_steps": 9134, "loss": 0.5893, "learning_rate": 4.999519577271912e-05, "epoch": 0.006239908043460412, "percentage": 0.62, "elapsed_time": "1:04:41", "remaining_time": "7 days, 3:40:42", "throughput": 2701.46, "total_tokens": 10484544} {"current_steps": 58, "total_steps": 9134, "loss": 0.859, "learning_rate": 4.9995025730301406e-05, "epoch": 0.0063493801143983146, "percentage": 0.63, "elapsed_time": "1:05:47", "remaining_time": "7 days, 3:34:10", "throughput": 2699.46, "total_tokens": 10655008} {"current_steps": 59, "total_steps": 9134, "loss": 0.8568, "learning_rate": 4.999485273101993e-05, "epoch": 0.006458852185336216, "percentage": 0.65, "elapsed_time": "1:06:57", "remaining_time": "7 days, 3:37:58", "throughput": 2699.11, "total_tokens": 10842496} {"current_steps": 60, "total_steps": 9134, "loss": 0.5817, "learning_rate": 4.9994676774895154e-05, "epoch": 0.006568324256274118, "percentage": 0.66, "elapsed_time": "1:08:02", "remaining_time": "7 days, 3:30:55", "throughput": 2692.13, "total_tokens": 10991456} {"current_steps": 61, "total_steps": 9134, "loss": 0.7665, "learning_rate": 4.99944978619479e-05, "epoch": 0.00667779632721202, "percentage": 0.67, "elapsed_time": "1:09:10", "remaining_time": "7 days, 3:28:41", "throughput": 2695.35, "total_tokens": 11186784} {"current_steps": 62, "total_steps": 9134, "loss": 0.6607, "learning_rate": 4.9994315992199335e-05, "epoch": 0.006787268398149922, "percentage": 0.68, "elapsed_time": "1:10:18", "remaining_time": "7 days, 3:27:53", "throughput": 2696.13, "total_tokens": 11373824} {"current_steps": 63, "total_steps": 9134, "loss": 0.6294, "learning_rate": 4.9994131165670965e-05, "epoch": 0.006896740469087824, "percentage": 0.69, "elapsed_time": "1:11:26", "remaining_time": "7 days, 3:26:29", "throughput": 2696.41, "total_tokens": 11558176} {"current_steps": 64, "total_steps": 9134, "loss": 0.766, "learning_rate": 4.999394338238466e-05, "epoch": 0.007006212540025726, "percentage": 0.7, "elapsed_time": "1:12:33", "remaining_time": "7 days, 3:21:52", "throughput": 2697.89, "total_tokens": 11744096} {"current_steps": 65, "total_steps": 9134, "loss": 0.9307, "learning_rate": 4.999375264236263e-05, "epoch": 0.0071156846109636275, "percentage": 0.71, "elapsed_time": "1:13:38", "remaining_time": "7 days, 3:14:08", "throughput": 2701.08, "total_tokens": 11934048} {"current_steps": 66, "total_steps": 9134, "loss": 0.7371, "learning_rate": 4.999355894562745e-05, "epoch": 0.00722515668190153, "percentage": 0.72, "elapsed_time": "1:14:44", "remaining_time": "7 days, 3:08:35", "throughput": 2696.01, "total_tokens": 12089728} {"current_steps": 67, "total_steps": 9134, "loss": 0.7666, "learning_rate": 4.9993362292202024e-05, "epoch": 0.007334628752839432, "percentage": 0.73, "elapsed_time": "1:15:50", "remaining_time": "7 days, 3:02:45", "throughput": 2692.19, "total_tokens": 12249888} {"current_steps": 68, "total_steps": 9134, "loss": 0.6124, "learning_rate": 4.999316268210962e-05, "epoch": 0.007444100823777334, "percentage": 0.74, "elapsed_time": "1:16:59", "remaining_time": "7 days, 3:05:31", "throughput": 2692.13, "total_tokens": 12437152} {"current_steps": 69, "total_steps": 9134, "loss": 0.6846, "learning_rate": 4.999296011537384e-05, "epoch": 0.007553572894715236, "percentage": 0.76, "elapsed_time": "1:18:06", "remaining_time": "7 days, 3:01:56", "throughput": 2692.46, "total_tokens": 12618592} {"current_steps": 70, "total_steps": 9134, "loss": 0.9314, "learning_rate": 4.999275459201866e-05, "epoch": 0.007663044965653138, "percentage": 0.77, "elapsed_time": "1:19:16", "remaining_time": "7 days, 3:05:33", "throughput": 2691.52, "total_tokens": 12802944} {"current_steps": 71, "total_steps": 9134, "loss": 0.7839, "learning_rate": 4.9992546112068394e-05, "epoch": 0.00777251703659104, "percentage": 0.78, "elapsed_time": "1:20:25", "remaining_time": "7 days, 3:07:03", "throughput": 2689.51, "total_tokens": 12979456} {"current_steps": 72, "total_steps": 9134, "loss": 0.696, "learning_rate": 4.9992334675547704e-05, "epoch": 0.007881989107528941, "percentage": 0.79, "elapsed_time": "1:21:30", "remaining_time": "7 days, 2:58:54", "throughput": 2686.81, "total_tokens": 13140064} {"current_steps": 73, "total_steps": 9134, "loss": 0.598, "learning_rate": 4.999212028248159e-05, "epoch": 0.007991461178466844, "percentage": 0.8, "elapsed_time": "1:22:32", "remaining_time": "7 days, 2:45:07", "throughput": 2683.54, "total_tokens": 13289920} {"current_steps": 74, "total_steps": 9134, "loss": 0.6061, "learning_rate": 4.999190293289543e-05, "epoch": 0.008100933249404746, "percentage": 0.81, "elapsed_time": "1:23:41", "remaining_time": "7 days, 2:47:24", "throughput": 2687.78, "total_tokens": 13497792} {"current_steps": 75, "total_steps": 9134, "loss": 0.5776, "learning_rate": 4.999168262681492e-05, "epoch": 0.008210405320342647, "percentage": 0.82, "elapsed_time": "1:24:46", "remaining_time": "7 days, 2:38:47", "throughput": 2685.42, "total_tokens": 13658176} {"current_steps": 76, "total_steps": 9134, "loss": 0.6711, "learning_rate": 4.999145936426614e-05, "epoch": 0.00831987739128055, "percentage": 0.83, "elapsed_time": "1:25:53", "remaining_time": "7 days, 2:37:14", "throughput": 2683.62, "total_tokens": 13830432} {"current_steps": 77, "total_steps": 9134, "loss": 0.6841, "learning_rate": 4.9991233145275495e-05, "epoch": 0.008429349462218452, "percentage": 0.84, "elapsed_time": "1:27:03", "remaining_time": "7 days, 2:40:43", "throughput": 2681.58, "total_tokens": 14008064} {"current_steps": 78, "total_steps": 9134, "loss": 0.5426, "learning_rate": 4.999100396986974e-05, "epoch": 0.008538821533156353, "percentage": 0.85, "elapsed_time": "1:28:10", "remaining_time": "7 days, 2:38:03", "throughput": 2679.6, "total_tokens": 14177408} {"current_steps": 79, "total_steps": 9134, "loss": 0.7276, "learning_rate": 4.999077183807599e-05, "epoch": 0.008648293604094255, "percentage": 0.86, "elapsed_time": "1:29:13", "remaining_time": "7 days, 2:27:31", "throughput": 2677.07, "total_tokens": 14332416} {"current_steps": 80, "total_steps": 9134, "loss": 0.7968, "learning_rate": 4.9990536749921704e-05, "epoch": 0.008757765675032158, "percentage": 0.88, "elapsed_time": "1:30:22", "remaining_time": "7 days, 2:27:43", "throughput": 2675.44, "total_tokens": 14506912} {"current_steps": 81, "total_steps": 9134, "loss": 0.7246, "learning_rate": 4.999029870543469e-05, "epoch": 0.00886723774597006, "percentage": 0.89, "elapsed_time": "1:31:30", "remaining_time": "7 days, 2:27:21", "throughput": 2675.83, "total_tokens": 14691488} {"current_steps": 82, "total_steps": 9134, "loss": 0.6807, "learning_rate": 4.999005770464312e-05, "epoch": 0.00897670981690796, "percentage": 0.9, "elapsed_time": "1:32:37", "remaining_time": "7 days, 2:24:09", "throughput": 2676.63, "total_tokens": 14874272} {"current_steps": 83, "total_steps": 9134, "loss": 0.7125, "learning_rate": 4.99898137475755e-05, "epoch": 0.009086181887845863, "percentage": 0.91, "elapsed_time": "1:33:44", "remaining_time": "7 days, 2:22:45", "throughput": 2679.41, "total_tokens": 15070944} {"current_steps": 84, "total_steps": 9134, "loss": 0.8963, "learning_rate": 4.998956683426068e-05, "epoch": 0.009195653958783766, "percentage": 0.92, "elapsed_time": "1:34:52", "remaining_time": "7 days, 2:21:20", "throughput": 2681.51, "total_tokens": 15264032} {"current_steps": 85, "total_steps": 9134, "loss": 0.6492, "learning_rate": 4.9989316964727873e-05, "epoch": 0.009305126029721666, "percentage": 0.93, "elapsed_time": "1:35:57", "remaining_time": "7 days, 2:16:11", "throughput": 2680.49, "total_tokens": 15433824} {"current_steps": 86, "total_steps": 9134, "loss": 0.7585, "learning_rate": 4.9989064139006645e-05, "epoch": 0.009414598100659569, "percentage": 0.94, "elapsed_time": "1:37:01", "remaining_time": "7 days, 2:08:04", "throughput": 2678.19, "total_tokens": 15591296} {"current_steps": 87, "total_steps": 9134, "loss": 0.7022, "learning_rate": 4.99888083571269e-05, "epoch": 0.009524070171597471, "percentage": 0.95, "elapsed_time": "1:38:10", "remaining_time": "7 days, 2:09:12", "throughput": 2677.74, "total_tokens": 15773408} {"current_steps": 88, "total_steps": 9134, "loss": 0.6068, "learning_rate": 4.99885496191189e-05, "epoch": 0.009633542242535374, "percentage": 0.96, "elapsed_time": "1:39:20", "remaining_time": "7 days, 2:12:37", "throughput": 2680.1, "total_tokens": 15975904} {"current_steps": 89, "total_steps": 9134, "loss": 0.7437, "learning_rate": 4.998828792501324e-05, "epoch": 0.009743014313473275, "percentage": 0.97, "elapsed_time": "1:40:28", "remaining_time": "7 days, 2:10:44", "throughput": 2676.45, "total_tokens": 16134272} {"current_steps": 90, "total_steps": 9134, "loss": 0.8501, "learning_rate": 4.998802327484089e-05, "epoch": 0.009852486384411177, "percentage": 0.99, "elapsed_time": "1:41:33", "remaining_time": "7 days, 2:06:09", "throughput": 2672.82, "total_tokens": 16287936} {"current_steps": 91, "total_steps": 9134, "loss": 0.7088, "learning_rate": 4.9987755668633165e-05, "epoch": 0.00996195845534908, "percentage": 1.0, "elapsed_time": "1:42:41", "remaining_time": "7 days, 2:04:58", "throughput": 2673.02, "total_tokens": 16470048} {"current_steps": 92, "total_steps": 9134, "loss": 1.2246, "learning_rate": 4.998748510642171e-05, "epoch": 0.01007143052628698, "percentage": 1.01, "elapsed_time": "1:43:48", "remaining_time": "7 days, 2:03:19", "throughput": 2675.17, "total_tokens": 16663584} {"current_steps": 93, "total_steps": 9134, "loss": 0.7137, "learning_rate": 4.998721158823853e-05, "epoch": 0.010180902597224883, "percentage": 1.02, "elapsed_time": "1:44:59", "remaining_time": "7 days, 2:05:58", "throughput": 2676.58, "total_tokens": 16859808} {"current_steps": 94, "total_steps": 9134, "loss": 0.8742, "learning_rate": 4.998693511411599e-05, "epoch": 0.010290374668162785, "percentage": 1.03, "elapsed_time": "1:46:06", "remaining_time": "7 days, 2:04:13", "throughput": 2677.33, "total_tokens": 17044832} {"current_steps": 95, "total_steps": 9134, "loss": 0.8652, "learning_rate": 4.998665568408679e-05, "epoch": 0.010399846739100688, "percentage": 1.04, "elapsed_time": "1:47:16", "remaining_time": "7 days, 2:06:28", "throughput": 2677.89, "total_tokens": 17235456} {"current_steps": 96, "total_steps": 9134, "loss": 0.804, "learning_rate": 4.998637329818399e-05, "epoch": 0.010509318810038588, "percentage": 1.05, "elapsed_time": "1:48:25", "remaining_time": "7 days, 2:08:25", "throughput": 2679.66, "total_tokens": 17433696} {"current_steps": 97, "total_steps": 9134, "loss": 0.6367, "learning_rate": 4.9986087956441e-05, "epoch": 0.010618790880976491, "percentage": 1.06, "elapsed_time": "1:49:32", "remaining_time": "7 days, 2:05:00", "throughput": 2675.16, "total_tokens": 17581760} {"current_steps": 98, "total_steps": 9134, "loss": 0.8407, "learning_rate": 4.9985799658891563e-05, "epoch": 0.010728262951914393, "percentage": 1.07, "elapsed_time": "1:50:40", "remaining_time": "7 days, 2:05:08", "throughput": 2675.3, "total_tokens": 17766112} {"current_steps": 99, "total_steps": 9134, "loss": 0.9003, "learning_rate": 4.998550840556979e-05, "epoch": 0.010837735022852294, "percentage": 1.08, "elapsed_time": "1:51:51", "remaining_time": "7 days, 2:08:22", "throughput": 2677.71, "total_tokens": 17971296} {"current_steps": 100, "total_steps": 9134, "loss": 0.6371, "learning_rate": 4.998521419651014e-05, "epoch": 0.010947207093790197, "percentage": 1.09, "elapsed_time": "1:52:58", "remaining_time": "7 days, 2:06:04", "throughput": 2678.14, "total_tokens": 18153632} {"current_steps": 101, "total_steps": 9134, "loss": 0.8215, "learning_rate": 4.998491703174742e-05, "epoch": 0.011056679164728099, "percentage": 1.11, "elapsed_time": "1:54:04", "remaining_time": "7 days, 2:01:51", "throughput": 2677.86, "total_tokens": 18327680} {"current_steps": 102, "total_steps": 9134, "loss": 0.6554, "learning_rate": 4.998461691131677e-05, "epoch": 0.011166151235666001, "percentage": 1.12, "elapsed_time": "1:55:06", "remaining_time": "7 days, 1:52:43", "throughput": 2677.49, "total_tokens": 18492096} {"current_steps": 103, "total_steps": 9134, "loss": 0.6907, "learning_rate": 4.9984313835253705e-05, "epoch": 0.011275623306603902, "percentage": 1.13, "elapsed_time": "1:56:14", "remaining_time": "7 days, 1:51:29", "throughput": 2676.77, "total_tokens": 18668160} {"current_steps": 104, "total_steps": 9134, "loss": 0.8705, "learning_rate": 4.998400780359408e-05, "epoch": 0.011385095377541805, "percentage": 1.14, "elapsed_time": "1:57:24", "remaining_time": "7 days, 1:54:09", "throughput": 2677.8, "total_tokens": 18863712} {"current_steps": 105, "total_steps": 9134, "loss": 0.8243, "learning_rate": 4.998369881637408e-05, "epoch": 0.011494567448479707, "percentage": 1.15, "elapsed_time": "1:58:34", "remaining_time": "7 days, 1:56:54", "throughput": 2682.53, "total_tokens": 19085920} {"current_steps": 106, "total_steps": 9134, "loss": 0.7918, "learning_rate": 4.9983386873630285e-05, "epoch": 0.011604039519417608, "percentage": 1.16, "elapsed_time": "1:59:43", "remaining_time": "7 days, 1:56:35", "throughput": 2685.32, "total_tokens": 19289312} {"current_steps": 107, "total_steps": 9134, "loss": 0.8296, "learning_rate": 4.998307197539958e-05, "epoch": 0.01171351159035551, "percentage": 1.17, "elapsed_time": "2:00:53", "remaining_time": "7 days, 1:58:42", "throughput": 2689.86, "total_tokens": 19510400} {"current_steps": 108, "total_steps": 9134, "loss": 0.6138, "learning_rate": 4.998275412171921e-05, "epoch": 0.011822983661293413, "percentage": 1.18, "elapsed_time": "2:01:55", "remaining_time": "7 days, 1:49:06", "throughput": 2688.67, "total_tokens": 19667648} {"current_steps": 109, "total_steps": 9134, "loss": 0.6533, "learning_rate": 4.99824333126268e-05, "epoch": 0.011932455732231315, "percentage": 1.19, "elapsed_time": "2:02:57", "remaining_time": "7 days, 1:40:40", "throughput": 2685.64, "total_tokens": 19813248} {"current_steps": 110, "total_steps": 9134, "loss": 0.6766, "learning_rate": 4.9982109548160274e-05, "epoch": 0.012041927803169216, "percentage": 1.2, "elapsed_time": "2:04:07", "remaining_time": "7 days, 1:42:20", "throughput": 2688.2, "total_tokens": 20019552} {"current_steps": 111, "total_steps": 9134, "loss": 0.8005, "learning_rate": 4.998178282835795e-05, "epoch": 0.012151399874107119, "percentage": 1.22, "elapsed_time": "2:05:13", "remaining_time": "7 days, 1:39:47", "throughput": 2687.13, "total_tokens": 20190688} {"current_steps": 112, "total_steps": 9134, "loss": 0.7124, "learning_rate": 4.998145315325848e-05, "epoch": 0.012260871945045021, "percentage": 1.23, "elapsed_time": "2:06:22", "remaining_time": "7 days, 1:39:36", "throughput": 2689.54, "total_tokens": 20392736} {"current_steps": 113, "total_steps": 9134, "loss": 0.7671, "learning_rate": 4.998112052290086e-05, "epoch": 0.012370344015982922, "percentage": 1.24, "elapsed_time": "2:07:30", "remaining_time": "7 days, 1:39:40", "throughput": 2692.45, "total_tokens": 20599488} {"current_steps": 114, "total_steps": 9134, "loss": 0.7535, "learning_rate": 4.9980784937324434e-05, "epoch": 0.012479816086920824, "percentage": 1.25, "elapsed_time": "2:08:37", "remaining_time": "7 days, 1:37:17", "throughput": 2690.5, "total_tokens": 20764128} {"current_steps": 115, "total_steps": 9134, "loss": 0.6377, "learning_rate": 4.9980446396568906e-05, "epoch": 0.012589288157858727, "percentage": 1.26, "elapsed_time": "2:09:40", "remaining_time": "7 days, 1:29:54", "throughput": 2687.62, "total_tokens": 20911072} {"current_steps": 116, "total_steps": 9134, "loss": 0.7537, "learning_rate": 4.998010490067432e-05, "epoch": 0.012698760228796629, "percentage": 1.27, "elapsed_time": "2:10:48", "remaining_time": "7 days, 1:29:23", "throughput": 2690.47, "total_tokens": 21116480} {"current_steps": 117, "total_steps": 9134, "loss": 0.8034, "learning_rate": 4.997976044968108e-05, "epoch": 0.01280823229973453, "percentage": 1.28, "elapsed_time": "2:11:52", "remaining_time": "7 days, 1:23:57", "throughput": 2687.23, "total_tokens": 21263872} {"current_steps": 118, "total_steps": 9134, "loss": 0.7566, "learning_rate": 4.997941304362993e-05, "epoch": 0.012917704370672432, "percentage": 1.29, "elapsed_time": "2:13:02", "remaining_time": "7 days, 1:25:17", "throughput": 2686.34, "total_tokens": 21443744} {"current_steps": 119, "total_steps": 9134, "loss": 0.5467, "learning_rate": 4.997906268256197e-05, "epoch": 0.013027176441610335, "percentage": 1.3, "elapsed_time": "2:14:07", "remaining_time": "7 days, 1:21:08", "throughput": 2686.08, "total_tokens": 21616896} {"current_steps": 120, "total_steps": 9134, "loss": 0.8963, "learning_rate": 4.997870936651865e-05, "epoch": 0.013136648512548236, "percentage": 1.31, "elapsed_time": "2:15:16", "remaining_time": "7 days, 1:20:57", "throughput": 2686.93, "total_tokens": 21807520} {"current_steps": 121, "total_steps": 9134, "loss": 0.7902, "learning_rate": 4.9978353095541766e-05, "epoch": 0.013246120583486138, "percentage": 1.32, "elapsed_time": "2:16:24", "remaining_time": "7 days, 1:21:16", "throughput": 2688.08, "total_tokens": 22001728} {"current_steps": 122, "total_steps": 9134, "loss": 0.79, "learning_rate": 4.997799386967345e-05, "epoch": 0.01335559265442404, "percentage": 1.34, "elapsed_time": "2:17:34", "remaining_time": "7 days, 1:22:42", "throughput": 2689.85, "total_tokens": 22203776} {"current_steps": 123, "total_steps": 9134, "loss": 0.7779, "learning_rate": 4.9977631688956215e-05, "epoch": 0.013465064725361941, "percentage": 1.35, "elapsed_time": "2:18:40", "remaining_time": "7 days, 1:19:40", "throughput": 2689.99, "total_tokens": 22382752} {"current_steps": 124, "total_steps": 9134, "loss": 0.7406, "learning_rate": 4.99772665534329e-05, "epoch": 0.013574536796299844, "percentage": 1.36, "elapsed_time": "2:19:47", "remaining_time": "7 days, 1:17:59", "throughput": 2689.16, "total_tokens": 22556576} {"current_steps": 125, "total_steps": 9134, "loss": 0.7324, "learning_rate": 4.9976898463146706e-05, "epoch": 0.013684008867237746, "percentage": 1.37, "elapsed_time": "2:20:54", "remaining_time": "7 days, 1:16:02", "throughput": 2689.59, "total_tokens": 22740256} {"current_steps": 126, "total_steps": 9134, "loss": 0.8445, "learning_rate": 4.997652741814116e-05, "epoch": 0.013793480938175649, "percentage": 1.38, "elapsed_time": "2:22:04", "remaining_time": "7 days, 1:17:41", "throughput": 2690.14, "total_tokens": 22933120} {"current_steps": 127, "total_steps": 9134, "loss": 0.5797, "learning_rate": 4.9976153418460184e-05, "epoch": 0.01390295300911355, "percentage": 1.39, "elapsed_time": "2:23:10", "remaining_time": "7 days, 1:14:20", "throughput": 2687.82, "total_tokens": 23090144} {"current_steps": 128, "total_steps": 9134, "loss": 0.8427, "learning_rate": 4.997577646414799e-05, "epoch": 0.014012425080051452, "percentage": 1.4, "elapsed_time": "2:24:20", "remaining_time": "7 days, 1:16:01", "throughput": 2688.22, "total_tokens": 23281888} {"current_steps": 129, "total_steps": 9134, "loss": 0.8864, "learning_rate": 4.997539655524919e-05, "epoch": 0.014121897150989354, "percentage": 1.41, "elapsed_time": "2:25:30", "remaining_time": "7 days, 1:16:51", "throughput": 2687.34, "total_tokens": 23460640} {"current_steps": 130, "total_steps": 9134, "loss": 0.8312, "learning_rate": 4.997501369180872e-05, "epoch": 0.014231369221927255, "percentage": 1.42, "elapsed_time": "2:26:36", "remaining_time": "7 days, 1:14:30", "throughput": 2687.36, "total_tokens": 23639840} {"current_steps": 131, "total_steps": 9134, "loss": 0.7574, "learning_rate": 4.997462787387188e-05, "epoch": 0.014340841292865157, "percentage": 1.43, "elapsed_time": "2:27:44", "remaining_time": "7 days, 1:13:29", "throughput": 2685.57, "total_tokens": 23806048} {"current_steps": 132, "total_steps": 9134, "loss": 0.6549, "learning_rate": 4.997423910148431e-05, "epoch": 0.01445031336380306, "percentage": 1.45, "elapsed_time": "2:28:50", "remaining_time": "7 days, 1:10:50", "throughput": 2684.31, "total_tokens": 23972928} {"current_steps": 133, "total_steps": 9134, "loss": 0.6969, "learning_rate": 4.9973847374691985e-05, "epoch": 0.014559785434740962, "percentage": 1.46, "elapsed_time": "2:29:58", "remaining_time": "7 days, 1:09:23", "throughput": 2685.22, "total_tokens": 24161984} {"current_steps": 134, "total_steps": 9134, "loss": 0.6144, "learning_rate": 4.997345269354127e-05, "epoch": 0.014669257505678863, "percentage": 1.47, "elapsed_time": "2:31:01", "remaining_time": "7 days, 1:03:57", "throughput": 2682.21, "total_tokens": 24306016} {"current_steps": 135, "total_steps": 9134, "loss": 0.7967, "learning_rate": 4.9973055058078835e-05, "epoch": 0.014778729576616766, "percentage": 1.48, "elapsed_time": "2:32:10", "remaining_time": "7 days, 1:03:28", "throughput": 2682.81, "total_tokens": 24494400} {"current_steps": 136, "total_steps": 9134, "loss": 0.8719, "learning_rate": 4.997265446835172e-05, "epoch": 0.014888201647554668, "percentage": 1.49, "elapsed_time": "2:33:18", "remaining_time": "7 days, 1:03:26", "throughput": 2681.81, "total_tokens": 24669344} {"current_steps": 137, "total_steps": 9134, "loss": 0.7693, "learning_rate": 4.997225092440733e-05, "epoch": 0.014997673718492569, "percentage": 1.5, "elapsed_time": "2:34:27", "remaining_time": "7 days, 1:03:59", "throughput": 2683.09, "total_tokens": 24866688} {"current_steps": 138, "total_steps": 9134, "loss": 0.658, "learning_rate": 4.9971844426293395e-05, "epoch": 0.015107145789430471, "percentage": 1.51, "elapsed_time": "2:35:37", "remaining_time": "7 days, 1:04:26", "throughput": 2682.37, "total_tokens": 25045440} {"current_steps": 139, "total_steps": 9134, "loss": 0.8443, "learning_rate": 4.9971434974058e-05, "epoch": 0.015216617860368374, "percentage": 1.52, "elapsed_time": "2:36:44", "remaining_time": "7 days, 1:03:17", "throughput": 2681.69, "total_tokens": 25220384} {"current_steps": 140, "total_steps": 9134, "loss": 0.6314, "learning_rate": 4.997102256774959e-05, "epoch": 0.015326089931306276, "percentage": 1.53, "elapsed_time": "2:37:51", "remaining_time": "7 days, 1:00:58", "throughput": 2681.15, "total_tokens": 25393760} {"current_steps": 141, "total_steps": 9134, "loss": 0.7165, "learning_rate": 4.997060720741694e-05, "epoch": 0.015435562002244177, "percentage": 1.54, "elapsed_time": "2:38:54", "remaining_time": "7 days, 0:55:23", "throughput": 2680.57, "total_tokens": 25558400} {"current_steps": 142, "total_steps": 9134, "loss": 0.7813, "learning_rate": 4.9970188893109194e-05, "epoch": 0.01554503407318208, "percentage": 1.55, "elapsed_time": "2:40:04", "remaining_time": "7 days, 0:56:37", "throughput": 2680.6, "total_tokens": 25745888} {"current_steps": 143, "total_steps": 9134, "loss": 0.7194, "learning_rate": 4.996976762487584e-05, "epoch": 0.015654506144119982, "percentage": 1.57, "elapsed_time": "2:41:05", "remaining_time": "7 days, 0:48:22", "throughput": 2677.28, "total_tokens": 25876928} {"current_steps": 144, "total_steps": 9134, "loss": 0.7349, "learning_rate": 4.996934340276671e-05, "epoch": 0.015763978215057883, "percentage": 1.58, "elapsed_time": "2:42:09", "remaining_time": "7 days, 0:43:24", "throughput": 2675.07, "total_tokens": 26026560} {"current_steps": 145, "total_steps": 9134, "loss": 0.8035, "learning_rate": 4.996891622683199e-05, "epoch": 0.015873450285995787, "percentage": 1.59, "elapsed_time": "2:43:18", "remaining_time": "7 days, 0:43:48", "throughput": 2677.21, "total_tokens": 26232192} {"current_steps": 146, "total_steps": 9134, "loss": 0.8288, "learning_rate": 4.99684860971222e-05, "epoch": 0.015982922356933688, "percentage": 1.6, "elapsed_time": "2:44:24", "remaining_time": "7 days, 0:40:53", "throughput": 2676.81, "total_tokens": 26404448} {"current_steps": 147, "total_steps": 9134, "loss": 0.7917, "learning_rate": 4.996805301368825e-05, "epoch": 0.01609239442787159, "percentage": 1.61, "elapsed_time": "2:45:32", "remaining_time": "7 days, 0:40:56", "throughput": 2677.64, "total_tokens": 26596640} {"current_steps": 148, "total_steps": 9134, "loss": 0.9584, "learning_rate": 4.9967616976581354e-05, "epoch": 0.016201866498809493, "percentage": 1.62, "elapsed_time": "2:46:42", "remaining_time": "7 days, 0:41:55", "throughput": 2678.05, "total_tokens": 26787264} {"current_steps": 149, "total_steps": 9134, "loss": 0.4423, "learning_rate": 4.99671779858531e-05, "epoch": 0.016311338569747393, "percentage": 1.63, "elapsed_time": "2:47:48", "remaining_time": "7 days, 0:39:01", "throughput": 2677.18, "total_tokens": 26954816} {"current_steps": 150, "total_steps": 9134, "loss": 0.6417, "learning_rate": 4.996673604155542e-05, "epoch": 0.016420810640685294, "percentage": 1.64, "elapsed_time": "2:48:54", "remaining_time": "7 days, 0:36:15", "throughput": 2678.22, "total_tokens": 27141856} {"current_steps": 151, "total_steps": 9134, "loss": 0.8161, "learning_rate": 4.9966291143740595e-05, "epoch": 0.016530282711623198, "percentage": 1.65, "elapsed_time": "2:50:04", "remaining_time": "7 days, 0:37:53", "throughput": 2680.06, "total_tokens": 27349056} {"current_steps": 152, "total_steps": 9134, "loss": 0.6427, "learning_rate": 4.996584329246126e-05, "epoch": 0.0166397547825611, "percentage": 1.66, "elapsed_time": "2:51:14", "remaining_time": "7 days, 0:39:23", "throughput": 2682.41, "total_tokens": 27561408} {"current_steps": 153, "total_steps": 9134, "loss": 0.8038, "learning_rate": 4.996539248777038e-05, "epoch": 0.016749226853499, "percentage": 1.68, "elapsed_time": "2:52:22", "remaining_time": "7 days, 0:38:41", "throughput": 2684.24, "total_tokens": 27762784} {"current_steps": 154, "total_steps": 9134, "loss": 0.74, "learning_rate": 4.99649387297213e-05, "epoch": 0.016858698924436904, "percentage": 1.69, "elapsed_time": "2:53:29", "remaining_time": "7 days, 0:36:53", "throughput": 2685.38, "total_tokens": 27954304} {"current_steps": 155, "total_steps": 9134, "loss": 0.8268, "learning_rate": 4.996448201836769e-05, "epoch": 0.016968170995374805, "percentage": 1.7, "elapsed_time": "2:54:36", "remaining_time": "7 days, 0:35:13", "throughput": 2684.6, "total_tokens": 28126112} {"current_steps": 156, "total_steps": 9134, "loss": 0.682, "learning_rate": 4.9964022353763586e-05, "epoch": 0.017077643066312705, "percentage": 1.71, "elapsed_time": "2:55:44", "remaining_time": "7 days, 0:34:17", "throughput": 2686.22, "total_tokens": 28325248} {"current_steps": 157, "total_steps": 9134, "loss": 0.6126, "learning_rate": 4.996355973596336e-05, "epoch": 0.01718711513725061, "percentage": 1.72, "elapsed_time": "2:56:47", "remaining_time": "7 days, 0:28:50", "throughput": 2685.54, "total_tokens": 28487424} {"current_steps": 158, "total_steps": 9134, "loss": 0.8077, "learning_rate": 4.996309416502174e-05, "epoch": 0.01729658720818851, "percentage": 1.73, "elapsed_time": "2:57:54", "remaining_time": "7 days, 0:27:16", "throughput": 2685.85, "total_tokens": 28670880} {"current_steps": 159, "total_steps": 9134, "loss": 0.6373, "learning_rate": 4.99626256409938e-05, "epoch": 0.017406059279126414, "percentage": 1.74, "elapsed_time": "2:59:00", "remaining_time": "7 days, 0:24:49", "throughput": 2684.76, "total_tokens": 28836864} {"current_steps": 160, "total_steps": 9134, "loss": 0.6675, "learning_rate": 4.996215416393496e-05, "epoch": 0.017515531350064315, "percentage": 1.75, "elapsed_time": "3:00:10", "remaining_time": "7 days, 0:25:40", "throughput": 2685.05, "total_tokens": 29027040} {"current_steps": 161, "total_steps": 9134, "loss": 0.6027, "learning_rate": 4.996167973390101e-05, "epoch": 0.017625003421002216, "percentage": 1.76, "elapsed_time": "3:01:20", "remaining_time": "7 days, 0:26:43", "throughput": 2685.6, "total_tokens": 29220800} {"current_steps": 162, "total_steps": 9134, "loss": 0.7717, "learning_rate": 4.996120235094807e-05, "epoch": 0.01773447549194012, "percentage": 1.77, "elapsed_time": "3:02:29", "remaining_time": "7 days, 0:26:39", "throughput": 2685.32, "total_tokens": 29402240} {"current_steps": 163, "total_steps": 9134, "loss": 0.753, "learning_rate": 4.99607220151326e-05, "epoch": 0.01784394756287802, "percentage": 1.78, "elapsed_time": "3:03:38", "remaining_time": "7 days, 0:27:12", "throughput": 2686.8, "total_tokens": 29604960} {"current_steps": 164, "total_steps": 9134, "loss": 0.6594, "learning_rate": 4.9960238726511435e-05, "epoch": 0.01795341963381592, "percentage": 1.8, "elapsed_time": "3:04:46", "remaining_time": "7 days, 0:26:01", "throughput": 2686.72, "total_tokens": 29785504} {"current_steps": 165, "total_steps": 9134, "loss": 0.6007, "learning_rate": 4.995975248514175e-05, "epoch": 0.018062891704753826, "percentage": 1.81, "elapsed_time": "3:05:51", "remaining_time": "7 days, 0:23:14", "throughput": 2685.24, "total_tokens": 29945664} {"current_steps": 166, "total_steps": 9134, "loss": 0.5952, "learning_rate": 4.995926329108106e-05, "epoch": 0.018172363775691727, "percentage": 1.82, "elapsed_time": "3:06:59", "remaining_time": "7 days, 0:22:04", "throughput": 2685.3, "total_tokens": 30127776} {"current_steps": 167, "total_steps": 9134, "loss": 0.6946, "learning_rate": 4.995877114438723e-05, "epoch": 0.018281835846629627, "percentage": 1.83, "elapsed_time": "3:08:03", "remaining_time": "7 days, 0:18:00", "throughput": 2685.1, "total_tokens": 30298240} {"current_steps": 168, "total_steps": 9134, "loss": 0.641, "learning_rate": 4.995827604511849e-05, "epoch": 0.01839130791756753, "percentage": 1.84, "elapsed_time": "3:09:09", "remaining_time": "7 days, 0:15:12", "throughput": 2684.41, "total_tokens": 30466688} {"current_steps": 169, "total_steps": 9134, "loss": 0.8853, "learning_rate": 4.995777799333341e-05, "epoch": 0.018500779988505432, "percentage": 1.85, "elapsed_time": "3:10:17", "remaining_time": "7 days, 0:14:39", "throughput": 2686.65, "total_tokens": 30675456} {"current_steps": 170, "total_steps": 9134, "loss": 0.9814, "learning_rate": 4.99572769890909e-05, "epoch": 0.018610252059443333, "percentage": 1.86, "elapsed_time": "3:11:23", "remaining_time": "7 days, 0:12:08", "throughput": 2685.53, "total_tokens": 30839872} {"current_steps": 171, "total_steps": 9134, "loss": 0.7272, "learning_rate": 4.9956773032450234e-05, "epoch": 0.018719724130381237, "percentage": 1.87, "elapsed_time": "3:12:31", "remaining_time": "7 days, 0:10:56", "throughput": 2684.43, "total_tokens": 31008320} {"current_steps": 172, "total_steps": 9134, "loss": 0.6521, "learning_rate": 4.995626612347103e-05, "epoch": 0.018829196201319138, "percentage": 1.88, "elapsed_time": "3:13:40", "remaining_time": "7 days, 0:11:05", "throughput": 2682.16, "total_tokens": 31167136} {"current_steps": 173, "total_steps": 9134, "loss": 0.5594, "learning_rate": 4.995575626221325e-05, "epoch": 0.018938668272257042, "percentage": 1.89, "elapsed_time": "3:14:48", "remaining_time": "7 days, 0:10:45", "throughput": 2683.65, "total_tokens": 31368288} {"current_steps": 174, "total_steps": 9134, "loss": 0.6103, "learning_rate": 4.995524344873721e-05, "epoch": 0.019048140343194943, "percentage": 1.9, "elapsed_time": "3:15:54", "remaining_time": "7 days, 0:08:15", "throughput": 2683.65, "total_tokens": 31545248} {"current_steps": 175, "total_steps": 9134, "loss": 0.6036, "learning_rate": 4.9954727683103576e-05, "epoch": 0.019157612414132844, "percentage": 1.92, "elapsed_time": "3:16:57", "remaining_time": "7 days, 0:03:08", "throughput": 2681.57, "total_tokens": 31689504} {"current_steps": 176, "total_steps": 9134, "loss": 0.6305, "learning_rate": 4.995420896537336e-05, "epoch": 0.019267084485070748, "percentage": 1.93, "elapsed_time": "3:18:02", "remaining_time": "6 days, 23:59:46", "throughput": 2679.94, "total_tokens": 31844064} {"current_steps": 177, "total_steps": 9134, "loss": 0.8005, "learning_rate": 4.995368729560793e-05, "epoch": 0.01937655655600865, "percentage": 1.94, "elapsed_time": "3:19:12", "remaining_time": "7 days, 0:00:36", "throughput": 2681.47, "total_tokens": 32049472} {"current_steps": 178, "total_steps": 9134, "loss": 0.835, "learning_rate": 4.9953162673869005e-05, "epoch": 0.01948602862694655, "percentage": 1.95, "elapsed_time": "3:20:18", "remaining_time": "6 days, 23:58:35", "throughput": 2680.26, "total_tokens": 32213216} {"current_steps": 179, "total_steps": 9134, "loss": 0.7817, "learning_rate": 4.9952635100218623e-05, "epoch": 0.019595500697884453, "percentage": 1.96, "elapsed_time": "3:21:25", "remaining_time": "6 days, 23:56:54", "throughput": 2679.48, "total_tokens": 32383008} {"current_steps": 180, "total_steps": 9134, "loss": 0.7382, "learning_rate": 4.995210457471922e-05, "epoch": 0.019704972768822354, "percentage": 1.97, "elapsed_time": "3:22:35", "remaining_time": "6 days, 23:57:30", "throughput": 2682.13, "total_tokens": 32601632} {"current_steps": 181, "total_steps": 9134, "loss": 0.6084, "learning_rate": 4.995157109743354e-05, "epoch": 0.019814444839760255, "percentage": 1.98, "elapsed_time": "3:23:40", "remaining_time": "6 days, 23:54:36", "throughput": 2682.35, "total_tokens": 32779712} {"current_steps": 182, "total_steps": 9134, "loss": 0.887, "learning_rate": 4.99510346684247e-05, "epoch": 0.01992391691069816, "percentage": 1.99, "elapsed_time": "3:24:48", "remaining_time": "6 days, 23:54:09", "throughput": 2681.84, "total_tokens": 32956672} {"current_steps": 183, "total_steps": 9134, "loss": 0.867, "learning_rate": 4.995049528775616e-05, "epoch": 0.02003338898163606, "percentage": 2.0, "elapsed_time": "3:25:56", "remaining_time": "6 days, 23:52:52", "throughput": 2682.07, "total_tokens": 33140128} {"current_steps": 184, "total_steps": 9134, "loss": 0.6597, "learning_rate": 4.994995295549173e-05, "epoch": 0.02014286105257396, "percentage": 2.01, "elapsed_time": "3:27:00", "remaining_time": "6 days, 23:48:49", "throughput": 2680.35, "total_tokens": 33290208} {"current_steps": 185, "total_steps": 9134, "loss": 1.0128, "learning_rate": 4.9949407671695554e-05, "epoch": 0.020252333123511865, "percentage": 2.03, "elapsed_time": "3:28:09", "remaining_time": "6 days, 23:49:16", "throughput": 2683.16, "total_tokens": 33511520} {"current_steps": 186, "total_steps": 9134, "loss": 0.7103, "learning_rate": 4.994885943643215e-05, "epoch": 0.020361805194449765, "percentage": 2.04, "elapsed_time": "3:29:18", "remaining_time": "6 days, 23:49:23", "throughput": 2683.68, "total_tokens": 33703264} {"current_steps": 187, "total_steps": 9134, "loss": 0.8895, "learning_rate": 4.994830824976636e-05, "epoch": 0.02047127726538767, "percentage": 2.05, "elapsed_time": "3:30:22", "remaining_time": "6 days, 23:45:12", "throughput": 2682.17, "total_tokens": 33855136} {"current_steps": 188, "total_steps": 9134, "loss": 0.7295, "learning_rate": 4.99477541117634e-05, "epoch": 0.02058074933632557, "percentage": 2.06, "elapsed_time": "3:31:30", "remaining_time": "6 days, 23:44:53", "throughput": 2684.37, "total_tokens": 34066816} {"current_steps": 189, "total_steps": 9134, "loss": 0.5532, "learning_rate": 4.994719702248883e-05, "epoch": 0.02069022140726347, "percentage": 2.07, "elapsed_time": "3:32:40", "remaining_time": "6 days, 23:45:29", "throughput": 2685.56, "total_tokens": 34269088} {"current_steps": 190, "total_steps": 9134, "loss": 0.7301, "learning_rate": 4.9946636982008534e-05, "epoch": 0.020799693478201375, "percentage": 2.08, "elapsed_time": "3:33:46", "remaining_time": "6 days, 23:43:05", "throughput": 2686.47, "total_tokens": 34457696} {"current_steps": 191, "total_steps": 9134, "loss": 0.8629, "learning_rate": 4.994607399038877e-05, "epoch": 0.020909165549139276, "percentage": 2.09, "elapsed_time": "3:34:49", "remaining_time": "6 days, 23:38:36", "throughput": 2686.35, "total_tokens": 34625920} {"current_steps": 192, "total_steps": 9134, "loss": 0.63, "learning_rate": 4.9945508047696154e-05, "epoch": 0.021018637620077177, "percentage": 2.1, "elapsed_time": "3:35:57", "remaining_time": "6 days, 23:37:37", "throughput": 2687.53, "total_tokens": 34823040} {"current_steps": 193, "total_steps": 9134, "loss": 0.6346, "learning_rate": 4.9944939153997614e-05, "epoch": 0.02112810969101508, "percentage": 2.11, "elapsed_time": "3:37:03", "remaining_time": "6 days, 23:35:13", "throughput": 2687.72, "total_tokens": 35002464} {"current_steps": 194, "total_steps": 9134, "loss": 0.7864, "learning_rate": 4.994436730936046e-05, "epoch": 0.021237581761952982, "percentage": 2.12, "elapsed_time": "3:38:10", "remaining_time": "6 days, 23:34:22", "throughput": 2688.85, "total_tokens": 35199584} {"current_steps": 195, "total_steps": 9134, "loss": 0.6279, "learning_rate": 4.994379251385235e-05, "epoch": 0.021347053832890883, "percentage": 2.13, "elapsed_time": "3:39:20", "remaining_time": "6 days, 23:34:49", "throughput": 2690.95, "total_tokens": 35414176} {"current_steps": 196, "total_steps": 9134, "loss": 0.7367, "learning_rate": 4.9943214767541255e-05, "epoch": 0.021456525903828787, "percentage": 2.15, "elapsed_time": "3:40:26", "remaining_time": "6 days, 23:32:57", "throughput": 2691.39, "total_tokens": 35598976} {"current_steps": 197, "total_steps": 9134, "loss": 0.7586, "learning_rate": 4.994263407049554e-05, "epoch": 0.021565997974766687, "percentage": 2.16, "elapsed_time": "3:41:30", "remaining_time": "6 days, 23:28:28", "throughput": 2689.95, "total_tokens": 35749504} {"current_steps": 198, "total_steps": 9134, "loss": 0.797, "learning_rate": 4.9942050422783906e-05, "epoch": 0.021675470045704588, "percentage": 2.17, "elapsed_time": "3:42:37", "remaining_time": "6 days, 23:27:19", "throughput": 2689.85, "total_tokens": 35929600} {"current_steps": 199, "total_steps": 9134, "loss": 0.8002, "learning_rate": 4.994146382447538e-05, "epoch": 0.021784942116642492, "percentage": 2.18, "elapsed_time": "3:43:43", "remaining_time": "6 days, 23:25:15", "throughput": 2689.52, "total_tokens": 36103200} {"current_steps": 200, "total_steps": 9134, "loss": 0.9701, "learning_rate": 4.994087427563936e-05, "epoch": 0.021894414187580393, "percentage": 2.19, "elapsed_time": "3:44:52", "remaining_time": "6 days, 23:25:23", "throughput": 2688.55, "total_tokens": 36276128} {"current_steps": 201, "total_steps": 9134, "loss": 0.7224, "learning_rate": 4.9940281776345596e-05, "epoch": 0.022003886258518294, "percentage": 2.2, "elapsed_time": "3:46:00", "remaining_time": "6 days, 23:24:22", "throughput": 2688.51, "total_tokens": 36457344} {"current_steps": 202, "total_steps": 9134, "loss": 0.6799, "learning_rate": 4.993968632666417e-05, "epoch": 0.022113358329456198, "percentage": 2.21, "elapsed_time": "3:47:06", "remaining_time": "6 days, 23:22:15", "throughput": 2687.94, "total_tokens": 36627360} {"current_steps": 203, "total_steps": 9134, "loss": 0.7229, "learning_rate": 4.993908792666554e-05, "epoch": 0.0222228304003941, "percentage": 2.22, "elapsed_time": "3:48:07", "remaining_time": "6 days, 23:16:14", "throughput": 2685.81, "total_tokens": 36761536} {"current_steps": 204, "total_steps": 9134, "loss": 0.8847, "learning_rate": 4.9938486576420474e-05, "epoch": 0.022332302471332003, "percentage": 2.23, "elapsed_time": "3:49:14", "remaining_time": "6 days, 23:14:48", "throughput": 2685.19, "total_tokens": 36932896} {"current_steps": 205, "total_steps": 9134, "loss": 0.5768, "learning_rate": 4.993788227600013e-05, "epoch": 0.022441774542269904, "percentage": 2.24, "elapsed_time": "3:50:15", "remaining_time": "6 days, 23:08:51", "throughput": 2682.57, "total_tokens": 37059904} {"current_steps": 206, "total_steps": 9134, "loss": 0.6446, "learning_rate": 4.993727502547598e-05, "epoch": 0.022551246613207804, "percentage": 2.26, "elapsed_time": "3:51:22", "remaining_time": "6 days, 23:08:04", "throughput": 2682.67, "total_tokens": 37243360} {"current_steps": 207, "total_steps": 9134, "loss": 0.5917, "learning_rate": 4.9936664824919865e-05, "epoch": 0.02266071868414571, "percentage": 2.27, "elapsed_time": "3:52:29", "remaining_time": "6 days, 23:06:03", "throughput": 2683.68, "total_tokens": 37434880} {"current_steps": 208, "total_steps": 9134, "loss": 0.7557, "learning_rate": 4.993605167440397e-05, "epoch": 0.02277019075508361, "percentage": 2.28, "elapsed_time": "3:53:36", "remaining_time": "6 days, 23:04:36", "throughput": 2685.37, "total_tokens": 37638272} {"current_steps": 209, "total_steps": 9134, "loss": 0.6493, "learning_rate": 4.9935435574000834e-05, "epoch": 0.02287966282602151, "percentage": 2.29, "elapsed_time": "3:54:40", "remaining_time": "6 days, 23:01:07", "throughput": 2684.37, "total_tokens": 37796192} {"current_steps": 210, "total_steps": 9134, "loss": 0.6706, "learning_rate": 4.993481652378334e-05, "epoch": 0.022989134896959414, "percentage": 2.3, "elapsed_time": "3:55:41", "remaining_time": "6 days, 22:55:36", "throughput": 2683.12, "total_tokens": 37942688} {"current_steps": 211, "total_steps": 9134, "loss": 0.7749, "learning_rate": 4.9934194523824715e-05, "epoch": 0.023098606967897315, "percentage": 2.31, "elapsed_time": "3:56:47", "remaining_time": "6 days, 22:54:03", "throughput": 2683.92, "total_tokens": 38133088} {"current_steps": 212, "total_steps": 9134, "loss": 0.7671, "learning_rate": 4.993356957419855e-05, "epoch": 0.023208079038835216, "percentage": 2.32, "elapsed_time": "3:57:52", "remaining_time": "6 days, 22:51:02", "throughput": 2684.55, "total_tokens": 38315648} {"current_steps": 213, "total_steps": 9134, "loss": 0.7319, "learning_rate": 4.993294167497876e-05, "epoch": 0.02331755110977312, "percentage": 2.33, "elapsed_time": "3:58:56", "remaining_time": "6 days, 22:47:50", "throughput": 2684.61, "total_tokens": 38489248} {"current_steps": 214, "total_steps": 9134, "loss": 0.6718, "learning_rate": 4.993231082623965e-05, "epoch": 0.02342702318071102, "percentage": 2.34, "elapsed_time": "4:00:06", "remaining_time": "6 days, 22:48:05", "throughput": 2686.95, "total_tokens": 38708992} {"current_steps": 215, "total_steps": 9134, "loss": 0.7682, "learning_rate": 4.993167702805581e-05, "epoch": 0.02353649525164892, "percentage": 2.35, "elapsed_time": "4:01:10", "remaining_time": "6 days, 22:44:41", "throughput": 2686.55, "total_tokens": 38875200} {"current_steps": 216, "total_steps": 9134, "loss": 0.6635, "learning_rate": 4.9931040280502255e-05, "epoch": 0.023645967322586826, "percentage": 2.36, "elapsed_time": "4:02:15", "remaining_time": "6 days, 22:42:21", "throughput": 2686.12, "total_tokens": 39044992} {"current_steps": 217, "total_steps": 9134, "loss": 0.652, "learning_rate": 4.993040058365429e-05, "epoch": 0.023755439393524726, "percentage": 2.38, "elapsed_time": "4:03:21", "remaining_time": "6 days, 22:40:22", "throughput": 2685.17, "total_tokens": 39208512} {"current_steps": 218, "total_steps": 9134, "loss": 0.8437, "learning_rate": 4.992975793758759e-05, "epoch": 0.02386491146446263, "percentage": 2.39, "elapsed_time": "4:04:30", "remaining_time": "6 days, 22:39:54", "throughput": 2685.92, "total_tokens": 39402720} {"current_steps": 219, "total_steps": 9134, "loss": 0.9123, "learning_rate": 4.9929112342378194e-05, "epoch": 0.02397438353540053, "percentage": 2.4, "elapsed_time": "4:05:38", "remaining_time": "6 days, 22:39:50", "throughput": 2686.02, "total_tokens": 39589088} {"current_steps": 220, "total_steps": 9134, "loss": 0.8507, "learning_rate": 4.9928463798102456e-05, "epoch": 0.024083855606338432, "percentage": 2.41, "elapsed_time": "4:06:47", "remaining_time": "6 days, 22:39:51", "throughput": 2686.45, "total_tokens": 39780832} {"current_steps": 221, "total_steps": 9134, "loss": 0.7906, "learning_rate": 4.992781230483711e-05, "epoch": 0.024193327677276336, "percentage": 2.42, "elapsed_time": "4:07:54", "remaining_time": "6 days, 22:37:56", "throughput": 2686.81, "total_tokens": 39963840} {"current_steps": 222, "total_steps": 9134, "loss": 0.7648, "learning_rate": 4.9927157862659215e-05, "epoch": 0.024302799748214237, "percentage": 2.43, "elapsed_time": "4:09:03", "remaining_time": "6 days, 22:38:03", "throughput": 2687.96, "total_tokens": 40166784} {"current_steps": 223, "total_steps": 9134, "loss": 0.8414, "learning_rate": 4.992650047164621e-05, "epoch": 0.024412271819152138, "percentage": 2.44, "elapsed_time": "4:10:08", "remaining_time": "6 days, 22:35:42", "throughput": 2688.5, "total_tokens": 40350912} {"current_steps": 224, "total_steps": 9134, "loss": 0.6663, "learning_rate": 4.9925840131875845e-05, "epoch": 0.024521743890090042, "percentage": 2.45, "elapsed_time": "4:11:16", "remaining_time": "6 days, 22:35:11", "throughput": 2689.08, "total_tokens": 40543104} {"current_steps": 225, "total_steps": 9134, "loss": 0.708, "learning_rate": 4.9925176843426236e-05, "epoch": 0.024631215961027943, "percentage": 2.46, "elapsed_time": "4:12:20", "remaining_time": "6 days, 22:31:46", "throughput": 2689.15, "total_tokens": 40715808} {"current_steps": 226, "total_steps": 9134, "loss": 0.7908, "learning_rate": 4.9924510606375864e-05, "epoch": 0.024740688031965843, "percentage": 2.47, "elapsed_time": "4:13:28", "remaining_time": "6 days, 22:31:08", "throughput": 2690.87, "total_tokens": 40924800} {"current_steps": 227, "total_steps": 9134, "loss": 0.6441, "learning_rate": 4.992384142080353e-05, "epoch": 0.024850160102903748, "percentage": 2.49, "elapsed_time": "4:14:36", "remaining_time": "6 days, 22:30:03", "throughput": 2691.14, "total_tokens": 41110272} {"current_steps": 228, "total_steps": 9134, "loss": 0.722, "learning_rate": 4.99231692867884e-05, "epoch": 0.02495963217384165, "percentage": 2.5, "elapsed_time": "4:15:43", "remaining_time": "6 days, 22:29:15", "throughput": 2691.91, "total_tokens": 41304480} {"current_steps": 229, "total_steps": 9134, "loss": 0.8136, "learning_rate": 4.9922494204409994e-05, "epoch": 0.02506910424477955, "percentage": 2.51, "elapsed_time": "4:16:49", "remaining_time": "6 days, 22:27:18", "throughput": 2691.42, "total_tokens": 41474720} {"current_steps": 230, "total_steps": 9134, "loss": 0.7715, "learning_rate": 4.9921816173748166e-05, "epoch": 0.025178576315717453, "percentage": 2.52, "elapsed_time": "4:17:55", "remaining_time": "6 days, 22:25:09", "throughput": 2691.03, "total_tokens": 41645408} {"current_steps": 231, "total_steps": 9134, "loss": 0.7798, "learning_rate": 4.9921135194883126e-05, "epoch": 0.025288048386655354, "percentage": 2.53, "elapsed_time": "4:19:02", "remaining_time": "6 days, 22:23:37", "throughput": 2691.27, "total_tokens": 41828416} {"current_steps": 232, "total_steps": 9134, "loss": 0.7704, "learning_rate": 4.992045126789543e-05, "epoch": 0.025397520457593258, "percentage": 2.54, "elapsed_time": "4:20:04", "remaining_time": "6 days, 22:19:15", "throughput": 2691.09, "total_tokens": 41993056} {"current_steps": 233, "total_steps": 9134, "loss": 0.761, "learning_rate": 4.9919764392865994e-05, "epoch": 0.02550699252853116, "percentage": 2.55, "elapsed_time": "4:21:10", "remaining_time": "6 days, 22:17:08", "throughput": 2690.85, "total_tokens": 42166208} {"current_steps": 234, "total_steps": 9134, "loss": 0.8806, "learning_rate": 4.9919074569876066e-05, "epoch": 0.02561646459946906, "percentage": 2.56, "elapsed_time": "4:22:17", "remaining_time": "6 days, 22:16:01", "throughput": 2692.97, "total_tokens": 42380576} {"current_steps": 235, "total_steps": 9134, "loss": 0.646, "learning_rate": 4.991838179900726e-05, "epoch": 0.025725936670406964, "percentage": 2.57, "elapsed_time": "4:23:25", "remaining_time": "6 days, 22:15:32", "throughput": 2693.36, "total_tokens": 42570528} {"current_steps": 236, "total_steps": 9134, "loss": 0.8508, "learning_rate": 4.991768608034152e-05, "epoch": 0.025835408741344865, "percentage": 2.58, "elapsed_time": "4:24:34", "remaining_time": "6 days, 22:15:12", "throughput": 2694.25, "total_tokens": 42769216} {"current_steps": 237, "total_steps": 9134, "loss": 0.7227, "learning_rate": 4.991698741396115e-05, "epoch": 0.025944880812282765, "percentage": 2.59, "elapsed_time": "4:25:41", "remaining_time": "6 days, 22:13:51", "throughput": 2693.3, "total_tokens": 42934304} {"current_steps": 238, "total_steps": 9134, "loss": 0.5724, "learning_rate": 4.991628579994879e-05, "epoch": 0.02605435288322067, "percentage": 2.61, "elapsed_time": "4:26:46", "remaining_time": "6 days, 22:11:51", "throughput": 2693.61, "total_tokens": 43116640} {"current_steps": 239, "total_steps": 9134, "loss": 0.7538, "learning_rate": 4.9915581238387464e-05, "epoch": 0.02616382495415857, "percentage": 2.62, "elapsed_time": "4:27:53", "remaining_time": "6 days, 22:10:02", "throughput": 2693.75, "total_tokens": 43296960} {"current_steps": 240, "total_steps": 9134, "loss": 0.7266, "learning_rate": 4.991487372936051e-05, "epoch": 0.02627329702509647, "percentage": 2.63, "elapsed_time": "4:28:59", "remaining_time": "6 days, 22:08:05", "throughput": 2693.56, "total_tokens": 43471456} {"current_steps": 241, "total_steps": 9134, "loss": 0.7425, "learning_rate": 4.991416327295162e-05, "epoch": 0.026382769096034375, "percentage": 2.64, "elapsed_time": "4:30:03", "remaining_time": "6 days, 22:05:02", "throughput": 2692.62, "total_tokens": 43628928} {"current_steps": 242, "total_steps": 9134, "loss": 0.7924, "learning_rate": 4.9913449869244844e-05, "epoch": 0.026492241166972276, "percentage": 2.65, "elapsed_time": "4:31:11", "remaining_time": "6 days, 22:04:40", "throughput": 2693.5, "total_tokens": 43827616} {"current_steps": 243, "total_steps": 9134, "loss": 0.6683, "learning_rate": 4.991273351832457e-05, "epoch": 0.026601713237910177, "percentage": 2.66, "elapsed_time": "4:32:13", "remaining_time": "6 days, 22:00:29", "throughput": 2692.79, "total_tokens": 43983520} {"current_steps": 244, "total_steps": 9134, "loss": 0.6728, "learning_rate": 4.991201422027556e-05, "epoch": 0.02671118530884808, "percentage": 2.67, "elapsed_time": "4:33:18", "remaining_time": "6 days, 21:58:04", "throughput": 2693.51, "total_tokens": 44170560} {"current_steps": 245, "total_steps": 9134, "loss": 0.6634, "learning_rate": 4.991129197518287e-05, "epoch": 0.02682065737978598, "percentage": 2.68, "elapsed_time": "4:34:22", "remaining_time": "6 days, 21:54:29", "throughput": 2693.36, "total_tokens": 44338112} {"current_steps": 246, "total_steps": 9134, "loss": 0.8105, "learning_rate": 4.991056678313197e-05, "epoch": 0.026930129450723882, "percentage": 2.69, "elapsed_time": "4:35:25", "remaining_time": "6 days, 21:50:53", "throughput": 2692.82, "total_tokens": 44499168} {"current_steps": 247, "total_steps": 9134, "loss": 0.8705, "learning_rate": 4.990983864420865e-05, "epoch": 0.027039601521661787, "percentage": 2.7, "elapsed_time": "4:36:34", "remaining_time": "6 days, 21:51:00", "throughput": 2694.56, "total_tokens": 44714432} {"current_steps": 248, "total_steps": 9134, "loss": 0.7122, "learning_rate": 4.990910755849903e-05, "epoch": 0.027149073592599687, "percentage": 2.72, "elapsed_time": "4:37:40", "remaining_time": "6 days, 21:49:11", "throughput": 2694.19, "total_tokens": 44886240} {"current_steps": 249, "total_steps": 9134, "loss": 0.7587, "learning_rate": 4.99083735260896e-05, "epoch": 0.02725854566353759, "percentage": 2.73, "elapsed_time": "4:38:42", "remaining_time": "6 days, 21:45:11", "throughput": 2692.43, "total_tokens": 45024672} {"current_steps": 250, "total_steps": 9134, "loss": 0.7149, "learning_rate": 4.990763654706721e-05, "epoch": 0.027368017734475492, "percentage": 2.74, "elapsed_time": "4:39:48", "remaining_time": "6 days, 21:43:29", "throughput": 2691.89, "total_tokens": 45193792} {"current_steps": 251, "total_steps": 9134, "loss": 0.6512, "learning_rate": 4.990689662151903e-05, "epoch": 0.027477489805413393, "percentage": 2.75, "elapsed_time": "4:40:52", "remaining_time": "6 days, 21:40:01", "throughput": 2691.71, "total_tokens": 45360896} {"current_steps": 252, "total_steps": 9134, "loss": 0.6943, "learning_rate": 4.990615374953258e-05, "epoch": 0.027586961876351297, "percentage": 2.76, "elapsed_time": "4:41:55", "remaining_time": "6 days, 21:36:30", "throughput": 2691.89, "total_tokens": 45533600} {"current_steps": 253, "total_steps": 9134, "loss": 0.7342, "learning_rate": 4.990540793119577e-05, "epoch": 0.027696433947289198, "percentage": 2.77, "elapsed_time": "4:43:02", "remaining_time": "6 days, 21:35:26", "throughput": 2693.01, "total_tokens": 45733632} {"current_steps": 254, "total_steps": 9134, "loss": 0.7208, "learning_rate": 4.99046591665968e-05, "epoch": 0.0278059060182271, "percentage": 2.78, "elapsed_time": "4:44:11", "remaining_time": "6 days, 21:35:21", "throughput": 2693.74, "total_tokens": 45931648} {"current_steps": 255, "total_steps": 9134, "loss": 0.641, "learning_rate": 4.990390745582427e-05, "epoch": 0.027915378089165003, "percentage": 2.79, "elapsed_time": "4:45:19", "remaining_time": "6 days, 21:35:06", "throughput": 2694.37, "total_tokens": 46127200} {"current_steps": 256, "total_steps": 9134, "loss": 0.7197, "learning_rate": 4.990315279896709e-05, "epoch": 0.028024850160102904, "percentage": 2.8, "elapsed_time": "4:46:26", "remaining_time": "6 days, 21:33:48", "throughput": 2693.38, "total_tokens": 46290272} {"current_steps": 257, "total_steps": 9134, "loss": 0.7023, "learning_rate": 4.990239519611454e-05, "epoch": 0.028134322231040804, "percentage": 2.81, "elapsed_time": "4:47:30", "remaining_time": "6 days, 21:30:48", "throughput": 2692.9, "total_tokens": 46454016} {"current_steps": 258, "total_steps": 9134, "loss": 0.6438, "learning_rate": 4.990163464735624e-05, "epoch": 0.02824379430197871, "percentage": 2.82, "elapsed_time": "4:48:35", "remaining_time": "6 days, 21:28:29", "throughput": 2692.05, "total_tokens": 46614400} {"current_steps": 259, "total_steps": 9134, "loss": 0.7123, "learning_rate": 4.990087115278218e-05, "epoch": 0.02835326637291661, "percentage": 2.84, "elapsed_time": "4:49:45", "remaining_time": "6 days, 21:29:01", "throughput": 2693.94, "total_tokens": 46835712} {"current_steps": 260, "total_steps": 9134, "loss": 0.678, "learning_rate": 4.9900104712482656e-05, "epoch": 0.02846273844385451, "percentage": 2.85, "elapsed_time": "4:50:48", "remaining_time": "6 days, 21:25:26", "throughput": 2693.72, "total_tokens": 47001024} {"current_steps": 261, "total_steps": 9134, "loss": 0.9007, "learning_rate": 4.9899335326548346e-05, "epoch": 0.028572210514792414, "percentage": 2.86, "elapsed_time": "4:51:56", "remaining_time": "6 days, 21:25:06", "throughput": 2694.13, "total_tokens": 47192768} {"current_steps": 262, "total_steps": 9134, "loss": 0.7573, "learning_rate": 4.9898562995070264e-05, "epoch": 0.028681682585730315, "percentage": 2.87, "elapsed_time": "4:53:03", "remaining_time": "6 days, 21:23:32", "throughput": 2695.09, "total_tokens": 47388320} {"current_steps": 263, "total_steps": 9134, "loss": 0.7314, "learning_rate": 4.9897787718139774e-05, "epoch": 0.02879115465666822, "percentage": 2.88, "elapsed_time": "4:54:10", "remaining_time": "6 days, 21:22:16", "throughput": 2695.33, "total_tokens": 47572672} {"current_steps": 264, "total_steps": 9134, "loss": 0.8009, "learning_rate": 4.98970094958486e-05, "epoch": 0.02890062672760612, "percentage": 2.89, "elapsed_time": "4:55:19", "remaining_time": "6 days, 21:22:35", "throughput": 2696.65, "total_tokens": 47783904} {"current_steps": 265, "total_steps": 9134, "loss": 0.6173, "learning_rate": 4.98962283282888e-05, "epoch": 0.02901009879854402, "percentage": 2.9, "elapsed_time": "4:56:25", "remaining_time": "6 days, 21:20:58", "throughput": 2697.71, "total_tokens": 47981248} {"current_steps": 266, "total_steps": 9134, "loss": 0.7067, "learning_rate": 4.989544421555278e-05, "epoch": 0.029119570869481925, "percentage": 2.91, "elapsed_time": "4:57:34", "remaining_time": "6 days, 21:20:49", "throughput": 2698.98, "total_tokens": 48189792} {"current_steps": 267, "total_steps": 9134, "loss": 0.724, "learning_rate": 4.989465715773331e-05, "epoch": 0.029229042940419826, "percentage": 2.92, "elapsed_time": "4:58:41", "remaining_time": "6 days, 21:19:31", "throughput": 2699.01, "total_tokens": 48370560} {"current_steps": 268, "total_steps": 9134, "loss": 0.7957, "learning_rate": 4.989386715492347e-05, "epoch": 0.029338515011357726, "percentage": 2.93, "elapsed_time": "4:59:46", "remaining_time": "6 days, 21:17:26", "throughput": 2698.32, "total_tokens": 48534528} {"current_steps": 269, "total_steps": 9134, "loss": 0.7524, "learning_rate": 4.9893074207216745e-05, "epoch": 0.02944798708229563, "percentage": 2.95, "elapsed_time": "5:00:52", "remaining_time": "6 days, 21:15:33", "throughput": 2697.99, "total_tokens": 48705888} {"current_steps": 270, "total_steps": 9134, "loss": 0.5817, "learning_rate": 4.989227831470692e-05, "epoch": 0.02955745915323353, "percentage": 2.96, "elapsed_time": "5:01:58", "remaining_time": "6 days, 21:13:44", "throughput": 2698.19, "total_tokens": 48887104} {"current_steps": 271, "total_steps": 9134, "loss": 0.6459, "learning_rate": 4.989147947748817e-05, "epoch": 0.029666931224171432, "percentage": 2.97, "elapsed_time": "5:02:59", "remaining_time": "6 days, 21:09:23", "throughput": 2697.81, "total_tokens": 49045472} {"current_steps": 272, "total_steps": 9134, "loss": 0.7373, "learning_rate": 4.989067769565498e-05, "epoch": 0.029776403295109336, "percentage": 2.98, "elapsed_time": "5:04:09", "remaining_time": "6 days, 21:09:33", "throughput": 2698.63, "total_tokens": 49247744} {"current_steps": 273, "total_steps": 9134, "loss": 0.6751, "learning_rate": 4.9889872969302195e-05, "epoch": 0.029885875366047237, "percentage": 2.99, "elapsed_time": "5:05:15", "remaining_time": "6 days, 21:08:11", "throughput": 2699.32, "total_tokens": 49440160} {"current_steps": 274, "total_steps": 9134, "loss": 0.6307, "learning_rate": 4.988906529852502e-05, "epoch": 0.029995347436985138, "percentage": 3.0, "elapsed_time": "5:06:22", "remaining_time": "6 days, 21:06:53", "throughput": 2700.62, "total_tokens": 49644224} {"current_steps": 275, "total_steps": 9134, "loss": 0.8009, "learning_rate": 4.9888254683419e-05, "epoch": 0.030104819507923042, "percentage": 3.01, "elapsed_time": "5:07:29", "remaining_time": "6 days, 21:05:47", "throughput": 2700.7, "total_tokens": 49827008} {"current_steps": 276, "total_steps": 9134, "loss": 0.7892, "learning_rate": 4.988744112408003e-05, "epoch": 0.030214291578860943, "percentage": 3.02, "elapsed_time": "5:08:32", "remaining_time": "6 days, 21:02:27", "throughput": 2699.31, "total_tokens": 49971264} {"current_steps": 277, "total_steps": 9134, "loss": 0.6269, "learning_rate": 4.9886624620604354e-05, "epoch": 0.030323763649798847, "percentage": 3.03, "elapsed_time": "5:09:40", "remaining_time": "6 days, 21:01:32", "throughput": 2699.98, "total_tokens": 50165920} {"current_steps": 278, "total_steps": 9134, "loss": 0.659, "learning_rate": 4.9885805173088563e-05, "epoch": 0.030433235720736748, "percentage": 3.04, "elapsed_time": "5:10:46", "remaining_time": "6 days, 21:00:08", "throughput": 2700.73, "total_tokens": 50359456} {"current_steps": 279, "total_steps": 9134, "loss": 0.8028, "learning_rate": 4.988498278162959e-05, "epoch": 0.030542707791674648, "percentage": 3.05, "elapsed_time": "5:11:53", "remaining_time": "6 days, 20:58:56", "throughput": 2701.38, "total_tokens": 50552320} {"current_steps": 280, "total_steps": 9134, "loss": 0.7648, "learning_rate": 4.988415744632472e-05, "epoch": 0.030652179862612552, "percentage": 3.07, "elapsed_time": "5:12:57", "remaining_time": "6 days, 20:56:19", "throughput": 2701.29, "total_tokens": 50724128} {"current_steps": 281, "total_steps": 9134, "loss": 0.6505, "learning_rate": 4.9883329167271595e-05, "epoch": 0.030761651933550453, "percentage": 3.08, "elapsed_time": "5:14:03", "remaining_time": "6 days, 20:54:24", "throughput": 2701.59, "total_tokens": 50906912} {"current_steps": 282, "total_steps": 9134, "loss": 0.8363, "learning_rate": 4.988249794456821e-05, "epoch": 0.030871124004488354, "percentage": 3.09, "elapsed_time": "5:15:08", "remaining_time": "6 days, 20:52:31", "throughput": 2701.34, "total_tokens": 51079392} {"current_steps": 283, "total_steps": 9134, "loss": 0.7892, "learning_rate": 4.988166377831288e-05, "epoch": 0.030980596075426258, "percentage": 3.1, "elapsed_time": "5:16:17", "remaining_time": "6 days, 20:52:22", "throughput": 2701.88, "total_tokens": 51275840} {"current_steps": 284, "total_steps": 9134, "loss": 0.7993, "learning_rate": 4.988082666860429e-05, "epoch": 0.03109006814636416, "percentage": 3.11, "elapsed_time": "5:17:24", "remaining_time": "6 days, 20:51:15", "throughput": 2702.3, "total_tokens": 51464896} {"current_steps": 285, "total_steps": 9134, "loss": 1.0127, "learning_rate": 4.9879986615541464e-05, "epoch": 0.03119954021730206, "percentage": 3.12, "elapsed_time": "5:18:33", "remaining_time": "6 days, 20:50:53", "throughput": 2703.57, "total_tokens": 51674336} {"current_steps": 286, "total_steps": 9134, "loss": 0.6851, "learning_rate": 4.987914361922379e-05, "epoch": 0.031309012288239964, "percentage": 3.13, "elapsed_time": "5:19:37", "remaining_time": "6 days, 20:48:23", "throughput": 2703.61, "total_tokens": 51849280} {"current_steps": 287, "total_steps": 9134, "loss": 0.8241, "learning_rate": 4.9878297679750986e-05, "epoch": 0.031418484359177865, "percentage": 3.14, "elapsed_time": "5:20:45", "remaining_time": "6 days, 20:47:27", "throughput": 2704.33, "total_tokens": 52045280} {"current_steps": 288, "total_steps": 9134, "loss": 0.7814, "learning_rate": 4.987744879722312e-05, "epoch": 0.031527956430115765, "percentage": 3.15, "elapsed_time": "5:21:51", "remaining_time": "6 days, 20:46:10", "throughput": 2704.96, "total_tokens": 52237920} {"current_steps": 289, "total_steps": 9134, "loss": 0.7596, "learning_rate": 4.987659697174063e-05, "epoch": 0.031637428501053666, "percentage": 3.16, "elapsed_time": "5:22:58", "remaining_time": "6 days, 20:44:41", "throughput": 2704.74, "total_tokens": 52413088} {"current_steps": 290, "total_steps": 9134, "loss": 0.817, "learning_rate": 4.987574220340427e-05, "epoch": 0.031746900571991574, "percentage": 3.17, "elapsed_time": "5:24:05", "remaining_time": "6 days, 20:43:35", "throughput": 2704.93, "total_tokens": 52598336} {"current_steps": 291, "total_steps": 9134, "loss": 0.7345, "learning_rate": 4.9874884492315155e-05, "epoch": 0.031856372642929474, "percentage": 3.19, "elapsed_time": "5:25:11", "remaining_time": "6 days, 20:42:02", "throughput": 2704.66, "total_tokens": 52771936} {"current_steps": 292, "total_steps": 9134, "loss": 0.6996, "learning_rate": 4.987402383857477e-05, "epoch": 0.031965844713867375, "percentage": 3.2, "elapsed_time": "5:26:16", "remaining_time": "6 days, 20:39:55", "throughput": 2704.42, "total_tokens": 52943296} {"current_steps": 293, "total_steps": 9134, "loss": 1.0966, "learning_rate": 4.98731602422849e-05, "epoch": 0.032075316784805276, "percentage": 3.21, "elapsed_time": "5:27:25", "remaining_time": "6 days, 20:39:33", "throughput": 2704.68, "total_tokens": 53133696} {"current_steps": 294, "total_steps": 9134, "loss": 0.8492, "learning_rate": 4.9872293703547735e-05, "epoch": 0.03218478885574318, "percentage": 3.22, "elapsed_time": "5:28:34", "remaining_time": "6 days, 20:39:35", "throughput": 2705.6, "total_tokens": 53339552} {"current_steps": 295, "total_steps": 9134, "loss": 0.7442, "learning_rate": 4.987142422246577e-05, "epoch": 0.03229426092668108, "percentage": 3.23, "elapsed_time": "5:29:41", "remaining_time": "6 days, 20:38:18", "throughput": 2705.56, "total_tokens": 53519200} {"current_steps": 296, "total_steps": 9134, "loss": 0.8712, "learning_rate": 4.987055179914186e-05, "epoch": 0.032403732997618985, "percentage": 3.24, "elapsed_time": "5:30:47", "remaining_time": "6 days, 20:36:51", "throughput": 2706.19, "total_tokens": 53711392} {"current_steps": 297, "total_steps": 9134, "loss": 0.7391, "learning_rate": 4.9869676433679225e-05, "epoch": 0.032513205068556886, "percentage": 3.25, "elapsed_time": "5:31:52", "remaining_time": "6 days, 20:34:54", "throughput": 2705.72, "total_tokens": 53878944} {"current_steps": 298, "total_steps": 9134, "loss": 0.7223, "learning_rate": 4.98687981261814e-05, "epoch": 0.032622677139494786, "percentage": 3.26, "elapsed_time": "5:32:59", "remaining_time": "6 days, 20:33:31", "throughput": 2705.85, "total_tokens": 54061504} {"current_steps": 299, "total_steps": 9134, "loss": 0.6751, "learning_rate": 4.9867916876752306e-05, "epoch": 0.03273214921043269, "percentage": 3.27, "elapsed_time": "5:34:05", "remaining_time": "6 days, 20:31:59", "throughput": 2705.68, "total_tokens": 54237120} {"current_steps": 300, "total_steps": 9134, "loss": 0.8674, "learning_rate": 4.9867032685496185e-05, "epoch": 0.03284162128137059, "percentage": 3.28, "elapsed_time": "5:35:15", "remaining_time": "6 days, 20:32:12", "throughput": 2705.7, "total_tokens": 54426400} {"current_steps": 301, "total_steps": 9134, "loss": 0.7386, "learning_rate": 4.986614555251763e-05, "epoch": 0.032951093352308496, "percentage": 3.3, "elapsed_time": "5:36:21", "remaining_time": "6 days, 20:30:28", "throughput": 2704.78, "total_tokens": 54585664} {"current_steps": 302, "total_steps": 9134, "loss": 0.871, "learning_rate": 4.98652554779216e-05, "epoch": 0.033060565423246396, "percentage": 3.31, "elapsed_time": "5:37:30", "remaining_time": "6 days, 20:30:18", "throughput": 2704.84, "total_tokens": 54773600} {"current_steps": 303, "total_steps": 9134, "loss": 0.7653, "learning_rate": 4.9864362461813373e-05, "epoch": 0.0331700374941843, "percentage": 3.32, "elapsed_time": "5:38:36", "remaining_time": "6 days, 20:28:49", "throughput": 2705.21, "total_tokens": 54960416} {"current_steps": 304, "total_steps": 9134, "loss": 0.6705, "learning_rate": 4.9863466504298604e-05, "epoch": 0.0332795095651222, "percentage": 3.33, "elapsed_time": "5:39:41", "remaining_time": "6 days, 20:26:51", "throughput": 2705.76, "total_tokens": 55148352} {"current_steps": 305, "total_steps": 9134, "loss": 0.7387, "learning_rate": 4.9862567605483277e-05, "epoch": 0.0333889816360601, "percentage": 3.34, "elapsed_time": "5:40:50", "remaining_time": "6 days, 20:26:20", "throughput": 2706.24, "total_tokens": 55343008} {"current_steps": 306, "total_steps": 9134, "loss": 0.7375, "learning_rate": 4.986166576547373e-05, "epoch": 0.033498453706998, "percentage": 3.35, "elapsed_time": "5:41:58", "remaining_time": "6 days, 20:25:54", "throughput": 2706.58, "total_tokens": 55535200} {"current_steps": 307, "total_steps": 9134, "loss": 0.6705, "learning_rate": 4.9860760984376656e-05, "epoch": 0.03360792577793591, "percentage": 3.36, "elapsed_time": "5:43:07", "remaining_time": "6 days, 20:25:50", "throughput": 2707.07, "total_tokens": 55732768} {"current_steps": 308, "total_steps": 9134, "loss": 0.8133, "learning_rate": 4.985985326229907e-05, "epoch": 0.03371739784887381, "percentage": 3.37, "elapsed_time": "5:44:11", "remaining_time": "6 days, 20:22:53", "throughput": 2707.1, "total_tokens": 55904576} {"current_steps": 309, "total_steps": 9134, "loss": 0.7343, "learning_rate": 4.985894259934838e-05, "epoch": 0.03382686991981171, "percentage": 3.38, "elapsed_time": "5:45:15", "remaining_time": "6 days, 20:20:46", "throughput": 2706.56, "total_tokens": 56068992} {"current_steps": 310, "total_steps": 9134, "loss": 0.6467, "learning_rate": 4.98580289956323e-05, "epoch": 0.03393634199074961, "percentage": 3.39, "elapsed_time": "5:46:22", "remaining_time": "6 days, 20:19:24", "throughput": 2707.04, "total_tokens": 56259168} {"current_steps": 311, "total_steps": 9134, "loss": 0.7879, "learning_rate": 4.985711245125891e-05, "epoch": 0.03404581406168751, "percentage": 3.4, "elapsed_time": "5:47:31", "remaining_time": "6 days, 20:18:59", "throughput": 2708.0, "total_tokens": 56464576} {"current_steps": 312, "total_steps": 9134, "loss": 0.7653, "learning_rate": 4.9856192966336634e-05, "epoch": 0.03415528613262541, "percentage": 3.42, "elapsed_time": "5:48:36", "remaining_time": "6 days, 20:17:12", "throughput": 2706.94, "total_tokens": 56620256} {"current_steps": 313, "total_steps": 9134, "loss": 0.8726, "learning_rate": 4.985527054097425e-05, "epoch": 0.03426475820356332, "percentage": 3.43, "elapsed_time": "5:49:45", "remaining_time": "6 days, 20:17:07", "throughput": 2708.04, "total_tokens": 56830592} {"current_steps": 314, "total_steps": 9134, "loss": 0.7298, "learning_rate": 4.985434517528087e-05, "epoch": 0.03437423027450122, "percentage": 3.44, "elapsed_time": "5:50:51", "remaining_time": "6 days, 20:15:32", "throughput": 2708.37, "total_tokens": 57016512} {"current_steps": 315, "total_steps": 9134, "loss": 0.7489, "learning_rate": 4.985341686936598e-05, "epoch": 0.03448370234543912, "percentage": 3.45, "elapsed_time": "5:51:54", "remaining_time": "6 days, 20:12:17", "throughput": 2707.15, "total_tokens": 57160096} {"current_steps": 316, "total_steps": 9134, "loss": 0.8126, "learning_rate": 4.9852485623339376e-05, "epoch": 0.03459317441637702, "percentage": 3.46, "elapsed_time": "5:52:56", "remaining_time": "6 days, 20:08:38", "throughput": 2706.74, "total_tokens": 57318016} {"current_steps": 317, "total_steps": 9134, "loss": 0.727, "learning_rate": 4.985155143731124e-05, "epoch": 0.03470264648731492, "percentage": 3.47, "elapsed_time": "5:54:03", "remaining_time": "6 days, 20:07:48", "throughput": 2708.14, "total_tokens": 57530816} {"current_steps": 318, "total_steps": 9134, "loss": 0.5959, "learning_rate": 4.985061431139207e-05, "epoch": 0.03481211855825283, "percentage": 3.48, "elapsed_time": "5:54:59", "remaining_time": "6 days, 20:01:26", "throughput": 2706.41, "total_tokens": 57644608} {"current_steps": 319, "total_steps": 9134, "loss": 0.701, "learning_rate": 4.9849674245692735e-05, "epoch": 0.03492159062919073, "percentage": 3.49, "elapsed_time": "5:56:08", "remaining_time": "6 days, 20:01:08", "throughput": 2707.22, "total_tokens": 57848000} {"current_steps": 320, "total_steps": 9134, "loss": 0.793, "learning_rate": 4.9848731240324444e-05, "epoch": 0.03503106270012863, "percentage": 3.5, "elapsed_time": "5:57:14", "remaining_time": "6 days, 19:59:38", "throughput": 2708.28, "total_tokens": 58049824} {"current_steps": 321, "total_steps": 9134, "loss": 0.6787, "learning_rate": 4.984778529539875e-05, "epoch": 0.03514053477106653, "percentage": 3.51, "elapsed_time": "5:58:19", "remaining_time": "6 days, 19:57:47", "throughput": 2708.46, "total_tokens": 58230816} {"current_steps": 322, "total_steps": 9134, "loss": 0.6446, "learning_rate": 4.984683641102755e-05, "epoch": 0.03525000684200443, "percentage": 3.53, "elapsed_time": "5:59:20", "remaining_time": "6 days, 19:53:49", "throughput": 2707.45, "total_tokens": 58373504} {"current_steps": 323, "total_steps": 9134, "loss": 0.8173, "learning_rate": 4.984588458732311e-05, "epoch": 0.03535947891294233, "percentage": 3.54, "elapsed_time": "6:00:25", "remaining_time": "6 days, 19:51:42", "throughput": 2706.94, "total_tokens": 58537920} {"current_steps": 324, "total_steps": 9134, "loss": 0.6818, "learning_rate": 4.984492982439802e-05, "epoch": 0.03546895098388024, "percentage": 3.55, "elapsed_time": "6:01:31", "remaining_time": "6 days, 19:50:19", "throughput": 2707.18, "total_tokens": 58722496} {"current_steps": 325, "total_steps": 9134, "loss": 0.9523, "learning_rate": 4.984397212236522e-05, "epoch": 0.03557842305481814, "percentage": 3.56, "elapsed_time": "6:02:40", "remaining_time": "6 days, 19:50:09", "throughput": 2707.67, "total_tokens": 58920064} {"current_steps": 326, "total_steps": 9134, "loss": 0.8442, "learning_rate": 4.984301148133802e-05, "epoch": 0.03568789512575604, "percentage": 3.57, "elapsed_time": "6:03:47", "remaining_time": "6 days, 19:48:53", "throughput": 2707.93, "total_tokens": 59106208} {"current_steps": 327, "total_steps": 9134, "loss": 0.7644, "learning_rate": 4.9842047901430044e-05, "epoch": 0.03579736719669394, "percentage": 3.58, "elapsed_time": "6:04:52", "remaining_time": "6 days, 19:47:15", "throughput": 2708.68, "total_tokens": 59300864} {"current_steps": 328, "total_steps": 9134, "loss": 0.5848, "learning_rate": 4.98410813827553e-05, "epoch": 0.03590683926763184, "percentage": 3.59, "elapsed_time": "6:05:56", "remaining_time": "6 days, 19:44:44", "throughput": 2707.58, "total_tokens": 59449600} {"current_steps": 329, "total_steps": 9134, "loss": 0.8383, "learning_rate": 4.984011192542811e-05, "epoch": 0.036016311338569744, "percentage": 3.6, "elapsed_time": "6:07:01", "remaining_time": "6 days, 19:42:46", "throughput": 2707.5, "total_tokens": 59623872} {"current_steps": 330, "total_steps": 9134, "loss": 0.6117, "learning_rate": 4.983913952956317e-05, "epoch": 0.03612578340950765, "percentage": 3.61, "elapsed_time": "6:08:08", "remaining_time": "6 days, 19:41:34", "throughput": 2707.76, "total_tokens": 59810240} {"current_steps": 331, "total_steps": 9134, "loss": 0.778, "learning_rate": 4.983816419527551e-05, "epoch": 0.03623525548044555, "percentage": 3.62, "elapsed_time": "6:09:16", "remaining_time": "6 days, 19:40:49", "throughput": 2707.46, "total_tokens": 59987200} {"current_steps": 332, "total_steps": 9134, "loss": 0.9366, "learning_rate": 4.983718592268051e-05, "epoch": 0.03634472755138345, "percentage": 3.63, "elapsed_time": "6:10:25", "remaining_time": "6 days, 19:40:50", "throughput": 2708.02, "total_tokens": 60187680} {"current_steps": 333, "total_steps": 9134, "loss": 0.867, "learning_rate": 4.983620471189389e-05, "epoch": 0.036454199622321354, "percentage": 3.65, "elapsed_time": "6:11:31", "remaining_time": "6 days, 19:39:22", "throughput": 2708.31, "total_tokens": 60373376} {"current_steps": 334, "total_steps": 9134, "loss": 0.6922, "learning_rate": 4.9835220563031726e-05, "epoch": 0.036563671693259255, "percentage": 3.66, "elapsed_time": "6:12:41", "remaining_time": "6 days, 19:39:18", "throughput": 2708.62, "total_tokens": 60568032} {"current_steps": 335, "total_steps": 9134, "loss": 0.7688, "learning_rate": 4.9834233476210456e-05, "epoch": 0.03667314376419716, "percentage": 3.67, "elapsed_time": "6:13:49", "remaining_time": "6 days, 19:38:55", "throughput": 2709.32, "total_tokens": 60769632} {"current_steps": 336, "total_steps": 9134, "loss": 0.7368, "learning_rate": 4.9833243451546834e-05, "epoch": 0.03678261583513506, "percentage": 3.68, "elapsed_time": "6:14:55", "remaining_time": "6 days, 19:37:14", "throughput": 2709.61, "total_tokens": 60954208} {"current_steps": 337, "total_steps": 9134, "loss": 0.7211, "learning_rate": 4.9832250489157994e-05, "epoch": 0.036892087906072964, "percentage": 3.69, "elapsed_time": "6:15:57", "remaining_time": "6 days, 19:34:05", "throughput": 2708.47, "total_tokens": 61097120} {"current_steps": 338, "total_steps": 9134, "loss": 0.7405, "learning_rate": 4.983125458916138e-05, "epoch": 0.037001559977010864, "percentage": 3.7, "elapsed_time": "6:17:02", "remaining_time": "6 days, 19:32:03", "throughput": 2708.2, "total_tokens": 61266464} {"current_steps": 339, "total_steps": 9134, "loss": 0.8812, "learning_rate": 4.9830255751674825e-05, "epoch": 0.037111032047948765, "percentage": 3.71, "elapsed_time": "6:18:11", "remaining_time": "6 days, 19:31:43", "throughput": 2708.95, "total_tokens": 61469856} {"current_steps": 340, "total_steps": 9134, "loss": 0.6313, "learning_rate": 4.982925397681648e-05, "epoch": 0.037220504118886666, "percentage": 3.72, "elapsed_time": "6:19:20", "remaining_time": "6 days, 19:31:34", "throughput": 2708.3, "total_tokens": 61642336} {"current_steps": 341, "total_steps": 9134, "loss": 0.6163, "learning_rate": 4.982824926470486e-05, "epoch": 0.037329976189824574, "percentage": 3.73, "elapsed_time": "6:20:22", "remaining_time": "6 days, 19:28:21", "throughput": 2707.6, "total_tokens": 61794432} {"current_steps": 342, "total_steps": 9134, "loss": 0.851, "learning_rate": 4.982724161545881e-05, "epoch": 0.037439448260762474, "percentage": 3.74, "elapsed_time": "6:21:31", "remaining_time": "6 days, 19:28:15", "throughput": 2708.16, "total_tokens": 61994912} {"current_steps": 343, "total_steps": 9134, "loss": 0.5694, "learning_rate": 4.982623102919754e-05, "epoch": 0.037548920331700375, "percentage": 3.76, "elapsed_time": "6:22:35", "remaining_time": "6 days, 19:25:50", "throughput": 2707.97, "total_tokens": 62163584} {"current_steps": 344, "total_steps": 9134, "loss": 0.6746, "learning_rate": 4.98252175060406e-05, "epoch": 0.037658392402638276, "percentage": 3.77, "elapsed_time": "6:23:39", "remaining_time": "6 days, 19:23:27", "throughput": 2708.12, "total_tokens": 62340096} {"current_steps": 345, "total_steps": 9134, "loss": 0.7022, "learning_rate": 4.9824201046107885e-05, "epoch": 0.037767864473576176, "percentage": 3.78, "elapsed_time": "6:24:46", "remaining_time": "6 days, 19:22:23", "throughput": 2708.17, "total_tokens": 62522880} {"current_steps": 346, "total_steps": 9134, "loss": 0.7107, "learning_rate": 4.9823181649519645e-05, "epoch": 0.037877336544514084, "percentage": 3.79, "elapsed_time": "6:25:53", "remaining_time": "6 days, 19:21:05", "throughput": 2708.36, "total_tokens": 62707232} {"current_steps": 347, "total_steps": 9134, "loss": 0.8567, "learning_rate": 4.9822159316396465e-05, "epoch": 0.037986808615451985, "percentage": 3.8, "elapsed_time": "6:26:57", "remaining_time": "6 days, 19:18:56", "throughput": 2707.76, "total_tokens": 62868064} {"current_steps": 348, "total_steps": 9134, "loss": 0.6395, "learning_rate": 4.9821134046859295e-05, "epoch": 0.038096280686389886, "percentage": 3.81, "elapsed_time": "6:28:02", "remaining_time": "6 days, 19:16:45", "throughput": 2707.43, "total_tokens": 63034496} {"current_steps": 349, "total_steps": 9134, "loss": 0.7132, "learning_rate": 4.9820105841029416e-05, "epoch": 0.038205752757327786, "percentage": 3.82, "elapsed_time": "6:29:04", "remaining_time": "6 days, 19:13:51", "throughput": 2706.87, "total_tokens": 63191072} {"current_steps": 350, "total_steps": 9134, "loss": 0.6755, "learning_rate": 4.9819074699028455e-05, "epoch": 0.03831522482826569, "percentage": 3.83, "elapsed_time": "6:30:06", "remaining_time": "6 days, 19:10:42", "throughput": 2705.6, "total_tokens": 63329280} {"current_steps": 351, "total_steps": 9134, "loss": 0.757, "learning_rate": 4.981804062097841e-05, "epoch": 0.03842469689920359, "percentage": 3.84, "elapsed_time": "6:31:12", "remaining_time": "6 days, 19:09:13", "throughput": 2706.5, "total_tokens": 63528864} {"current_steps": 352, "total_steps": 9134, "loss": 0.6294, "learning_rate": 4.9817003607001614e-05, "epoch": 0.038534168970141496, "percentage": 3.85, "elapsed_time": "6:32:19", "remaining_time": "6 days, 19:07:59", "throughput": 2707.39, "total_tokens": 63730240} {"current_steps": 353, "total_steps": 9134, "loss": 0.9477, "learning_rate": 4.981596365722072e-05, "epoch": 0.038643641041079396, "percentage": 3.86, "elapsed_time": "6:33:25", "remaining_time": "6 days, 19:06:39", "throughput": 2707.44, "total_tokens": 63911008} {"current_steps": 354, "total_steps": 9134, "loss": 0.7056, "learning_rate": 4.981492077175877e-05, "epoch": 0.0387531131120173, "percentage": 3.88, "elapsed_time": "6:34:32", "remaining_time": "6 days, 19:05:23", "throughput": 2708.41, "total_tokens": 64113952} {"current_steps": 355, "total_steps": 9134, "loss": 0.7086, "learning_rate": 4.9813874950739124e-05, "epoch": 0.0388625851829552, "percentage": 3.89, "elapsed_time": "6:35:41", "remaining_time": "6 days, 19:05:11", "throughput": 2708.88, "total_tokens": 64312192} {"current_steps": 356, "total_steps": 9134, "loss": 0.7446, "learning_rate": 4.9812826194285515e-05, "epoch": 0.0389720572538931, "percentage": 3.9, "elapsed_time": "6:36:50", "remaining_time": "6 days, 19:05:09", "throughput": 2709.53, "total_tokens": 64516032} {"current_steps": 357, "total_steps": 9134, "loss": 0.6315, "learning_rate": 4.9811774502522e-05, "epoch": 0.039081529324831, "percentage": 3.91, "elapsed_time": "6:37:59", "remaining_time": "6 days, 19:04:36", "throughput": 2710.09, "total_tokens": 64714272} {"current_steps": 358, "total_steps": 9134, "loss": 0.6953, "learning_rate": 4.9810719875573e-05, "epoch": 0.03919100139576891, "percentage": 3.92, "elapsed_time": "6:39:07", "remaining_time": "6 days, 19:04:20", "throughput": 2710.25, "total_tokens": 64905120} {"current_steps": 359, "total_steps": 9134, "loss": 0.9811, "learning_rate": 4.980966231356326e-05, "epoch": 0.03930047346670681, "percentage": 3.93, "elapsed_time": "6:40:16", "remaining_time": "6 days, 19:03:46", "throughput": 2710.57, "total_tokens": 65097760} {"current_steps": 360, "total_steps": 9134, "loss": 0.734, "learning_rate": 4.98086018166179e-05, "epoch": 0.03940994553764471, "percentage": 3.94, "elapsed_time": "6:41:21", "remaining_time": "6 days, 19:02:07", "throughput": 2710.36, "total_tokens": 65270464} {"current_steps": 361, "total_steps": 9134, "loss": 0.6851, "learning_rate": 4.980753838486236e-05, "epoch": 0.03951941760858261, "percentage": 3.95, "elapsed_time": "6:42:26", "remaining_time": "6 days, 19:00:02", "throughput": 2710.47, "total_tokens": 65447872} {"current_steps": 362, "total_steps": 9134, "loss": 0.721, "learning_rate": 4.980647201842247e-05, "epoch": 0.03962888967952051, "percentage": 3.96, "elapsed_time": "6:43:35", "remaining_time": "6 days, 18:59:51", "throughput": 2711.54, "total_tokens": 65661344} {"current_steps": 363, "total_steps": 9134, "loss": 0.7708, "learning_rate": 4.980540271742435e-05, "epoch": 0.03973836175045842, "percentage": 3.97, "elapsed_time": "6:44:41", "remaining_time": "6 days, 18:58:20", "throughput": 2712.04, "total_tokens": 65852192} {"current_steps": 364, "total_steps": 9134, "loss": 0.5962, "learning_rate": 4.980433048199451e-05, "epoch": 0.03984783382139632, "percentage": 3.99, "elapsed_time": "6:45:47", "remaining_time": "6 days, 18:56:44", "throughput": 2712.2, "total_tokens": 66034304} {"current_steps": 365, "total_steps": 9134, "loss": 0.7858, "learning_rate": 4.98032553122598e-05, "epoch": 0.03995730589233422, "percentage": 4.0, "elapsed_time": "6:46:54", "remaining_time": "6 days, 18:55:43", "throughput": 2712.16, "total_tokens": 66215296} {"current_steps": 366, "total_steps": 9134, "loss": 0.8307, "learning_rate": 4.98021772083474e-05, "epoch": 0.04006677796327212, "percentage": 4.01, "elapsed_time": "6:47:57", "remaining_time": "6 days, 18:53:06", "throughput": 2711.58, "total_tokens": 66372320} {"current_steps": 367, "total_steps": 9134, "loss": 0.8013, "learning_rate": 4.980109617038484e-05, "epoch": 0.04017625003421002, "percentage": 4.02, "elapsed_time": "6:49:06", "remaining_time": "6 days, 18:52:45", "throughput": 2712.06, "total_tokens": 66570560} {"current_steps": 368, "total_steps": 9134, "loss": 0.9296, "learning_rate": 4.980001219850002e-05, "epoch": 0.04028572210514792, "percentage": 4.03, "elapsed_time": "6:50:14", "remaining_time": "6 days, 18:52:14", "throughput": 2712.71, "total_tokens": 66772160} {"current_steps": 369, "total_steps": 9134, "loss": 0.7534, "learning_rate": 4.979892529282117e-05, "epoch": 0.04039519417608583, "percentage": 4.04, "elapsed_time": "6:51:19", "remaining_time": "6 days, 18:50:18", "throughput": 2712.68, "total_tokens": 66947104} {"current_steps": 370, "total_steps": 9134, "loss": 0.8313, "learning_rate": 4.979783545347686e-05, "epoch": 0.04050466624702373, "percentage": 4.05, "elapsed_time": "6:52:25", "remaining_time": "6 days, 18:48:49", "throughput": 2713.38, "total_tokens": 67143328} {"current_steps": 371, "total_steps": 9134, "loss": 0.5908, "learning_rate": 4.9796742680596034e-05, "epoch": 0.04061413831796163, "percentage": 4.06, "elapsed_time": "6:53:29", "remaining_time": "6 days, 18:46:50", "throughput": 2713.77, "total_tokens": 67328576} {"current_steps": 372, "total_steps": 9134, "loss": 0.6283, "learning_rate": 4.9795646974307936e-05, "epoch": 0.04072361038889953, "percentage": 4.07, "elapsed_time": "6:54:34", "remaining_time": "6 days, 18:44:50", "throughput": 2713.77, "total_tokens": 67503968} {"current_steps": 373, "total_steps": 9134, "loss": 0.5829, "learning_rate": 4.979454833474221e-05, "epoch": 0.04083308245983743, "percentage": 4.08, "elapsed_time": "6:55:36", "remaining_time": "6 days, 18:41:52", "throughput": 2713.01, "total_tokens": 67653600} {"current_steps": 374, "total_steps": 9134, "loss": 0.7869, "learning_rate": 4.9793446762028816e-05, "epoch": 0.04094255453077534, "percentage": 4.09, "elapsed_time": "6:56:46", "remaining_time": "6 days, 18:41:42", "throughput": 2714.12, "total_tokens": 67869312} {"current_steps": 375, "total_steps": 9134, "loss": 0.6395, "learning_rate": 4.9792342256298064e-05, "epoch": 0.04105202660171324, "percentage": 4.11, "elapsed_time": "6:57:55", "remaining_time": "6 days, 18:41:28", "throughput": 2714.95, "total_tokens": 68077856} {"current_steps": 376, "total_steps": 9134, "loss": 0.9702, "learning_rate": 4.979123481768062e-05, "epoch": 0.04116149867265114, "percentage": 4.12, "elapsed_time": "6:59:00", "remaining_time": "6 days, 18:39:48", "throughput": 2715.5, "total_tokens": 68269376} {"current_steps": 377, "total_steps": 9134, "loss": 0.6403, "learning_rate": 4.979012444630748e-05, "epoch": 0.04127097074358904, "percentage": 4.13, "elapsed_time": "7:00:06", "remaining_time": "6 days, 18:38:12", "throughput": 2715.43, "total_tokens": 68445664} {"current_steps": 378, "total_steps": 9134, "loss": 0.6456, "learning_rate": 4.978901114231003e-05, "epoch": 0.04138044281452694, "percentage": 4.14, "elapsed_time": "7:01:14", "remaining_time": "6 days, 18:37:44", "throughput": 2715.88, "total_tokens": 68643232} {"current_steps": 379, "total_steps": 9134, "loss": 0.589, "learning_rate": 4.978789490581993e-05, "epoch": 0.04148991488546484, "percentage": 4.15, "elapsed_time": "7:02:16", "remaining_time": "6 days, 18:34:48", "throughput": 2715.12, "total_tokens": 68792640} {"current_steps": 380, "total_steps": 9134, "loss": 0.7765, "learning_rate": 4.978677573696926e-05, "epoch": 0.04159938695640275, "percentage": 4.16, "elapsed_time": "7:03:22", "remaining_time": "6 days, 18:33:10", "throughput": 2715.01, "total_tokens": 68967584} {"current_steps": 381, "total_steps": 9134, "loss": 0.7147, "learning_rate": 4.978565363589041e-05, "epoch": 0.04170885902734065, "percentage": 4.17, "elapsed_time": "7:04:28", "remaining_time": "6 days, 18:31:58", "throughput": 2715.41, "total_tokens": 69158656} {"current_steps": 382, "total_steps": 9134, "loss": 0.5852, "learning_rate": 4.97845286027161e-05, "epoch": 0.04181833109827855, "percentage": 4.18, "elapsed_time": "7:05:36", "remaining_time": "6 days, 18:31:16", "throughput": 2715.83, "total_tokens": 69353984} {"current_steps": 383, "total_steps": 9134, "loss": 1.0631, "learning_rate": 4.978340063757945e-05, "epoch": 0.04192780316921645, "percentage": 4.19, "elapsed_time": "7:06:39", "remaining_time": "6 days, 18:28:28", "throughput": 2715.44, "total_tokens": 69513472} {"current_steps": 384, "total_steps": 9134, "loss": 0.8497, "learning_rate": 4.978226974061388e-05, "epoch": 0.042037275240154354, "percentage": 4.2, "elapsed_time": "7:07:46", "remaining_time": "6 days, 18:27:35", "throughput": 2716.19, "total_tokens": 69715744} {"current_steps": 385, "total_steps": 9134, "loss": 0.7276, "learning_rate": 4.978113591195317e-05, "epoch": 0.042146747311092254, "percentage": 4.22, "elapsed_time": "7:08:54", "remaining_time": "6 days, 18:26:45", "throughput": 2715.93, "total_tokens": 69892704} {"current_steps": 386, "total_steps": 9134, "loss": 0.8139, "learning_rate": 4.9779999151731456e-05, "epoch": 0.04225621938203016, "percentage": 4.23, "elapsed_time": "7:09:57", "remaining_time": "6 days, 18:24:07", "throughput": 2715.96, "total_tokens": 70064288} {"current_steps": 387, "total_steps": 9134, "loss": 0.6561, "learning_rate": 4.977885946008322e-05, "epoch": 0.04236569145296806, "percentage": 4.24, "elapsed_time": "7:11:03", "remaining_time": "6 days, 18:22:57", "throughput": 2716.02, "total_tokens": 70246848} {"current_steps": 388, "total_steps": 9134, "loss": 0.8013, "learning_rate": 4.977771683714327e-05, "epoch": 0.042475163523905964, "percentage": 4.25, "elapsed_time": "7:12:12", "remaining_time": "6 days, 18:22:32", "throughput": 2716.36, "total_tokens": 70442176} {"current_steps": 389, "total_steps": 9134, "loss": 0.65, "learning_rate": 4.9776571283046794e-05, "epoch": 0.042584635594843864, "percentage": 4.26, "elapsed_time": "7:13:12", "remaining_time": "6 days, 18:18:43", "throughput": 2714.95, "total_tokens": 70567616} {"current_steps": 390, "total_steps": 9134, "loss": 0.7558, "learning_rate": 4.977542279792929e-05, "epoch": 0.042694107665781765, "percentage": 4.27, "elapsed_time": "7:14:19", "remaining_time": "6 days, 18:17:50", "throughput": 2716.09, "total_tokens": 70780192} {"current_steps": 391, "total_steps": 9134, "loss": 0.5578, "learning_rate": 4.9774271381926644e-05, "epoch": 0.04280357973671967, "percentage": 4.28, "elapsed_time": "7:15:26", "remaining_time": "6 days, 18:16:50", "throughput": 2716.28, "total_tokens": 70967680} {"current_steps": 392, "total_steps": 9134, "loss": 0.6114, "learning_rate": 4.977311703517504e-05, "epoch": 0.04291305180765757, "percentage": 4.29, "elapsed_time": "7:16:30", "remaining_time": "6 days, 18:14:28", "throughput": 2715.42, "total_tokens": 71117312} {"current_steps": 393, "total_steps": 9134, "loss": 0.7356, "learning_rate": 4.977195975781106e-05, "epoch": 0.043022523878595474, "percentage": 4.3, "elapsed_time": "7:17:34", "remaining_time": "6 days, 18:12:18", "throughput": 2714.98, "total_tokens": 71279712} {"current_steps": 394, "total_steps": 9134, "loss": 0.9309, "learning_rate": 4.977079954997159e-05, "epoch": 0.043131995949533375, "percentage": 4.31, "elapsed_time": "7:18:43", "remaining_time": "6 days, 18:12:04", "throughput": 2715.47, "total_tokens": 71480192} {"current_steps": 395, "total_steps": 9134, "loss": 0.5393, "learning_rate": 4.9769636411793894e-05, "epoch": 0.043241468020471276, "percentage": 4.32, "elapsed_time": "7:19:42", "remaining_time": "6 days, 18:08:09", "throughput": 2714.6, "total_tokens": 71618176} {"current_steps": 396, "total_steps": 9134, "loss": 0.6832, "learning_rate": 4.976847034341555e-05, "epoch": 0.043350940091409176, "percentage": 4.34, "elapsed_time": "7:20:45", "remaining_time": "6 days, 18:05:34", "throughput": 2714.89, "total_tokens": 71796256} {"current_steps": 397, "total_steps": 9134, "loss": 0.9092, "learning_rate": 4.976730134497453e-05, "epoch": 0.043460412162347084, "percentage": 4.35, "elapsed_time": "7:21:54", "remaining_time": "6 days, 18:05:22", "throughput": 2715.68, "total_tokens": 72005472} {"current_steps": 398, "total_steps": 9134, "loss": 0.7243, "learning_rate": 4.97661294166091e-05, "epoch": 0.043569884233284985, "percentage": 4.36, "elapsed_time": "7:23:01", "remaining_time": "6 days, 18:04:14", "throughput": 2716.18, "total_tokens": 72199904} {"current_steps": 399, "total_steps": 9134, "loss": 0.808, "learning_rate": 4.97649545584579e-05, "epoch": 0.043679356304222886, "percentage": 4.37, "elapsed_time": "7:24:08", "remaining_time": "6 days, 18:03:09", "throughput": 2716.89, "total_tokens": 72400384} {"current_steps": 400, "total_steps": 9134, "loss": 0.8544, "learning_rate": 4.976377677065992e-05, "epoch": 0.043788828375160786, "percentage": 4.38, "elapsed_time": "7:25:14", "remaining_time": "6 days, 18:01:53", "throughput": 2717.03, "total_tokens": 72584288} {"current_steps": 401, "total_steps": 9134, "loss": 0.8907, "learning_rate": 4.9762596053354496e-05, "epoch": 0.04389830044609869, "percentage": 4.39, "elapsed_time": "7:26:22", "remaining_time": "6 days, 18:01:13", "throughput": 2717.0, "total_tokens": 72768416} {"current_steps": 402, "total_steps": 9134, "loss": 0.7397, "learning_rate": 4.976141240668129e-05, "epoch": 0.04400777251703659, "percentage": 4.4, "elapsed_time": "7:27:23", "remaining_time": "6 days, 17:58:05", "throughput": 2715.97, "total_tokens": 72907072} {"current_steps": 403, "total_steps": 9134, "loss": 0.6544, "learning_rate": 4.976022583078033e-05, "epoch": 0.044117244587974495, "percentage": 4.41, "elapsed_time": "7:28:30", "remaining_time": "6 days, 17:56:48", "throughput": 2715.6, "total_tokens": 73077088} {"current_steps": 404, "total_steps": 9134, "loss": 0.8024, "learning_rate": 4.975903632579199e-05, "epoch": 0.044226716658912396, "percentage": 4.42, "elapsed_time": "7:29:33", "remaining_time": "6 days, 17:54:23", "throughput": 2715.72, "total_tokens": 73252032} {"current_steps": 405, "total_steps": 9134, "loss": 0.7861, "learning_rate": 4.9757843891856986e-05, "epoch": 0.0443361887298503, "percentage": 4.43, "elapsed_time": "7:30:42", "remaining_time": "6 days, 17:54:03", "throughput": 2715.93, "total_tokens": 73444672} {"current_steps": 406, "total_steps": 9134, "loss": 0.594, "learning_rate": 4.975664852911638e-05, "epoch": 0.0444456608007882, "percentage": 4.44, "elapsed_time": "7:31:47", "remaining_time": "6 days, 17:52:25", "throughput": 2715.02, "total_tokens": 73597440} {"current_steps": 407, "total_steps": 9134, "loss": 0.8075, "learning_rate": 4.9755450237711575e-05, "epoch": 0.0445551328717261, "percentage": 4.46, "elapsed_time": "7:32:56", "remaining_time": "6 days, 17:52:08", "throughput": 2714.59, "total_tokens": 73773504} {"current_steps": 408, "total_steps": 9134, "loss": 0.7298, "learning_rate": 4.975424901778434e-05, "epoch": 0.044664604942664006, "percentage": 4.47, "elapsed_time": "7:34:05", "remaining_time": "6 days, 17:51:53", "throughput": 2715.54, "total_tokens": 73987200} {"current_steps": 409, "total_steps": 9134, "loss": 0.6233, "learning_rate": 4.975304486947676e-05, "epoch": 0.04477407701360191, "percentage": 4.48, "elapsed_time": "7:35:09", "remaining_time": "6 days, 17:49:40", "throughput": 2714.85, "total_tokens": 74141088} {"current_steps": 410, "total_steps": 9134, "loss": 0.7581, "learning_rate": 4.975183779293129e-05, "epoch": 0.04488354908453981, "percentage": 4.49, "elapsed_time": "7:36:10", "remaining_time": "6 days, 17:46:40", "throughput": 2714.73, "total_tokens": 74304608} {"current_steps": 411, "total_steps": 9134, "loss": 0.7161, "learning_rate": 4.975062778829073e-05, "epoch": 0.04499302115547771, "percentage": 4.5, "elapsed_time": "7:37:18", "remaining_time": "6 days, 17:45:44", "throughput": 2714.8, "total_tokens": 74489408} {"current_steps": 412, "total_steps": 9134, "loss": 0.6762, "learning_rate": 4.9749414855698216e-05, "epoch": 0.04510249322641561, "percentage": 4.51, "elapsed_time": "7:38:26", "remaining_time": "6 days, 17:45:17", "throughput": 2715.42, "total_tokens": 74692800} {"current_steps": 413, "total_steps": 9134, "loss": 0.6548, "learning_rate": 4.974819899529725e-05, "epoch": 0.04521196529735351, "percentage": 4.52, "elapsed_time": "7:39:32", "remaining_time": "6 days, 17:43:51", "throughput": 2715.37, "total_tokens": 74869984} {"current_steps": 414, "total_steps": 9134, "loss": 0.7919, "learning_rate": 4.9746980207231634e-05, "epoch": 0.04532143736829142, "percentage": 4.53, "elapsed_time": "7:40:42", "remaining_time": "6 days, 17:43:38", "throughput": 2715.79, "total_tokens": 75069792} {"current_steps": 415, "total_steps": 9134, "loss": 0.7385, "learning_rate": 4.9745758491645576e-05, "epoch": 0.04543090943922932, "percentage": 4.54, "elapsed_time": "7:41:49", "remaining_time": "6 days, 17:42:36", "throughput": 2716.14, "total_tokens": 75261536} {"current_steps": 416, "total_steps": 9134, "loss": 0.6277, "learning_rate": 4.97445338486836e-05, "epoch": 0.04554038151016722, "percentage": 4.55, "elapsed_time": "7:42:53", "remaining_time": "6 days, 17:40:47", "throughput": 2715.58, "total_tokens": 75421920} {"current_steps": 417, "total_steps": 9134, "loss": 0.9815, "learning_rate": 4.974330627849057e-05, "epoch": 0.04564985358110512, "percentage": 4.57, "elapsed_time": "7:44:02", "remaining_time": "6 days, 17:40:29", "throughput": 2716.2, "total_tokens": 75626880} {"current_steps": 418, "total_steps": 9134, "loss": 0.7137, "learning_rate": 4.974207578121171e-05, "epoch": 0.04575932565204302, "percentage": 4.58, "elapsed_time": "7:45:11", "remaining_time": "6 days, 17:40:07", "throughput": 2716.22, "total_tokens": 75814592} {"current_steps": 419, "total_steps": 9134, "loss": 0.6356, "learning_rate": 4.974084235699258e-05, "epoch": 0.04586879772298093, "percentage": 4.59, "elapsed_time": "7:46:16", "remaining_time": "6 days, 17:38:11", "throughput": 2716.44, "total_tokens": 75995584} {"current_steps": 420, "total_steps": 9134, "loss": 0.6455, "learning_rate": 4.973960600597909e-05, "epoch": 0.04597826979391883, "percentage": 4.6, "elapsed_time": "7:47:21", "remaining_time": "6 days, 17:36:37", "throughput": 2717.24, "total_tokens": 76195840} {"current_steps": 421, "total_steps": 9134, "loss": 0.6132, "learning_rate": 4.973836672831751e-05, "epoch": 0.04608774186485673, "percentage": 4.61, "elapsed_time": "7:48:26", "remaining_time": "6 days, 17:34:56", "throughput": 2716.74, "total_tokens": 76358912} {"current_steps": 422, "total_steps": 9134, "loss": 0.7666, "learning_rate": 4.973712452415444e-05, "epoch": 0.04619721393579463, "percentage": 4.62, "elapsed_time": "7:49:32", "remaining_time": "6 days, 17:33:35", "throughput": 2717.3, "total_tokens": 76554016} {"current_steps": 423, "total_steps": 9134, "loss": 0.7632, "learning_rate": 4.9735879393636826e-05, "epoch": 0.04630668600673253, "percentage": 4.63, "elapsed_time": "7:50:35", "remaining_time": "6 days, 17:31:14", "throughput": 2717.28, "total_tokens": 76725152} {"current_steps": 424, "total_steps": 9134, "loss": 0.5968, "learning_rate": 4.9734631336911964e-05, "epoch": 0.04641615807767043, "percentage": 4.64, "elapsed_time": "7:51:43", "remaining_time": "6 days, 17:30:27", "throughput": 2717.87, "total_tokens": 76925856} {"current_steps": 425, "total_steps": 9134, "loss": 0.7795, "learning_rate": 4.97333803541275e-05, "epoch": 0.04652563014860834, "percentage": 4.65, "elapsed_time": "7:52:52", "remaining_time": "6 days, 17:30:06", "throughput": 2717.39, "total_tokens": 77099680} {"current_steps": 426, "total_steps": 9134, "loss": 0.8507, "learning_rate": 4.973212644543143e-05, "epoch": 0.04663510221954624, "percentage": 4.66, "elapsed_time": "7:54:01", "remaining_time": "6 days, 17:29:45", "throughput": 2717.89, "total_tokens": 77301280} {"current_steps": 427, "total_steps": 9134, "loss": 0.6908, "learning_rate": 4.973086961097207e-05, "epoch": 0.04674457429048414, "percentage": 4.67, "elapsed_time": "7:55:07", "remaining_time": "6 days, 17:28:20", "throughput": 2717.41, "total_tokens": 77466816} {"current_steps": 428, "total_steps": 9134, "loss": 0.7843, "learning_rate": 4.972960985089812e-05, "epoch": 0.04685404636142204, "percentage": 4.69, "elapsed_time": "7:56:15", "remaining_time": "6 days, 17:27:28", "throughput": 2717.45, "total_tokens": 77651392} {"current_steps": 429, "total_steps": 9134, "loss": 0.741, "learning_rate": 4.97283471653586e-05, "epoch": 0.04696351843235994, "percentage": 4.7, "elapsed_time": "7:57:18", "remaining_time": "6 days, 17:25:23", "throughput": 2717.15, "total_tokens": 77816256} {"current_steps": 430, "total_steps": 9134, "loss": 0.8123, "learning_rate": 4.972708155450288e-05, "epoch": 0.04707299050329784, "percentage": 4.71, "elapsed_time": "7:58:24", "remaining_time": "6 days, 17:23:46", "throughput": 2716.99, "total_tokens": 77988960} {"current_steps": 431, "total_steps": 9134, "loss": 0.7105, "learning_rate": 4.972581301848068e-05, "epoch": 0.04718246257423575, "percentage": 4.72, "elapsed_time": "7:59:28", "remaining_time": "6 days, 17:21:40", "throughput": 2716.74, "total_tokens": 78155392} {"current_steps": 432, "total_steps": 9134, "loss": 0.6943, "learning_rate": 4.972454155744207e-05, "epoch": 0.04729193464517365, "percentage": 4.73, "elapsed_time": "8:00:35", "remaining_time": "6 days, 17:20:43", "throughput": 2717.23, "total_tokens": 78351840} {"current_steps": 433, "total_steps": 9134, "loss": 0.8766, "learning_rate": 4.9723267171537455e-05, "epoch": 0.04740140671611155, "percentage": 4.74, "elapsed_time": "8:01:40", "remaining_time": "6 days, 17:19:15", "throughput": 2716.56, "total_tokens": 78511328} {"current_steps": 434, "total_steps": 9134, "loss": 0.7637, "learning_rate": 4.9721989860917605e-05, "epoch": 0.04751087878704945, "percentage": 4.75, "elapsed_time": "8:02:49", "remaining_time": "6 days, 17:18:40", "throughput": 2716.95, "total_tokens": 78708000} {"current_steps": 435, "total_steps": 9134, "loss": 0.6539, "learning_rate": 4.9720709625733614e-05, "epoch": 0.047620350857987354, "percentage": 4.76, "elapsed_time": "8:03:58", "remaining_time": "6 days, 17:18:15", "throughput": 2717.06, "total_tokens": 78898400} {"current_steps": 436, "total_steps": 9134, "loss": 0.5621, "learning_rate": 4.971942646613693e-05, "epoch": 0.04772982292892526, "percentage": 4.77, "elapsed_time": "8:05:04", "remaining_time": "6 days, 17:16:53", "throughput": 2717.08, "total_tokens": 79078272} {"current_steps": 437, "total_steps": 9134, "loss": 0.757, "learning_rate": 4.971814038227934e-05, "epoch": 0.04783929499986316, "percentage": 4.78, "elapsed_time": "8:06:09", "remaining_time": "6 days, 17:15:17", "throughput": 2716.98, "total_tokens": 79252544} {"current_steps": 438, "total_steps": 9134, "loss": 0.5888, "learning_rate": 4.971685137431301e-05, "epoch": 0.04794876707080106, "percentage": 4.8, "elapsed_time": "8:07:12", "remaining_time": "6 days, 17:13:01", "throughput": 2716.83, "total_tokens": 79420096} {"current_steps": 439, "total_steps": 9134, "loss": 0.7311, "learning_rate": 4.971555944239041e-05, "epoch": 0.04805823914173896, "percentage": 4.81, "elapsed_time": "8:08:18", "remaining_time": "6 days, 17:11:41", "throughput": 2716.9, "total_tokens": 79601760} {"current_steps": 440, "total_steps": 9134, "loss": 0.8492, "learning_rate": 4.971426458666437e-05, "epoch": 0.048167711212676864, "percentage": 4.82, "elapsed_time": "8:09:23", "remaining_time": "6 days, 17:09:49", "throughput": 2716.5, "total_tokens": 79765056} {"current_steps": 441, "total_steps": 9134, "loss": 0.6302, "learning_rate": 4.9712966807288085e-05, "epoch": 0.048277183283614765, "percentage": 4.83, "elapsed_time": "8:10:30", "remaining_time": "6 days, 17:08:59", "throughput": 2716.67, "total_tokens": 79953664} {"current_steps": 442, "total_steps": 9134, "loss": 0.7277, "learning_rate": 4.971166610441507e-05, "epoch": 0.04838665535455267, "percentage": 4.84, "elapsed_time": "8:11:36", "remaining_time": "6 days, 17:07:24", "throughput": 2716.75, "total_tokens": 80133536} {"current_steps": 443, "total_steps": 9134, "loss": 0.7773, "learning_rate": 4.9710362478199186e-05, "epoch": 0.04849612742549057, "percentage": 4.85, "elapsed_time": "8:12:43", "remaining_time": "6 days, 17:06:34", "throughput": 2717.1, "total_tokens": 80327296} {"current_steps": 444, "total_steps": 9134, "loss": 1.0182, "learning_rate": 4.9709055928794664e-05, "epoch": 0.048605599496428474, "percentage": 4.86, "elapsed_time": "8:13:50", "remaining_time": "6 days, 17:05:36", "throughput": 2717.82, "total_tokens": 80531136} {"current_steps": 445, "total_steps": 9134, "loss": 0.6257, "learning_rate": 4.970774645635606e-05, "epoch": 0.048715071567366375, "percentage": 4.87, "elapsed_time": "8:14:57", "remaining_time": "6 days, 17:04:21", "throughput": 2718.28, "total_tokens": 80725120} {"current_steps": 446, "total_steps": 9134, "loss": 0.9036, "learning_rate": 4.970643406103828e-05, "epoch": 0.048824543638304276, "percentage": 4.88, "elapsed_time": "8:16:04", "remaining_time": "6 days, 17:03:20", "throughput": 2717.51, "total_tokens": 80884384} {"current_steps": 447, "total_steps": 9134, "loss": 0.7362, "learning_rate": 4.970511874299659e-05, "epoch": 0.048934015709242176, "percentage": 4.89, "elapsed_time": "8:17:07", "remaining_time": "6 days, 17:01:02", "throughput": 2717.47, "total_tokens": 81054624} {"current_steps": 448, "total_steps": 9134, "loss": 0.7956, "learning_rate": 4.9703800502386574e-05, "epoch": 0.049043487780180084, "percentage": 4.9, "elapsed_time": "8:18:15", "remaining_time": "6 days, 17:00:35", "throughput": 2717.37, "total_tokens": 81238528} {"current_steps": 449, "total_steps": 9134, "loss": 0.5557, "learning_rate": 4.970247933936418e-05, "epoch": 0.049152959851117985, "percentage": 4.92, "elapsed_time": "8:19:24", "remaining_time": "6 days, 16:59:59", "throughput": 2717.23, "total_tokens": 81419968} {"current_steps": 450, "total_steps": 9134, "loss": 0.6252, "learning_rate": 4.970115525408572e-05, "epoch": 0.049262431922055885, "percentage": 4.93, "elapsed_time": "8:20:31", "remaining_time": "6 days, 16:58:57", "throughput": 2717.15, "total_tokens": 81599392} {"current_steps": 451, "total_steps": 9134, "loss": 0.76, "learning_rate": 4.96998282467078e-05, "epoch": 0.049371903992993786, "percentage": 4.94, "elapsed_time": "8:21:33", "remaining_time": "6 days, 16:56:14", "throughput": 2716.61, "total_tokens": 81751040} {"current_steps": 452, "total_steps": 9134, "loss": 0.9865, "learning_rate": 4.969849831738742e-05, "epoch": 0.04948137606393169, "percentage": 4.95, "elapsed_time": "8:22:39", "remaining_time": "6 days, 16:55:02", "throughput": 2716.72, "total_tokens": 81934944} {"current_steps": 453, "total_steps": 9134, "loss": 0.6187, "learning_rate": 4.96971654662819e-05, "epoch": 0.049590848134869595, "percentage": 4.96, "elapsed_time": "8:23:43", "remaining_time": "6 days, 16:53:02", "throughput": 2716.07, "total_tokens": 82089056} {"current_steps": 454, "total_steps": 9134, "loss": 0.6141, "learning_rate": 4.969582969354892e-05, "epoch": 0.049700320205807495, "percentage": 4.97, "elapsed_time": "8:24:49", "remaining_time": "6 days, 16:51:35", "throughput": 2716.58, "total_tokens": 82282816} {"current_steps": 455, "total_steps": 9134, "loss": 0.7181, "learning_rate": 4.96944909993465e-05, "epoch": 0.049809792276745396, "percentage": 4.98, "elapsed_time": "8:25:50", "remaining_time": "6 days, 16:48:53", "throughput": 2716.28, "total_tokens": 82441408} {"current_steps": 456, "total_steps": 9134, "loss": 0.8364, "learning_rate": 4.969314938383301e-05, "epoch": 0.0499192643476833, "percentage": 4.99, "elapsed_time": "8:26:57", "remaining_time": "6 days, 16:47:45", "throughput": 2717.13, "total_tokens": 82648160} {"current_steps": 457, "total_steps": 9134, "loss": 0.6264, "learning_rate": 4.9691804847167146e-05, "epoch": 0.0500287364186212, "percentage": 5.0, "elapsed_time": "8:27:57", "remaining_time": "6 days, 16:44:29", "throughput": 2716.22, "total_tokens": 82783232} {"current_steps": 458, "total_steps": 9134, "loss": 0.5421, "learning_rate": 4.969045738950797e-05, "epoch": 0.0501382084895591, "percentage": 5.01, "elapsed_time": "8:28:59", "remaining_time": "6 days, 16:42:00", "throughput": 2715.8, "total_tokens": 82939584} {"current_steps": 459, "total_steps": 9134, "loss": 0.8048, "learning_rate": 4.968910701101489e-05, "epoch": 0.050247680560497006, "percentage": 5.03, "elapsed_time": "8:30:08", "remaining_time": "6 days, 16:41:39", "throughput": 2715.12, "total_tokens": 83106464} {"current_steps": 460, "total_steps": 9134, "loss": 0.7047, "learning_rate": 4.968775371184764e-05, "epoch": 0.05035715263143491, "percentage": 5.04, "elapsed_time": "8:31:14", "remaining_time": "6 days, 16:40:12", "throughput": 2714.9, "total_tokens": 83278048} {"current_steps": 461, "total_steps": 9134, "loss": 0.7417, "learning_rate": 4.968639749216632e-05, "epoch": 0.05046662470237281, "percentage": 5.05, "elapsed_time": "8:32:20", "remaining_time": "6 days, 16:38:50", "throughput": 2714.35, "total_tokens": 83439776} {"current_steps": 462, "total_steps": 9134, "loss": 0.9568, "learning_rate": 4.968503835213138e-05, "epoch": 0.05057609677331071, "percentage": 5.06, "elapsed_time": "8:33:26", "remaining_time": "6 days, 16:37:40", "throughput": 2715.04, "total_tokens": 83641600} {"current_steps": 463, "total_steps": 9134, "loss": 0.676, "learning_rate": 4.9683676291903594e-05, "epoch": 0.05068556884424861, "percentage": 5.07, "elapsed_time": "8:34:34", "remaining_time": "6 days, 16:36:44", "throughput": 2715.42, "total_tokens": 83836032} {"current_steps": 464, "total_steps": 9134, "loss": 0.6472, "learning_rate": 4.968231131164408e-05, "epoch": 0.050795040915186516, "percentage": 5.08, "elapsed_time": "8:35:42", "remaining_time": "6 days, 16:36:19", "throughput": 2716.05, "total_tokens": 84042560} {"current_steps": 465, "total_steps": 9134, "loss": 0.7965, "learning_rate": 4.968094341151433e-05, "epoch": 0.05090451298612442, "percentage": 5.09, "elapsed_time": "8:36:49", "remaining_time": "6 days, 16:35:14", "throughput": 2716.25, "total_tokens": 84230048} {"current_steps": 466, "total_steps": 9134, "loss": 0.7549, "learning_rate": 4.967957259167615e-05, "epoch": 0.05101398505706232, "percentage": 5.1, "elapsed_time": "8:37:57", "remaining_time": "6 days, 16:34:28", "throughput": 2716.58, "total_tokens": 84424480} {"current_steps": 467, "total_steps": 9134, "loss": 0.8055, "learning_rate": 4.967819885229171e-05, "epoch": 0.05112345712800022, "percentage": 5.11, "elapsed_time": "8:39:00", "remaining_time": "6 days, 16:32:21", "throughput": 2716.58, "total_tokens": 84596736} {"current_steps": 468, "total_steps": 9134, "loss": 0.789, "learning_rate": 4.967682219352353e-05, "epoch": 0.05123292919893812, "percentage": 5.12, "elapsed_time": "8:40:04", "remaining_time": "6 days, 16:30:25", "throughput": 2716.24, "total_tokens": 84760256} {"current_steps": 469, "total_steps": 9134, "loss": 0.6364, "learning_rate": 4.967544261553445e-05, "epoch": 0.05134240126987602, "percentage": 5.13, "elapsed_time": "8:41:07", "remaining_time": "6 days, 16:27:53", "throughput": 2715.63, "total_tokens": 84909664} {"current_steps": 470, "total_steps": 9134, "loss": 0.715, "learning_rate": 4.967406011848769e-05, "epoch": 0.05145187334081393, "percentage": 5.15, "elapsed_time": "8:42:13", "remaining_time": "6 days, 16:26:42", "throughput": 2715.37, "total_tokens": 85081920} {"current_steps": 471, "total_steps": 9134, "loss": 0.8409, "learning_rate": 4.967267470254678e-05, "epoch": 0.05156134541175183, "percentage": 5.16, "elapsed_time": "8:43:22", "remaining_time": "6 days, 16:26:17", "throughput": 2715.81, "total_tokens": 85282848} {"current_steps": 472, "total_steps": 9134, "loss": 0.6408, "learning_rate": 4.967128636787562e-05, "epoch": 0.05167081748268973, "percentage": 5.17, "elapsed_time": "8:44:24", "remaining_time": "6 days, 16:23:55", "throughput": 2715.25, "total_tokens": 85435168} {"current_steps": 473, "total_steps": 9134, "loss": 0.7552, "learning_rate": 4.9669895114638445e-05, "epoch": 0.05178028955362763, "percentage": 5.18, "elapsed_time": "8:45:30", "remaining_time": "6 days, 16:22:32", "throughput": 2715.32, "total_tokens": 85615936} {"current_steps": 474, "total_steps": 9134, "loss": 0.74, "learning_rate": 4.966850094299984e-05, "epoch": 0.05188976162456553, "percentage": 5.19, "elapsed_time": "8:46:38", "remaining_time": "6 days, 16:21:38", "throughput": 2715.55, "total_tokens": 85806112} {"current_steps": 475, "total_steps": 9134, "loss": 0.7766, "learning_rate": 4.966710385312473e-05, "epoch": 0.05199923369550343, "percentage": 5.2, "elapsed_time": "8:47:47", "remaining_time": "6 days, 16:21:23", "throughput": 2715.85, "total_tokens": 86004352} {"current_steps": 476, "total_steps": 9134, "loss": 0.9263, "learning_rate": 4.966570384517839e-05, "epoch": 0.05210870576644134, "percentage": 5.21, "elapsed_time": "8:48:57", "remaining_time": "6 days, 16:21:07", "throughput": 2716.7, "total_tokens": 86220064} {"current_steps": 477, "total_steps": 9134, "loss": 0.8275, "learning_rate": 4.966430091932645e-05, "epoch": 0.05221817783737924, "percentage": 5.22, "elapsed_time": "8:50:04", "remaining_time": "6 days, 16:20:08", "throughput": 2716.82, "total_tokens": 86406208} {"current_steps": 478, "total_steps": 9134, "loss": 0.5834, "learning_rate": 4.9662895075734844e-05, "epoch": 0.05232764990831714, "percentage": 5.23, "elapsed_time": "8:51:12", "remaining_time": "6 days, 16:19:28", "throughput": 2717.28, "total_tokens": 86605792} {"current_steps": 479, "total_steps": 9134, "loss": 0.7686, "learning_rate": 4.9661486314569904e-05, "epoch": 0.05243712197925504, "percentage": 5.24, "elapsed_time": "8:52:19", "remaining_time": "6 days, 16:18:22", "throughput": 2716.99, "total_tokens": 86778048} {"current_steps": 480, "total_steps": 9134, "loss": 0.645, "learning_rate": 4.966007463599828e-05, "epoch": 0.05254659405019294, "percentage": 5.26, "elapsed_time": "8:53:27", "remaining_time": "6 days, 16:17:42", "throughput": 2717.46, "total_tokens": 86978304} {"current_steps": 481, "total_steps": 9134, "loss": 0.6926, "learning_rate": 4.9658660040186967e-05, "epoch": 0.05265606612113085, "percentage": 5.27, "elapsed_time": "8:54:34", "remaining_time": "6 days, 16:16:53", "throughput": 2717.73, "total_tokens": 87170720} {"current_steps": 482, "total_steps": 9134, "loss": 0.8736, "learning_rate": 4.965724252730331e-05, "epoch": 0.05276553819206875, "percentage": 5.28, "elapsed_time": "8:55:39", "remaining_time": "6 days, 16:15:15", "throughput": 2717.13, "total_tokens": 87327968} {"current_steps": 483, "total_steps": 9134, "loss": 0.7194, "learning_rate": 4.9655822097515e-05, "epoch": 0.05287501026300665, "percentage": 5.29, "elapsed_time": "8:56:42", "remaining_time": "6 days, 16:12:54", "throughput": 2716.76, "total_tokens": 87485888} {"current_steps": 484, "total_steps": 9134, "loss": 0.9113, "learning_rate": 4.9654398750990075e-05, "epoch": 0.05298448233394455, "percentage": 5.3, "elapsed_time": "8:57:46", "remaining_time": "6 days, 16:11:05", "throughput": 2716.24, "total_tokens": 87643808} {"current_steps": 485, "total_steps": 9134, "loss": 0.6416, "learning_rate": 4.96529724878969e-05, "epoch": 0.05309395440488245, "percentage": 5.31, "elapsed_time": "8:58:55", "remaining_time": "6 days, 16:10:44", "throughput": 2716.86, "total_tokens": 87852128} {"current_steps": 486, "total_steps": 9134, "loss": 0.707, "learning_rate": 4.9651543308404217e-05, "epoch": 0.05320342647582035, "percentage": 5.32, "elapsed_time": "9:00:05", "remaining_time": "6 days, 16:10:29", "throughput": 2717.54, "total_tokens": 88062912} {"current_steps": 487, "total_steps": 9134, "loss": 0.7899, "learning_rate": 4.9650111212681073e-05, "epoch": 0.05331289854675826, "percentage": 5.33, "elapsed_time": "9:01:13", "remaining_time": "6 days, 16:09:39", "throughput": 2717.58, "total_tokens": 88247936} {"current_steps": 488, "total_steps": 9134, "loss": 0.8035, "learning_rate": 4.96486762008969e-05, "epoch": 0.05342237061769616, "percentage": 5.34, "elapsed_time": "9:02:22", "remaining_time": "6 days, 16:09:15", "throughput": 2717.5, "total_tokens": 88433184} {"current_steps": 489, "total_steps": 9134, "loss": 0.6418, "learning_rate": 4.964723827322147e-05, "epoch": 0.05353184268863406, "percentage": 5.35, "elapsed_time": "9:03:25", "remaining_time": "6 days, 16:07:15", "throughput": 2716.91, "total_tokens": 88586848} {"current_steps": 490, "total_steps": 9134, "loss": 0.6706, "learning_rate": 4.9645797429824846e-05, "epoch": 0.05364131475957196, "percentage": 5.36, "elapsed_time": "9:04:29", "remaining_time": "6 days, 16:05:23", "throughput": 2717.1, "total_tokens": 88767392} {"current_steps": 491, "total_steps": 9134, "loss": 0.9752, "learning_rate": 4.964435367087751e-05, "epoch": 0.053750786830509864, "percentage": 5.38, "elapsed_time": "9:05:36", "remaining_time": "6 days, 16:04:13", "throughput": 2717.46, "total_tokens": 88959808} {"current_steps": 492, "total_steps": 9134, "loss": 0.8196, "learning_rate": 4.9642906996550256e-05, "epoch": 0.053860258901447765, "percentage": 5.39, "elapsed_time": "9:06:43", "remaining_time": "6 days, 16:03:10", "throughput": 2717.82, "total_tokens": 89153568} {"current_steps": 493, "total_steps": 9134, "loss": 0.8177, "learning_rate": 4.96414574070142e-05, "epoch": 0.05396973097238567, "percentage": 5.4, "elapsed_time": "9:07:46", "remaining_time": "6 days, 16:01:08", "throughput": 2717.22, "total_tokens": 89306112} {"current_steps": 494, "total_steps": 9134, "loss": 0.6267, "learning_rate": 4.964000490244084e-05, "epoch": 0.05407920304332357, "percentage": 5.41, "elapsed_time": "9:08:51", "remaining_time": "6 days, 15:59:34", "throughput": 2716.92, "total_tokens": 89473440} {"current_steps": 495, "total_steps": 9134, "loss": 0.7453, "learning_rate": 4.963854948300201e-05, "epoch": 0.054188675114261474, "percentage": 5.42, "elapsed_time": "9:09:54", "remaining_time": "6 days, 15:57:25", "throughput": 2716.58, "total_tokens": 89633376} {"current_steps": 496, "total_steps": 9134, "loss": 0.7179, "learning_rate": 4.963709114886988e-05, "epoch": 0.054298147185199375, "percentage": 5.43, "elapsed_time": "9:10:58", "remaining_time": "6 days, 15:55:23", "throughput": 2716.29, "total_tokens": 89796224} {"current_steps": 497, "total_steps": 9134, "loss": 0.707, "learning_rate": 4.9635629900216956e-05, "epoch": 0.054407619256137275, "percentage": 5.44, "elapsed_time": "9:12:05", "remaining_time": "6 days, 15:54:23", "throughput": 2715.71, "total_tokens": 89959296} {"current_steps": 498, "total_steps": 9134, "loss": 0.6263, "learning_rate": 4.963416573721611e-05, "epoch": 0.05451709132707518, "percentage": 5.45, "elapsed_time": "9:13:09", "remaining_time": "6 days, 15:52:38", "throughput": 2715.64, "total_tokens": 90131776} {"current_steps": 499, "total_steps": 9134, "loss": 0.6307, "learning_rate": 4.9632698660040556e-05, "epoch": 0.054626563398013084, "percentage": 5.46, "elapsed_time": "9:14:14", "remaining_time": "6 days, 15:50:47", "throughput": 2715.66, "total_tokens": 90306720} {"current_steps": 500, "total_steps": 9134, "loss": 0.7336, "learning_rate": 4.963122866886384e-05, "epoch": 0.054736035468950985, "percentage": 5.47, "elapsed_time": "9:15:23", "remaining_time": "6 days, 15:50:21", "throughput": 2715.85, "total_tokens": 90500480} {"current_steps": 501, "total_steps": 9134, "loss": 0.8413, "learning_rate": 4.9629755763859855e-05, "epoch": 0.054845507539888885, "percentage": 5.49, "elapsed_time": "9:16:27", "remaining_time": "6 days, 15:48:30", "throughput": 2715.62, "total_tokens": 90666688} {"current_steps": 502, "total_steps": 9134, "loss": 0.8012, "learning_rate": 4.9628279945202856e-05, "epoch": 0.054954979610826786, "percentage": 5.5, "elapsed_time": "9:17:34", "remaining_time": "6 days, 15:47:35", "throughput": 2716.04, "total_tokens": 90863360} {"current_steps": 503, "total_steps": 9134, "loss": 0.7848, "learning_rate": 4.962680121306741e-05, "epoch": 0.05506445168176469, "percentage": 5.51, "elapsed_time": "9:18:44", "remaining_time": "6 days, 15:47:19", "throughput": 2716.62, "total_tokens": 91072128} {"current_steps": 504, "total_steps": 9134, "loss": 0.8546, "learning_rate": 4.962531956762847e-05, "epoch": 0.055173923752702594, "percentage": 5.52, "elapsed_time": "9:19:48", "remaining_time": "6 days, 15:45:34", "throughput": 2716.33, "total_tokens": 91237216} {"current_steps": 505, "total_steps": 9134, "loss": 0.5563, "learning_rate": 4.9623835009061294e-05, "epoch": 0.055283395823640495, "percentage": 5.53, "elapsed_time": "9:20:51", "remaining_time": "6 days, 15:43:33", "throughput": 2715.94, "total_tokens": 91396480} {"current_steps": 506, "total_steps": 9134, "loss": 1.0451, "learning_rate": 4.962234753754151e-05, "epoch": 0.055392867894578396, "percentage": 5.54, "elapsed_time": "9:22:00", "remaining_time": "6 days, 15:43:02", "throughput": 2716.72, "total_tokens": 91609504} {"current_steps": 507, "total_steps": 9134, "loss": 0.7494, "learning_rate": 4.962085715324508e-05, "epoch": 0.0555023399655163, "percentage": 5.55, "elapsed_time": "9:23:09", "remaining_time": "6 days, 15:42:30", "throughput": 2717.03, "total_tokens": 91806400} {"current_steps": 508, "total_steps": 9134, "loss": 0.7988, "learning_rate": 4.9619363856348324e-05, "epoch": 0.0556118120364542, "percentage": 5.56, "elapsed_time": "9:24:13", "remaining_time": "6 days, 15:40:40", "throughput": 2716.57, "total_tokens": 91965216} {"current_steps": 509, "total_steps": 9134, "loss": 0.6388, "learning_rate": 4.9617867647027876e-05, "epoch": 0.055721284107392105, "percentage": 5.57, "elapsed_time": "9:25:17", "remaining_time": "6 days, 15:38:44", "throughput": 2716.21, "total_tokens": 92125824} {"current_steps": 510, "total_steps": 9134, "loss": 0.6663, "learning_rate": 4.961636852546075e-05, "epoch": 0.055830756178330006, "percentage": 5.58, "elapsed_time": "9:26:19", "remaining_time": "6 days, 15:36:35", "throughput": 2715.25, "total_tokens": 92264256} {"current_steps": 511, "total_steps": 9134, "loss": 0.6275, "learning_rate": 4.961486649182429e-05, "epoch": 0.055940228249267906, "percentage": 5.59, "elapsed_time": "9:27:25", "remaining_time": "6 days, 15:35:04", "throughput": 2715.5, "total_tokens": 92449952} {"current_steps": 512, "total_steps": 9134, "loss": 0.9085, "learning_rate": 4.961336154629618e-05, "epoch": 0.05604970032020581, "percentage": 5.61, "elapsed_time": "9:28:31", "remaining_time": "6 days, 15:33:50", "throughput": 2715.67, "total_tokens": 92635200} {"current_steps": 513, "total_steps": 9134, "loss": 0.6674, "learning_rate": 4.961185368905445e-05, "epoch": 0.05615917239114371, "percentage": 5.62, "elapsed_time": "9:29:40", "remaining_time": "6 days, 15:33:22", "throughput": 2716.61, "total_tokens": 92854720} {"current_steps": 514, "total_steps": 9134, "loss": 0.8299, "learning_rate": 4.9610342920277475e-05, "epoch": 0.05626864446208161, "percentage": 5.63, "elapsed_time": "9:30:48", "remaining_time": "6 days, 15:32:47", "throughput": 2717.37, "total_tokens": 93066848} {"current_steps": 515, "total_steps": 9134, "loss": 0.6689, "learning_rate": 4.960882924014398e-05, "epoch": 0.056378116533019516, "percentage": 5.64, "elapsed_time": "9:31:54", "remaining_time": "6 days, 15:31:24", "throughput": 2717.56, "total_tokens": 93251648} {"current_steps": 516, "total_steps": 9134, "loss": 0.5849, "learning_rate": 4.960731264883304e-05, "epoch": 0.05648758860395742, "percentage": 5.65, "elapsed_time": "9:32:58", "remaining_time": "6 days, 15:29:37", "throughput": 2716.77, "total_tokens": 93399040} {"current_steps": 517, "total_steps": 9134, "loss": 0.689, "learning_rate": 4.960579314652405e-05, "epoch": 0.05659706067489532, "percentage": 5.66, "elapsed_time": "9:34:06", "remaining_time": "6 days, 15:28:42", "throughput": 2716.48, "total_tokens": 93571968} {"current_steps": 518, "total_steps": 9134, "loss": 1.0275, "learning_rate": 4.960427073339676e-05, "epoch": 0.05670653274583322, "percentage": 5.67, "elapsed_time": "9:35:12", "remaining_time": "6 days, 15:27:33", "throughput": 2716.56, "total_tokens": 93755200} {"current_steps": 519, "total_steps": 9134, "loss": 0.7858, "learning_rate": 4.960274540963129e-05, "epoch": 0.05681600481677112, "percentage": 5.68, "elapsed_time": "9:36:18", "remaining_time": "6 days, 15:26:09", "throughput": 2715.93, "total_tokens": 93911776} {"current_steps": 520, "total_steps": 9134, "loss": 0.6032, "learning_rate": 4.9601217175408064e-05, "epoch": 0.05692547688770902, "percentage": 5.69, "elapsed_time": "9:37:21", "remaining_time": "6 days, 15:24:04", "throughput": 2715.09, "total_tokens": 94054016} {"current_steps": 521, "total_steps": 9134, "loss": 0.9303, "learning_rate": 4.959968603090788e-05, "epoch": 0.05703494895864693, "percentage": 5.7, "elapsed_time": "9:38:30", "remaining_time": "6 days, 15:23:41", "throughput": 2715.9, "total_tokens": 94269952} {"current_steps": 522, "total_steps": 9134, "loss": 0.7497, "learning_rate": 4.959815197631186e-05, "epoch": 0.05714442102958483, "percentage": 5.71, "elapsed_time": "9:39:39", "remaining_time": "6 days, 15:23:14", "throughput": 2716.21, "total_tokens": 94468416} {"current_steps": 523, "total_steps": 9134, "loss": 0.5854, "learning_rate": 4.9596615011801486e-05, "epoch": 0.05725389310052273, "percentage": 5.73, "elapsed_time": "9:40:47", "remaining_time": "6 days, 15:22:33", "throughput": 2716.43, "total_tokens": 94661280} {"current_steps": 524, "total_steps": 9134, "loss": 0.6438, "learning_rate": 4.959507513755858e-05, "epoch": 0.05736336517146063, "percentage": 5.74, "elapsed_time": "9:41:51", "remaining_time": "6 days, 15:20:37", "throughput": 2716.48, "total_tokens": 94835776} {"current_steps": 525, "total_steps": 9134, "loss": 0.8989, "learning_rate": 4.95935323537653e-05, "epoch": 0.05747283724239853, "percentage": 5.75, "elapsed_time": "9:42:57", "remaining_time": "6 days, 15:19:24", "throughput": 2716.53, "total_tokens": 95017216} {"current_steps": 526, "total_steps": 9134, "loss": 0.6791, "learning_rate": 4.9591986660604164e-05, "epoch": 0.05758230931333644, "percentage": 5.76, "elapsed_time": "9:44:06", "remaining_time": "6 days, 15:18:56", "throughput": 2716.97, "total_tokens": 95220384} {"current_steps": 527, "total_steps": 9134, "loss": 0.7801, "learning_rate": 4.959043805825801e-05, "epoch": 0.05769178138427434, "percentage": 5.77, "elapsed_time": "9:45:13", "remaining_time": "6 days, 15:17:53", "throughput": 2717.01, "total_tokens": 95403392} {"current_steps": 528, "total_steps": 9134, "loss": 0.8164, "learning_rate": 4.958888654691004e-05, "epoch": 0.05780125345521224, "percentage": 5.78, "elapsed_time": "9:46:22", "remaining_time": "6 days, 15:17:26", "throughput": 2717.15, "total_tokens": 95595808} {"current_steps": 529, "total_steps": 9134, "loss": 0.7436, "learning_rate": 4.95873321267438e-05, "epoch": 0.05791072552615014, "percentage": 5.79, "elapsed_time": "9:47:28", "remaining_time": "6 days, 15:16:06", "throughput": 2717.18, "total_tokens": 95775680} {"current_steps": 530, "total_steps": 9134, "loss": 0.6967, "learning_rate": 4.958577479794317e-05, "epoch": 0.05802019759708804, "percentage": 5.8, "elapsed_time": "9:48:36", "remaining_time": "6 days, 15:15:27", "throughput": 2717.17, "total_tokens": 95961152} {"current_steps": 531, "total_steps": 9134, "loss": 0.6337, "learning_rate": 4.958421456069239e-05, "epoch": 0.05812966966802594, "percentage": 5.81, "elapsed_time": "9:49:45", "remaining_time": "6 days, 15:15:02", "throughput": 2717.83, "total_tokens": 96172384} {"current_steps": 532, "total_steps": 9134, "loss": 0.6596, "learning_rate": 4.9582651415176026e-05, "epoch": 0.05823914173896385, "percentage": 5.82, "elapsed_time": "9:50:53", "remaining_time": "6 days, 15:14:17", "throughput": 2718.01, "total_tokens": 96363680} {"current_steps": 533, "total_steps": 9134, "loss": 0.664, "learning_rate": 4.958108536157899e-05, "epoch": 0.05834861380990175, "percentage": 5.84, "elapsed_time": "9:51:59", "remaining_time": "6 days, 15:12:58", "throughput": 2717.47, "total_tokens": 96523392} {"current_steps": 534, "total_steps": 9134, "loss": 0.687, "learning_rate": 4.9579516400086545e-05, "epoch": 0.05845808588083965, "percentage": 5.85, "elapsed_time": "9:53:03", "remaining_time": "6 days, 15:11:15", "throughput": 2717.18, "total_tokens": 96688256} {"current_steps": 535, "total_steps": 9134, "loss": 0.6981, "learning_rate": 4.9577944530884295e-05, "epoch": 0.05856755795177755, "percentage": 5.86, "elapsed_time": "9:54:06", "remaining_time": "6 days, 15:09:10", "throughput": 2717.14, "total_tokens": 96857824} {"current_steps": 536, "total_steps": 9134, "loss": 0.6295, "learning_rate": 4.9576369754158194e-05, "epoch": 0.05867703002271545, "percentage": 5.87, "elapsed_time": "9:55:15", "remaining_time": "6 days, 15:08:31", "throughput": 2717.19, "total_tokens": 97045312} {"current_steps": 537, "total_steps": 9134, "loss": 0.9087, "learning_rate": 4.9574792070094534e-05, "epoch": 0.05878650209365335, "percentage": 5.88, "elapsed_time": "9:56:24", "remaining_time": "6 days, 15:08:04", "throughput": 2717.02, "total_tokens": 97227200} {"current_steps": 538, "total_steps": 9134, "loss": 0.7898, "learning_rate": 4.9573211478879955e-05, "epoch": 0.05889597416459126, "percentage": 5.89, "elapsed_time": "9:57:28", "remaining_time": "6 days, 15:06:17", "throughput": 2716.59, "total_tokens": 97385792} {"current_steps": 539, "total_steps": 9134, "loss": 0.63, "learning_rate": 4.9571627980701426e-05, "epoch": 0.05900544623552916, "percentage": 5.9, "elapsed_time": "9:58:37", "remaining_time": "6 days, 15:05:47", "throughput": 2716.4, "total_tokens": 97566336} {"current_steps": 540, "total_steps": 9134, "loss": 0.6892, "learning_rate": 4.9570041575746285e-05, "epoch": 0.05911491830646706, "percentage": 5.91, "elapsed_time": "9:59:42", "remaining_time": "6 days, 15:04:11", "throughput": 2716.38, "total_tokens": 97741504} {"current_steps": 541, "total_steps": 9134, "loss": 0.7597, "learning_rate": 4.9568452264202194e-05, "epoch": 0.05922439037740496, "percentage": 5.92, "elapsed_time": "10:00:47", "remaining_time": "6 days, 15:02:35", "throughput": 2716.61, "total_tokens": 97925856} {"current_steps": 542, "total_steps": 9134, "loss": 0.756, "learning_rate": 4.9566860046257166e-05, "epoch": 0.059333862448342864, "percentage": 5.93, "elapsed_time": "10:01:51", "remaining_time": "6 days, 15:01:00", "throughput": 2716.52, "total_tokens": 98098560} {"current_steps": 543, "total_steps": 9134, "loss": 0.6924, "learning_rate": 4.956526492209956e-05, "epoch": 0.05944333451928077, "percentage": 5.94, "elapsed_time": "10:02:59", "remaining_time": "6 days, 15:00:15", "throughput": 2716.72, "total_tokens": 98290528} {"current_steps": 544, "total_steps": 9134, "loss": 0.5497, "learning_rate": 4.956366689191808e-05, "epoch": 0.05955280659021867, "percentage": 5.96, "elapsed_time": "10:04:04", "remaining_time": "6 days, 14:58:39", "throughput": 2716.47, "total_tokens": 98457408} {"current_steps": 545, "total_steps": 9134, "loss": 0.8472, "learning_rate": 4.956206595590176e-05, "epoch": 0.05966227866115657, "percentage": 5.97, "elapsed_time": "10:05:11", "remaining_time": "6 days, 14:57:32", "throughput": 2716.48, "total_tokens": 98638848} {"current_steps": 546, "total_steps": 9134, "loss": 0.7207, "learning_rate": 4.9560462114239995e-05, "epoch": 0.059771750732094474, "percentage": 5.98, "elapsed_time": "10:06:15", "remaining_time": "6 days, 14:55:40", "throughput": 2716.35, "total_tokens": 98807520} {"current_steps": 547, "total_steps": 9134, "loss": 0.6397, "learning_rate": 4.9558855367122505e-05, "epoch": 0.059881222803032375, "percentage": 5.99, "elapsed_time": "10:07:24", "remaining_time": "6 days, 14:55:16", "throughput": 2717.24, "total_tokens": 99027936} {"current_steps": 548, "total_steps": 9134, "loss": 0.5435, "learning_rate": 4.9557245714739374e-05, "epoch": 0.059990694873970275, "percentage": 6.0, "elapsed_time": "10:08:26", "remaining_time": "6 days, 14:53:05", "throughput": 2717.06, "total_tokens": 99191232} {"current_steps": 549, "total_steps": 9134, "loss": 0.7598, "learning_rate": 4.955563315728103e-05, "epoch": 0.06010016694490818, "percentage": 6.01, "elapsed_time": "10:09:31", "remaining_time": "6 days, 14:51:25", "throughput": 2717.2, "total_tokens": 99371552} {"current_steps": 550, "total_steps": 9134, "loss": 0.7534, "learning_rate": 4.955401769493822e-05, "epoch": 0.060209639015846084, "percentage": 6.02, "elapsed_time": "10:10:34", "remaining_time": "6 days, 14:49:18", "throughput": 2717.25, "total_tokens": 99544032} {"current_steps": 551, "total_steps": 9134, "loss": 0.6839, "learning_rate": 4.9552399327902054e-05, "epoch": 0.060319111086783984, "percentage": 6.03, "elapsed_time": "10:11:42", "remaining_time": "6 days, 14:48:45", "throughput": 2716.96, "total_tokens": 99720096} {"current_steps": 552, "total_steps": 9134, "loss": 0.5825, "learning_rate": 4.955077805636399e-05, "epoch": 0.060428583157721885, "percentage": 6.04, "elapsed_time": "10:12:47", "remaining_time": "6 days, 14:47:04", "throughput": 2716.58, "total_tokens": 99881152} {"current_steps": 553, "total_steps": 9134, "loss": 0.9622, "learning_rate": 4.954915388051581e-05, "epoch": 0.060538055228659786, "percentage": 6.05, "elapsed_time": "10:13:56", "remaining_time": "6 days, 14:46:33", "throughput": 2715.94, "total_tokens": 100044672} {"current_steps": 554, "total_steps": 9134, "loss": 0.6319, "learning_rate": 4.954752680054966e-05, "epoch": 0.060647527299597694, "percentage": 6.07, "elapsed_time": "10:15:02", "remaining_time": "6 days, 14:45:24", "throughput": 2716.01, "total_tokens": 100227680} {"current_steps": 555, "total_steps": 9134, "loss": 0.7092, "learning_rate": 4.954589681665801e-05, "epoch": 0.060756999370535594, "percentage": 6.08, "elapsed_time": "10:16:07", "remaining_time": "6 days, 14:43:47", "throughput": 2716.06, "total_tokens": 100405312} {"current_steps": 556, "total_steps": 9134, "loss": 0.7141, "learning_rate": 4.95442639290337e-05, "epoch": 0.060866471441473495, "percentage": 6.09, "elapsed_time": "10:17:09", "remaining_time": "6 days, 14:41:26", "throughput": 2715.53, "total_tokens": 100553600} {"current_steps": 557, "total_steps": 9134, "loss": 0.6965, "learning_rate": 4.954262813786988e-05, "epoch": 0.060975943512411396, "percentage": 6.1, "elapsed_time": "10:18:10", "remaining_time": "6 days, 14:38:55", "throughput": 2715.57, "total_tokens": 100721152} {"current_steps": 558, "total_steps": 9134, "loss": 0.7073, "learning_rate": 4.954098944336007e-05, "epoch": 0.061085415583349296, "percentage": 6.11, "elapsed_time": "10:19:14", "remaining_time": "6 days, 14:37:09", "throughput": 2715.7, "total_tokens": 100899456} {"current_steps": 559, "total_steps": 9134, "loss": 0.8067, "learning_rate": 4.953934784569812e-05, "epoch": 0.0611948876542872, "percentage": 6.12, "elapsed_time": "10:20:23", "remaining_time": "6 days, 14:36:47", "throughput": 2716.59, "total_tokens": 101121440} {"current_steps": 560, "total_steps": 9134, "loss": 0.5724, "learning_rate": 4.953770334507824e-05, "epoch": 0.061304359725225105, "percentage": 6.13, "elapsed_time": "10:21:31", "remaining_time": "6 days, 14:35:59", "throughput": 2716.56, "total_tokens": 101304448} {"current_steps": 561, "total_steps": 9134, "loss": 0.6555, "learning_rate": 4.9536055941694956e-05, "epoch": 0.061413831796163006, "percentage": 6.14, "elapsed_time": "10:22:37", "remaining_time": "6 days, 14:34:43", "throughput": 2716.49, "total_tokens": 101481184} {"current_steps": 562, "total_steps": 9134, "loss": 0.6492, "learning_rate": 4.9534405635743165e-05, "epoch": 0.061523303867100906, "percentage": 6.15, "elapsed_time": "10:23:47", "remaining_time": "6 days, 14:34:22", "throughput": 2716.72, "total_tokens": 101678976} {"current_steps": 563, "total_steps": 9134, "loss": 0.7577, "learning_rate": 4.953275242741808e-05, "epoch": 0.06163277593803881, "percentage": 6.16, "elapsed_time": "10:24:53", "remaining_time": "6 days, 14:33:06", "throughput": 2716.6, "total_tokens": 101853472} {"current_steps": 564, "total_steps": 9134, "loss": 0.7937, "learning_rate": 4.953109631691529e-05, "epoch": 0.06174224800897671, "percentage": 6.17, "elapsed_time": "10:25:55", "remaining_time": "6 days, 14:30:52", "throughput": 2716.01, "total_tokens": 102000192} {"current_steps": 565, "total_steps": 9134, "loss": 0.6746, "learning_rate": 4.952943730443069e-05, "epoch": 0.06185172007991461, "percentage": 6.19, "elapsed_time": "10:27:02", "remaining_time": "6 days, 14:29:53", "throughput": 2715.68, "total_tokens": 102169984} {"current_steps": 566, "total_steps": 9134, "loss": 0.6961, "learning_rate": 4.952777539016056e-05, "epoch": 0.061961192150852516, "percentage": 6.2, "elapsed_time": "10:28:04", "remaining_time": "6 days, 14:27:42", "throughput": 2715.47, "total_tokens": 102331712} {"current_steps": 567, "total_steps": 9134, "loss": 0.5973, "learning_rate": 4.9526110574301485e-05, "epoch": 0.06207066422179042, "percentage": 6.21, "elapsed_time": "10:29:12", "remaining_time": "6 days, 14:26:57", "throughput": 2715.64, "total_tokens": 102522560} {"current_steps": 568, "total_steps": 9134, "loss": 0.7482, "learning_rate": 4.9524442857050424e-05, "epoch": 0.06218013629272832, "percentage": 6.22, "elapsed_time": "10:30:21", "remaining_time": "6 days, 14:26:30", "throughput": 2715.57, "total_tokens": 102707584} {"current_steps": 569, "total_steps": 9134, "loss": 0.9118, "learning_rate": 4.952277223860465e-05, "epoch": 0.06228960836366622, "percentage": 6.23, "elapsed_time": "10:31:31", "remaining_time": "6 days, 14:26:05", "throughput": 2716.31, "total_tokens": 102924192} {"current_steps": 570, "total_steps": 9134, "loss": 0.8055, "learning_rate": 4.9521098719161795e-05, "epoch": 0.06239908043460412, "percentage": 6.24, "elapsed_time": "10:32:37", "remaining_time": "6 days, 14:24:55", "throughput": 2716.72, "total_tokens": 103119968} {"current_steps": 571, "total_steps": 9134, "loss": 0.7654, "learning_rate": 4.9519422298919844e-05, "epoch": 0.06250855250554202, "percentage": 6.25, "elapsed_time": "10:33:45", "remaining_time": "6 days, 14:24:08", "throughput": 2716.62, "total_tokens": 103300736} {"current_steps": 572, "total_steps": 9134, "loss": 0.7273, "learning_rate": 4.9517742978077106e-05, "epoch": 0.06261802457647993, "percentage": 6.26, "elapsed_time": "10:34:53", "remaining_time": "6 days, 14:23:17", "throughput": 2716.53, "total_tokens": 103480832} {"current_steps": 573, "total_steps": 9134, "loss": 0.7502, "learning_rate": 4.951606075683224e-05, "epoch": 0.06272749664741782, "percentage": 6.27, "elapsed_time": "10:36:02", "remaining_time": "6 days, 14:22:52", "throughput": 2716.85, "total_tokens": 103681536} {"current_steps": 574, "total_steps": 9134, "loss": 0.8977, "learning_rate": 4.9514375635384255e-05, "epoch": 0.06283696871835573, "percentage": 6.28, "elapsed_time": "10:37:09", "remaining_time": "6 days, 14:21:59", "throughput": 2716.73, "total_tokens": 103860512} {"current_steps": 575, "total_steps": 9134, "loss": 0.6015, "learning_rate": 4.9512687613932505e-05, "epoch": 0.06294644078929364, "percentage": 6.3, "elapsed_time": "10:38:13", "remaining_time": "6 days, 14:20:07", "throughput": 2716.99, "total_tokens": 104043072} {"current_steps": 576, "total_steps": 9134, "loss": 0.6893, "learning_rate": 4.951099669267666e-05, "epoch": 0.06305591286023153, "percentage": 6.31, "elapsed_time": "10:39:16", "remaining_time": "6 days, 14:18:00", "throughput": 2716.4, "total_tokens": 104190464} {"current_steps": 577, "total_steps": 9134, "loss": 0.8904, "learning_rate": 4.950930287181677e-05, "epoch": 0.06316538493116944, "percentage": 6.32, "elapsed_time": "10:40:22", "remaining_time": "6 days, 14:16:51", "throughput": 2716.94, "total_tokens": 104391616} {"current_steps": 578, "total_steps": 9134, "loss": 0.6306, "learning_rate": 4.95076061515532e-05, "epoch": 0.06327485700210733, "percentage": 6.33, "elapsed_time": "10:41:28", "remaining_time": "6 days, 14:15:38", "throughput": 2717.02, "total_tokens": 104574400} {"current_steps": 579, "total_steps": 9134, "loss": 0.679, "learning_rate": 4.9505906532086676e-05, "epoch": 0.06338432907304524, "percentage": 6.34, "elapsed_time": "10:42:34", "remaining_time": "6 days, 14:14:18", "throughput": 2716.69, "total_tokens": 104740384} {"current_steps": 580, "total_steps": 9134, "loss": 0.7566, "learning_rate": 4.950420401361825e-05, "epoch": 0.06349380114398315, "percentage": 6.35, "elapsed_time": "10:43:37", "remaining_time": "6 days, 14:12:18", "throughput": 2716.1, "total_tokens": 104888448} {"current_steps": 581, "total_steps": 9134, "loss": 0.7865, "learning_rate": 4.950249859634934e-05, "epoch": 0.06360327321492104, "percentage": 6.36, "elapsed_time": "10:44:43", "remaining_time": "6 days, 14:11:06", "throughput": 2716.14, "total_tokens": 105069888} {"current_steps": 582, "total_steps": 9134, "loss": 0.7362, "learning_rate": 4.9500790280481684e-05, "epoch": 0.06371274528585895, "percentage": 6.37, "elapsed_time": "10:45:48", "remaining_time": "6 days, 14:09:39", "throughput": 2716.57, "total_tokens": 105263424} {"current_steps": 583, "total_steps": 9134, "loss": 0.8289, "learning_rate": 4.9499079066217374e-05, "epoch": 0.06382221735679684, "percentage": 6.38, "elapsed_time": "10:46:53", "remaining_time": "6 days, 14:08:11", "throughput": 2716.38, "total_tokens": 105433216} {"current_steps": 584, "total_steps": 9134, "loss": 0.9543, "learning_rate": 4.9497364953758854e-05, "epoch": 0.06393168942773475, "percentage": 6.39, "elapsed_time": "10:48:03", "remaining_time": "6 days, 14:07:50", "throughput": 2717.16, "total_tokens": 105652736} {"current_steps": 585, "total_steps": 9134, "loss": 0.802, "learning_rate": 4.9495647943308877e-05, "epoch": 0.06404116149867266, "percentage": 6.4, "elapsed_time": "10:49:11", "remaining_time": "6 days, 14:07:02", "throughput": 2717.05, "total_tokens": 105832608} {"current_steps": 586, "total_steps": 9134, "loss": 0.6763, "learning_rate": 4.949392803507058e-05, "epoch": 0.06415063356961055, "percentage": 6.42, "elapsed_time": "10:50:19", "remaining_time": "6 days, 14:06:13", "throughput": 2717.36, "total_tokens": 106029056} {"current_steps": 587, "total_steps": 9134, "loss": 0.6194, "learning_rate": 4.949220522924742e-05, "epoch": 0.06426010564054846, "percentage": 6.43, "elapsed_time": "10:51:28", "remaining_time": "6 days, 14:05:43", "throughput": 2716.69, "total_tokens": 106190560} {"current_steps": 588, "total_steps": 9134, "loss": 0.7022, "learning_rate": 4.949047952604321e-05, "epoch": 0.06436957771148635, "percentage": 6.44, "elapsed_time": "10:52:34", "remaining_time": "6 days, 14:04:31", "throughput": 2716.59, "total_tokens": 106366624} {"current_steps": 589, "total_steps": 9134, "loss": 0.9235, "learning_rate": 4.9488750925662083e-05, "epoch": 0.06447904978242426, "percentage": 6.45, "elapsed_time": "10:53:40", "remaining_time": "6 days, 14:03:20", "throughput": 2716.79, "total_tokens": 106554560} {"current_steps": 590, "total_steps": 9134, "loss": 0.7205, "learning_rate": 4.9487019428308547e-05, "epoch": 0.06458852185336215, "percentage": 6.46, "elapsed_time": "10:54:50", "remaining_time": "6 days, 14:02:57", "throughput": 2717.26, "total_tokens": 106761984} {"current_steps": 591, "total_steps": 9134, "loss": 0.8584, "learning_rate": 4.948528503418741e-05, "epoch": 0.06469799392430006, "percentage": 6.47, "elapsed_time": "10:55:54", "remaining_time": "6 days, 14:01:17", "throughput": 2717.33, "total_tokens": 106939392} {"current_steps": 592, "total_steps": 9134, "loss": 0.7038, "learning_rate": 4.9483547743503874e-05, "epoch": 0.06480746599523797, "percentage": 6.48, "elapsed_time": "10:57:00", "remaining_time": "6 days, 14:00:06", "throughput": 2717.31, "total_tokens": 107119040} {"current_steps": 593, "total_steps": 9134, "loss": 0.7352, "learning_rate": 4.9481807556463435e-05, "epoch": 0.06491693806617586, "percentage": 6.49, "elapsed_time": "10:58:03", "remaining_time": "6 days, 13:57:57", "throughput": 2716.81, "total_tokens": 107268224} {"current_steps": 594, "total_steps": 9134, "loss": 0.6351, "learning_rate": 4.948006447327197e-05, "epoch": 0.06502641013711377, "percentage": 6.5, "elapsed_time": "10:59:12", "remaining_time": "6 days, 13:57:35", "throughput": 2717.43, "total_tokens": 107481920} {"current_steps": 595, "total_steps": 9134, "loss": 0.667, "learning_rate": 4.947831849413567e-05, "epoch": 0.06513588220805167, "percentage": 6.51, "elapsed_time": "11:00:21", "remaining_time": "6 days, 13:56:53", "throughput": 2717.98, "total_tokens": 107689344} {"current_steps": 596, "total_steps": 9134, "loss": 0.8247, "learning_rate": 4.947656961926109e-05, "epoch": 0.06524535427898957, "percentage": 6.53, "elapsed_time": "11:01:27", "remaining_time": "6 days, 13:55:45", "throughput": 2718.24, "total_tokens": 107880640} {"current_steps": 597, "total_steps": 9134, "loss": 0.7345, "learning_rate": 4.947481784885511e-05, "epoch": 0.06535482634992748, "percentage": 6.54, "elapsed_time": "11:02:33", "remaining_time": "6 days, 13:54:23", "throughput": 2718.19, "total_tokens": 108056480} {"current_steps": 598, "total_steps": 9134, "loss": 0.7812, "learning_rate": 4.947306318312497e-05, "epoch": 0.06546429842086537, "percentage": 6.55, "elapsed_time": "11:03:38", "remaining_time": "6 days, 13:53:03", "throughput": 2718.11, "total_tokens": 108231648} {"current_steps": 599, "total_steps": 9134, "loss": 0.9278, "learning_rate": 4.947130562227824e-05, "epoch": 0.06557377049180328, "percentage": 6.56, "elapsed_time": "11:04:48", "remaining_time": "6 days, 13:52:36", "throughput": 2718.14, "total_tokens": 108421824} {"current_steps": 600, "total_steps": 9134, "loss": 0.8514, "learning_rate": 4.9469545166522836e-05, "epoch": 0.06568324256274118, "percentage": 6.57, "elapsed_time": "11:05:50", "remaining_time": "6 days, 13:50:29", "throughput": 2718.09, "total_tokens": 108588928} {"current_steps": 601, "total_steps": 9134, "loss": 0.8285, "learning_rate": 4.946778181606702e-05, "epoch": 0.06579271463367908, "percentage": 6.58, "elapsed_time": "11:06:59", "remaining_time": "6 days, 13:50:00", "throughput": 2717.78, "total_tokens": 108764768} {"current_steps": 602, "total_steps": 9134, "loss": 0.6031, "learning_rate": 4.946601557111938e-05, "epoch": 0.06590218670461699, "percentage": 6.59, "elapsed_time": "11:08:07", "remaining_time": "6 days, 13:49:04", "throughput": 2718.15, "total_tokens": 108962560} {"current_steps": 603, "total_steps": 9134, "loss": 0.744, "learning_rate": 4.9464246431888885e-05, "epoch": 0.06601165877555489, "percentage": 6.6, "elapsed_time": "11:09:15", "remaining_time": "6 days, 13:48:22", "throughput": 2718.37, "total_tokens": 109157440} {"current_steps": 604, "total_steps": 9134, "loss": 0.829, "learning_rate": 4.946247439858479e-05, "epoch": 0.06612113084649279, "percentage": 6.61, "elapsed_time": "11:10:21", "remaining_time": "6 days, 13:47:05", "throughput": 2718.7, "total_tokens": 109349408} {"current_steps": 605, "total_steps": 9134, "loss": 0.5337, "learning_rate": 4.9460699471416745e-05, "epoch": 0.06623060291743069, "percentage": 6.62, "elapsed_time": "11:11:29", "remaining_time": "6 days, 13:46:17", "throughput": 2719.02, "total_tokens": 109546976} {"current_steps": 606, "total_steps": 9134, "loss": 0.9072, "learning_rate": 4.945892165059472e-05, "epoch": 0.0663400749883686, "percentage": 6.63, "elapsed_time": "11:12:36", "remaining_time": "6 days, 13:45:20", "throughput": 2718.6, "total_tokens": 109713184} {"current_steps": 607, "total_steps": 9134, "loss": 0.8036, "learning_rate": 4.9457140936329004e-05, "epoch": 0.06644954705930649, "percentage": 6.65, "elapsed_time": "11:13:43", "remaining_time": "6 days, 13:44:13", "throughput": 2718.77, "total_tokens": 109901120} {"current_steps": 608, "total_steps": 9134, "loss": 0.7907, "learning_rate": 4.9455357328830275e-05, "epoch": 0.0665590191302444, "percentage": 6.66, "elapsed_time": "11:14:51", "remaining_time": "6 days, 13:43:34", "throughput": 2718.66, "total_tokens": 110082784} {"current_steps": 609, "total_steps": 9134, "loss": 0.584, "learning_rate": 4.9453570828309536e-05, "epoch": 0.0666684912011823, "percentage": 6.67, "elapsed_time": "11:15:53", "remaining_time": "6 days, 13:41:18", "throughput": 2718.43, "total_tokens": 110241152} {"current_steps": 610, "total_steps": 9134, "loss": 0.6707, "learning_rate": 4.9451781434978104e-05, "epoch": 0.0667779632721202, "percentage": 6.68, "elapsed_time": "11:16:58", "remaining_time": "6 days, 13:39:56", "throughput": 2718.2, "total_tokens": 110409824} {"current_steps": 611, "total_steps": 9134, "loss": 0.6707, "learning_rate": 4.944998914904768e-05, "epoch": 0.0668874353430581, "percentage": 6.69, "elapsed_time": "11:18:07", "remaining_time": "6 days, 13:39:21", "throughput": 2717.81, "total_tokens": 110580960} {"current_steps": 612, "total_steps": 9134, "loss": 0.6299, "learning_rate": 4.944819397073027e-05, "epoch": 0.066996907413996, "percentage": 6.7, "elapsed_time": "11:19:16", "remaining_time": "6 days, 13:38:44", "throughput": 2718.08, "total_tokens": 110778752} {"current_steps": 613, "total_steps": 9134, "loss": 0.7124, "learning_rate": 4.944639590023826e-05, "epoch": 0.0671063794849339, "percentage": 6.71, "elapsed_time": "11:20:15", "remaining_time": "6 days, 13:35:54", "throughput": 2717.56, "total_tokens": 110918528} {"current_steps": 614, "total_steps": 9134, "loss": 0.6447, "learning_rate": 4.9444594937784336e-05, "epoch": 0.06721585155587181, "percentage": 6.72, "elapsed_time": "11:21:24", "remaining_time": "6 days, 13:35:20", "throughput": 2718.17, "total_tokens": 111130432} {"current_steps": 615, "total_steps": 9134, "loss": 0.6201, "learning_rate": 4.9442791083581575e-05, "epoch": 0.06732532362680971, "percentage": 6.73, "elapsed_time": "11:22:25", "remaining_time": "6 days, 13:32:55", "throughput": 2717.91, "total_tokens": 111285664} {"current_steps": 616, "total_steps": 9134, "loss": 0.8074, "learning_rate": 4.944098433784335e-05, "epoch": 0.06743479569774762, "percentage": 6.74, "elapsed_time": "11:23:31", "remaining_time": "6 days, 13:31:50", "throughput": 2718.01, "total_tokens": 111470688} {"current_steps": 617, "total_steps": 9134, "loss": 0.7161, "learning_rate": 4.94391747007834e-05, "epoch": 0.06754426776868551, "percentage": 6.75, "elapsed_time": "11:24:41", "remaining_time": "6 days, 13:31:22", "throughput": 2718.54, "total_tokens": 111681472} {"current_steps": 618, "total_steps": 9134, "loss": 0.7683, "learning_rate": 4.9437362172615806e-05, "epoch": 0.06765373983962342, "percentage": 6.77, "elapsed_time": "11:25:46", "remaining_time": "6 days, 13:29:49", "throughput": 2718.29, "total_tokens": 111847008} {"current_steps": 619, "total_steps": 9134, "loss": 0.7126, "learning_rate": 4.9435546753554985e-05, "epoch": 0.06776321191056132, "percentage": 6.78, "elapsed_time": "11:26:51", "remaining_time": "6 days, 13:28:26", "throughput": 2718.25, "total_tokens": 112023072} {"current_steps": 620, "total_steps": 9134, "loss": 0.7069, "learning_rate": 4.943372844381568e-05, "epoch": 0.06787268398149922, "percentage": 6.79, "elapsed_time": "11:27:56", "remaining_time": "6 days, 13:26:54", "throughput": 2717.83, "total_tokens": 112181664} {"current_steps": 621, "total_steps": 9134, "loss": 0.6956, "learning_rate": 4.943190724361303e-05, "epoch": 0.06798215605243713, "percentage": 6.8, "elapsed_time": "11:29:05", "remaining_time": "6 days, 13:26:28", "throughput": 2718.47, "total_tokens": 112396928} {"current_steps": 622, "total_steps": 9134, "loss": 0.7277, "learning_rate": 4.9430083153162456e-05, "epoch": 0.06809162812337502, "percentage": 6.81, "elapsed_time": "11:30:11", "remaining_time": "6 days, 13:25:08", "throughput": 2719.01, "total_tokens": 112597632} {"current_steps": 623, "total_steps": 9134, "loss": 0.7074, "learning_rate": 4.942825617267973e-05, "epoch": 0.06820110019431293, "percentage": 6.82, "elapsed_time": "11:31:16", "remaining_time": "6 days, 13:23:41", "throughput": 2718.98, "total_tokens": 112773248} {"current_steps": 624, "total_steps": 9134, "loss": 0.6544, "learning_rate": 4.9426426302381014e-05, "epoch": 0.06831057226525082, "percentage": 6.83, "elapsed_time": "11:32:22", "remaining_time": "6 days, 13:22:25", "throughput": 2718.66, "total_tokens": 112939456} {"current_steps": 625, "total_steps": 9134, "loss": 0.7088, "learning_rate": 4.9424593542482754e-05, "epoch": 0.06842004433618873, "percentage": 6.84, "elapsed_time": "11:33:30", "remaining_time": "6 days, 13:21:37", "throughput": 2718.65, "total_tokens": 113123584} {"current_steps": 626, "total_steps": 9134, "loss": 0.7974, "learning_rate": 4.942275789320178e-05, "epoch": 0.06852951640712664, "percentage": 6.85, "elapsed_time": "11:34:38", "remaining_time": "6 days, 13:20:59", "throughput": 2719.12, "total_tokens": 113329888} {"current_steps": 627, "total_steps": 9134, "loss": 0.7588, "learning_rate": 4.9420919354755225e-05, "epoch": 0.06863898847806453, "percentage": 6.86, "elapsed_time": "11:35:40", "remaining_time": "6 days, 13:18:47", "throughput": 2719.04, "total_tokens": 113494304} {"current_steps": 628, "total_steps": 9134, "loss": 0.724, "learning_rate": 4.9419077927360605e-05, "epoch": 0.06874846054900244, "percentage": 6.88, "elapsed_time": "11:36:49", "remaining_time": "6 days, 13:18:13", "throughput": 2719.42, "total_tokens": 113697696} {"current_steps": 629, "total_steps": 9134, "loss": 0.7036, "learning_rate": 4.9417233611235735e-05, "epoch": 0.06885793261994033, "percentage": 6.89, "elapsed_time": "11:37:55", "remaining_time": "6 days, 13:16:52", "throughput": 2719.48, "total_tokens": 113878464} {"current_steps": 630, "total_steps": 9134, "loss": 0.8195, "learning_rate": 4.9415386406598816e-05, "epoch": 0.06896740469087824, "percentage": 6.9, "elapsed_time": "11:39:03", "remaining_time": "6 days, 13:16:07", "throughput": 2719.84, "total_tokens": 114079168} {"current_steps": 631, "total_steps": 9134, "loss": 0.7532, "learning_rate": 4.941353631366836e-05, "epoch": 0.06907687676181615, "percentage": 6.91, "elapsed_time": "11:40:08", "remaining_time": "6 days, 13:14:41", "throughput": 2719.35, "total_tokens": 114235744} {"current_steps": 632, "total_steps": 9134, "loss": 0.6755, "learning_rate": 4.9411683332663225e-05, "epoch": 0.06918634883275404, "percentage": 6.92, "elapsed_time": "11:41:14", "remaining_time": "6 days, 13:13:30", "throughput": 2719.33, "total_tokens": 114414944} {"current_steps": 633, "total_steps": 9134, "loss": 0.9562, "learning_rate": 4.940982746380262e-05, "epoch": 0.06929582090369195, "percentage": 6.93, "elapsed_time": "11:42:22", "remaining_time": "6 days, 13:12:46", "throughput": 2719.29, "total_tokens": 114598624} {"current_steps": 634, "total_steps": 9134, "loss": 0.8508, "learning_rate": 4.9407968707306085e-05, "epoch": 0.06940529297462984, "percentage": 6.94, "elapsed_time": "11:43:31", "remaining_time": "6 days, 13:12:13", "throughput": 2719.96, "total_tokens": 114815008} {"current_steps": 635, "total_steps": 9134, "loss": 0.6447, "learning_rate": 4.940610706339351e-05, "epoch": 0.06951476504556775, "percentage": 6.95, "elapsed_time": "11:44:35", "remaining_time": "6 days, 13:10:23", "throughput": 2719.23, "total_tokens": 114956352} {"current_steps": 636, "total_steps": 9134, "loss": 0.9054, "learning_rate": 4.940424253228514e-05, "epoch": 0.06962423711650566, "percentage": 6.96, "elapsed_time": "11:45:41", "remaining_time": "6 days, 13:09:16", "throughput": 2719.0, "total_tokens": 115127488} {"current_steps": 637, "total_steps": 9134, "loss": 0.816, "learning_rate": 4.940237511420152e-05, "epoch": 0.06973370918744355, "percentage": 6.97, "elapsed_time": "11:46:49", "remaining_time": "6 days, 13:08:22", "throughput": 2718.91, "total_tokens": 115307136} {"current_steps": 638, "total_steps": 9134, "loss": 0.693, "learning_rate": 4.9400504809363576e-05, "epoch": 0.06984318125838146, "percentage": 6.98, "elapsed_time": "11:47:58", "remaining_time": "6 days, 13:07:46", "throughput": 2719.28, "total_tokens": 115510080} {"current_steps": 639, "total_steps": 9134, "loss": 0.825, "learning_rate": 4.9398631617992565e-05, "epoch": 0.06995265332931935, "percentage": 7.0, "elapsed_time": "11:48:59", "remaining_time": "6 days, 13:05:30", "throughput": 2718.97, "total_tokens": 115663744} {"current_steps": 640, "total_steps": 9134, "loss": 0.9089, "learning_rate": 4.939675554031007e-05, "epoch": 0.07006212540025726, "percentage": 7.01, "elapsed_time": "11:50:08", "remaining_time": "6 days, 13:04:59", "throughput": 2719.47, "total_tokens": 115873408} {"current_steps": 641, "total_steps": 9134, "loss": 0.6972, "learning_rate": 4.939487657653803e-05, "epoch": 0.07017159747119515, "percentage": 7.02, "elapsed_time": "11:51:10", "remaining_time": "6 days, 13:02:44", "throughput": 2718.69, "total_tokens": 116007136} {"current_steps": 642, "total_steps": 9134, "loss": 0.7176, "learning_rate": 4.9392994726898735e-05, "epoch": 0.07028106954213306, "percentage": 7.03, "elapsed_time": "11:52:14", "remaining_time": "6 days, 13:01:11", "throughput": 2718.5, "total_tokens": 116174912} {"current_steps": 643, "total_steps": 9134, "loss": 0.8517, "learning_rate": 4.939110999161479e-05, "epoch": 0.07039054161307097, "percentage": 7.04, "elapsed_time": "11:53:22", "remaining_time": "6 days, 13:00:16", "throughput": 2718.52, "total_tokens": 116358816} {"current_steps": 644, "total_steps": 9134, "loss": 0.615, "learning_rate": 4.938922237090916e-05, "epoch": 0.07050001368400886, "percentage": 7.05, "elapsed_time": "11:54:27", "remaining_time": "6 days, 12:58:57", "throughput": 2718.38, "total_tokens": 116531072} {"current_steps": 645, "total_steps": 9134, "loss": 0.6759, "learning_rate": 4.938733186500515e-05, "epoch": 0.07060948575494677, "percentage": 7.06, "elapsed_time": "11:55:33", "remaining_time": "6 days, 12:57:32", "throughput": 2718.2, "total_tokens": 116700864} {"current_steps": 646, "total_steps": 9134, "loss": 0.7622, "learning_rate": 4.93854384741264e-05, "epoch": 0.07071895782588467, "percentage": 7.07, "elapsed_time": "11:56:41", "remaining_time": "6 days, 12:56:50", "throughput": 2718.8, "total_tokens": 116912320} {"current_steps": 647, "total_steps": 9134, "loss": 0.6514, "learning_rate": 4.938354219849689e-05, "epoch": 0.07082842989682257, "percentage": 7.08, "elapsed_time": "11:57:47", "remaining_time": "6 days, 12:55:33", "throughput": 2718.61, "total_tokens": 117083232} {"current_steps": 648, "total_steps": 9134, "loss": 0.5842, "learning_rate": 4.9381643038340966e-05, "epoch": 0.07093790196776048, "percentage": 7.09, "elapsed_time": "11:58:54", "remaining_time": "6 days, 12:54:33", "throughput": 2718.25, "total_tokens": 117249664} {"current_steps": 649, "total_steps": 9134, "loss": 0.849, "learning_rate": 4.937974099388326e-05, "epoch": 0.07104737403869837, "percentage": 7.11, "elapsed_time": "11:59:59", "remaining_time": "6 days, 12:53:13", "throughput": 2718.52, "total_tokens": 117439616} {"current_steps": 650, "total_steps": 9134, "loss": 0.6723, "learning_rate": 4.9377836065348814e-05, "epoch": 0.07115684610963628, "percentage": 7.12, "elapsed_time": "12:01:05", "remaining_time": "6 days, 12:51:58", "throughput": 2718.42, "total_tokens": 117614560} {"current_steps": 651, "total_steps": 9134, "loss": 1.2026, "learning_rate": 4.937592825296297e-05, "epoch": 0.07126631818057418, "percentage": 7.13, "elapsed_time": "12:02:11", "remaining_time": "6 days, 12:50:39", "throughput": 2718.34, "total_tokens": 117789280} {"current_steps": 652, "total_steps": 9134, "loss": 0.7484, "learning_rate": 4.93740175569514e-05, "epoch": 0.07137579025151208, "percentage": 7.14, "elapsed_time": "12:03:17", "remaining_time": "6 days, 12:49:25", "throughput": 2718.05, "total_tokens": 117956384} {"current_steps": 653, "total_steps": 9134, "loss": 0.8211, "learning_rate": 4.9372103977540154e-05, "epoch": 0.07148526232244999, "percentage": 7.15, "elapsed_time": "12:04:24", "remaining_time": "6 days, 12:48:21", "throughput": 2718.18, "total_tokens": 118143424} {"current_steps": 654, "total_steps": 9134, "loss": 0.684, "learning_rate": 4.937018751495559e-05, "epoch": 0.07159473439338788, "percentage": 7.16, "elapsed_time": "12:05:32", "remaining_time": "6 days, 12:47:37", "throughput": 2718.43, "total_tokens": 118340096} {"current_steps": 655, "total_steps": 9134, "loss": 0.7986, "learning_rate": 4.9368268169424444e-05, "epoch": 0.07170420646432579, "percentage": 7.17, "elapsed_time": "12:06:38", "remaining_time": "6 days, 12:46:27", "throughput": 2718.68, "total_tokens": 118531168} {"current_steps": 656, "total_steps": 9134, "loss": 0.7139, "learning_rate": 4.936634594117375e-05, "epoch": 0.07181367853526369, "percentage": 7.18, "elapsed_time": "12:07:40", "remaining_time": "6 days, 12:44:15", "throughput": 2718.46, "total_tokens": 118688640} {"current_steps": 657, "total_steps": 9134, "loss": 0.8582, "learning_rate": 4.936442083043091e-05, "epoch": 0.0719231506062016, "percentage": 7.19, "elapsed_time": "12:08:49", "remaining_time": "6 days, 12:43:39", "throughput": 2719.05, "total_tokens": 118901888} {"current_steps": 658, "total_steps": 9134, "loss": 0.6959, "learning_rate": 4.936249283742367e-05, "epoch": 0.07203262267713949, "percentage": 7.2, "elapsed_time": "12:09:52", "remaining_time": "6 days, 12:41:55", "throughput": 2718.92, "total_tokens": 119069216} {"current_steps": 659, "total_steps": 9134, "loss": 0.6639, "learning_rate": 4.93605619623801e-05, "epoch": 0.0721420947480774, "percentage": 7.21, "elapsed_time": "12:10:56", "remaining_time": "6 days, 12:40:11", "throughput": 2718.86, "total_tokens": 119239456} {"current_steps": 660, "total_steps": 9134, "loss": 0.564, "learning_rate": 4.935862820552861e-05, "epoch": 0.0722515668190153, "percentage": 7.23, "elapsed_time": "12:12:01", "remaining_time": "6 days, 12:38:43", "throughput": 2718.63, "total_tokens": 119405664} {"current_steps": 661, "total_steps": 9134, "loss": 0.7854, "learning_rate": 4.935669156709798e-05, "epoch": 0.0723610388899532, "percentage": 7.24, "elapsed_time": "12:13:03", "remaining_time": "6 days, 12:36:43", "throughput": 2718.53, "total_tokens": 119570976} {"current_steps": 662, "total_steps": 9134, "loss": 0.7308, "learning_rate": 4.93547520473173e-05, "epoch": 0.0724705109608911, "percentage": 7.25, "elapsed_time": "12:14:07", "remaining_time": "6 days, 12:34:59", "throughput": 2718.28, "total_tokens": 119732928} {"current_steps": 663, "total_steps": 9134, "loss": 0.7933, "learning_rate": 4.9352809646416e-05, "epoch": 0.072579983031829, "percentage": 7.26, "elapsed_time": "12:15:16", "remaining_time": "6 days, 12:34:30", "throughput": 2718.62, "total_tokens": 119936768} {"current_steps": 664, "total_steps": 9134, "loss": 0.9965, "learning_rate": 4.935086436462388e-05, "epoch": 0.0726894551027669, "percentage": 7.27, "elapsed_time": "12:16:23", "remaining_time": "6 days, 12:33:20", "throughput": 2719.11, "total_tokens": 120138816} {"current_steps": 665, "total_steps": 9134, "loss": 0.8763, "learning_rate": 4.934891620217106e-05, "epoch": 0.07279892717370481, "percentage": 7.28, "elapsed_time": "12:17:29", "remaining_time": "6 days, 12:32:07", "throughput": 2719.32, "total_tokens": 120327648} {"current_steps": 666, "total_steps": 9134, "loss": 0.7658, "learning_rate": 4.934696515928799e-05, "epoch": 0.07290839924464271, "percentage": 7.29, "elapsed_time": "12:18:36", "remaining_time": "6 days, 12:31:17", "throughput": 2719.79, "total_tokens": 120532832} {"current_steps": 667, "total_steps": 9134, "loss": 0.9149, "learning_rate": 4.93450112362055e-05, "epoch": 0.07301787131558062, "percentage": 7.3, "elapsed_time": "12:19:40", "remaining_time": "6 days, 12:29:36", "throughput": 2719.64, "total_tokens": 120699936} {"current_steps": 668, "total_steps": 9134, "loss": 0.6005, "learning_rate": 4.934305443315471e-05, "epoch": 0.07312734338651851, "percentage": 7.31, "elapsed_time": "12:20:47", "remaining_time": "6 days, 12:28:26", "throughput": 2719.15, "total_tokens": 120858304} {"current_steps": 669, "total_steps": 9134, "loss": 0.7429, "learning_rate": 4.9341094750367126e-05, "epoch": 0.07323681545745642, "percentage": 7.32, "elapsed_time": "12:21:52", "remaining_time": "6 days, 12:27:08", "throughput": 2719.07, "total_tokens": 121033248} {"current_steps": 670, "total_steps": 9134, "loss": 0.7919, "learning_rate": 4.9339132188074556e-05, "epoch": 0.07334628752839432, "percentage": 7.34, "elapsed_time": "12:22:59", "remaining_time": "6 days, 12:26:03", "throughput": 2718.77, "total_tokens": 121201024} {"current_steps": 671, "total_steps": 9134, "loss": 0.8113, "learning_rate": 4.933716674650918e-05, "epoch": 0.07345575959933222, "percentage": 7.35, "elapsed_time": "12:24:04", "remaining_time": "6 days, 12:24:42", "throughput": 2718.35, "total_tokens": 121359840} {"current_steps": 672, "total_steps": 9134, "loss": 0.6825, "learning_rate": 4.9335198425903497e-05, "epoch": 0.07356523167027013, "percentage": 7.36, "elapsed_time": "12:25:09", "remaining_time": "6 days, 12:23:18", "throughput": 2718.57, "total_tokens": 121547104} {"current_steps": 673, "total_steps": 9134, "loss": 0.5768, "learning_rate": 4.933322722649037e-05, "epoch": 0.07367470374120802, "percentage": 7.37, "elapsed_time": "12:26:15", "remaining_time": "6 days, 12:22:04", "throughput": 2718.96, "total_tokens": 121743552} {"current_steps": 674, "total_steps": 9134, "loss": 0.6768, "learning_rate": 4.933125314850297e-05, "epoch": 0.07378417581214593, "percentage": 7.38, "elapsed_time": "12:27:23", "remaining_time": "6 days, 12:21:11", "throughput": 2719.09, "total_tokens": 121933280} {"current_steps": 675, "total_steps": 9134, "loss": 0.7264, "learning_rate": 4.9329276192174845e-05, "epoch": 0.07389364788308384, "percentage": 7.39, "elapsed_time": "12:28:29", "remaining_time": "6 days, 12:19:54", "throughput": 2718.89, "total_tokens": 122102848} {"current_steps": 676, "total_steps": 9134, "loss": 0.5635, "learning_rate": 4.932729635773985e-05, "epoch": 0.07400311995402173, "percentage": 7.4, "elapsed_time": "12:29:37", "remaining_time": "6 days, 12:19:05", "throughput": 2719.36, "total_tokens": 122308704} {"current_steps": 677, "total_steps": 9134, "loss": 0.5059, "learning_rate": 4.93253136454322e-05, "epoch": 0.07411259202495964, "percentage": 7.41, "elapsed_time": "12:30:44", "remaining_time": "6 days, 12:18:10", "throughput": 2719.36, "total_tokens": 122492384} {"current_steps": 678, "total_steps": 9134, "loss": 0.7137, "learning_rate": 4.9323328055486464e-05, "epoch": 0.07422206409589753, "percentage": 7.42, "elapsed_time": "12:31:52", "remaining_time": "6 days, 12:17:21", "throughput": 2719.64, "total_tokens": 122689728} {"current_steps": 679, "total_steps": 9134, "loss": 0.7443, "learning_rate": 4.93213395881375e-05, "epoch": 0.07433153616683544, "percentage": 7.43, "elapsed_time": "12:32:59", "remaining_time": "6 days, 12:16:18", "throughput": 2719.44, "total_tokens": 122862432} {"current_steps": 680, "total_steps": 9134, "loss": 0.8724, "learning_rate": 4.9319348243620566e-05, "epoch": 0.07444100823777333, "percentage": 7.44, "elapsed_time": "12:34:08", "remaining_time": "6 days, 12:15:42", "throughput": 2720.19, "total_tokens": 123083968} {"current_steps": 681, "total_steps": 9134, "loss": 0.7734, "learning_rate": 4.931735402217122e-05, "epoch": 0.07455048030871124, "percentage": 7.46, "elapsed_time": "12:35:13", "remaining_time": "6 days, 12:14:24", "throughput": 2720.41, "total_tokens": 123272128} {"current_steps": 682, "total_steps": 9134, "loss": 0.7111, "learning_rate": 4.931535692402538e-05, "epoch": 0.07465995237964915, "percentage": 7.47, "elapsed_time": "12:36:21", "remaining_time": "6 days, 12:13:34", "throughput": 2720.66, "total_tokens": 123468352} {"current_steps": 683, "total_steps": 9134, "loss": 0.6262, "learning_rate": 4.93133569494193e-05, "epoch": 0.07476942445058704, "percentage": 7.48, "elapsed_time": "12:37:31", "remaining_time": "6 days, 12:13:03", "throughput": 2720.8, "total_tokens": 123663680} {"current_steps": 684, "total_steps": 9134, "loss": 0.7148, "learning_rate": 4.931135409858958e-05, "epoch": 0.07487889652152495, "percentage": 7.49, "elapsed_time": "12:38:32", "remaining_time": "6 days, 12:10:48", "throughput": 2720.2, "total_tokens": 123802560} {"current_steps": 685, "total_steps": 9134, "loss": 0.7853, "learning_rate": 4.930934837177313e-05, "epoch": 0.07498836859246284, "percentage": 7.5, "elapsed_time": "12:39:41", "remaining_time": "6 days, 12:10:10", "throughput": 2719.94, "total_tokens": 123977728} {"current_steps": 686, "total_steps": 9134, "loss": 0.8035, "learning_rate": 4.9307339769207257e-05, "epoch": 0.07509784066340075, "percentage": 7.51, "elapsed_time": "12:40:48", "remaining_time": "6 days, 12:09:12", "throughput": 2719.88, "total_tokens": 124157824} {"current_steps": 687, "total_steps": 9134, "loss": 0.9152, "learning_rate": 4.930532829112955e-05, "epoch": 0.07520731273433866, "percentage": 7.52, "elapsed_time": "12:41:56", "remaining_time": "6 days, 12:08:22", "throughput": 2720.24, "total_tokens": 124358976} {"current_steps": 688, "total_steps": 9134, "loss": 0.7773, "learning_rate": 4.930331393777796e-05, "epoch": 0.07531678480527655, "percentage": 7.53, "elapsed_time": "12:43:05", "remaining_time": "6 days, 12:07:48", "throughput": 2720.74, "total_tokens": 124570208} {"current_steps": 689, "total_steps": 9134, "loss": 0.7395, "learning_rate": 4.93012967093908e-05, "epoch": 0.07542625687621446, "percentage": 7.54, "elapsed_time": "12:44:12", "remaining_time": "6 days, 12:06:52", "throughput": 2721.01, "total_tokens": 124765984} {"current_steps": 690, "total_steps": 9134, "loss": 0.7581, "learning_rate": 4.92992766062067e-05, "epoch": 0.07553572894715235, "percentage": 7.55, "elapsed_time": "12:45:18", "remaining_time": "6 days, 12:05:40", "throughput": 2720.97, "total_tokens": 124943616} {"current_steps": 691, "total_steps": 9134, "loss": 0.7719, "learning_rate": 4.9297253628464624e-05, "epoch": 0.07564520101809026, "percentage": 7.57, "elapsed_time": "12:46:25", "remaining_time": "6 days, 12:04:38", "throughput": 2720.96, "total_tokens": 125125280} {"current_steps": 692, "total_steps": 9134, "loss": 0.7598, "learning_rate": 4.9295227776403893e-05, "epoch": 0.07575467308902817, "percentage": 7.58, "elapsed_time": "12:47:29", "remaining_time": "6 days, 12:02:52", "throughput": 2720.41, "total_tokens": 125272448} {"current_steps": 693, "total_steps": 9134, "loss": 0.6961, "learning_rate": 4.929319905026416e-05, "epoch": 0.07586414515996606, "percentage": 7.59, "elapsed_time": "12:48:37", "remaining_time": "6 days, 12:02:10", "throughput": 2720.1, "total_tokens": 125444704} {"current_steps": 694, "total_steps": 9134, "loss": 0.681, "learning_rate": 4.929116745028542e-05, "epoch": 0.07597361723090397, "percentage": 7.6, "elapsed_time": "12:49:39", "remaining_time": "6 days, 12:00:03", "throughput": 2719.64, "total_tokens": 125590976} {"current_steps": 695, "total_steps": 9134, "loss": 0.7037, "learning_rate": 4.928913297670801e-05, "epoch": 0.07608308930184186, "percentage": 7.61, "elapsed_time": "12:50:42", "remaining_time": "6 days, 11:58:11", "throughput": 2719.1, "total_tokens": 125737024} {"current_steps": 696, "total_steps": 9134, "loss": 0.6665, "learning_rate": 4.92870956297726e-05, "epoch": 0.07619256137277977, "percentage": 7.62, "elapsed_time": "12:51:48", "remaining_time": "6 days, 11:57:07", "throughput": 2719.25, "total_tokens": 125925184} {"current_steps": 697, "total_steps": 9134, "loss": 0.6778, "learning_rate": 4.92850554097202e-05, "epoch": 0.07630203344371767, "percentage": 7.63, "elapsed_time": "12:52:57", "remaining_time": "6 days, 11:56:33", "throughput": 2719.17, "total_tokens": 126109536} {"current_steps": 698, "total_steps": 9134, "loss": 0.688, "learning_rate": 4.928301231679218e-05, "epoch": 0.07641150551465557, "percentage": 7.64, "elapsed_time": "12:54:06", "remaining_time": "6 days, 11:55:48", "throughput": 2719.18, "total_tokens": 126295904} {"current_steps": 699, "total_steps": 9134, "loss": 0.6903, "learning_rate": 4.9280966351230226e-05, "epoch": 0.07652097758559348, "percentage": 7.65, "elapsed_time": "12:55:13", "remaining_time": "6 days, 11:54:49", "throughput": 2719.37, "total_tokens": 126487424} {"current_steps": 700, "total_steps": 9134, "loss": 0.6162, "learning_rate": 4.927891751327636e-05, "epoch": 0.07663044965653137, "percentage": 7.66, "elapsed_time": "12:56:20", "remaining_time": "6 days, 11:53:50", "throughput": 2719.7, "total_tokens": 126685664} {"current_steps": 701, "total_steps": 9134, "loss": 0.8016, "learning_rate": 4.9276865803172965e-05, "epoch": 0.07673992172746928, "percentage": 7.67, "elapsed_time": "12:57:26", "remaining_time": "6 days, 11:52:30", "throughput": 2719.71, "total_tokens": 126863744} {"current_steps": 702, "total_steps": 9134, "loss": 0.858, "learning_rate": 4.9274811221162764e-05, "epoch": 0.07684939379840718, "percentage": 7.69, "elapsed_time": "12:58:32", "remaining_time": "6 days, 11:51:25", "throughput": 2720.07, "total_tokens": 127062208} {"current_steps": 703, "total_steps": 9134, "loss": 0.8053, "learning_rate": 4.92727537674888e-05, "epoch": 0.07695886586934508, "percentage": 7.7, "elapsed_time": "12:59:40", "remaining_time": "6 days, 11:50:34", "throughput": 2720.34, "total_tokens": 127258880} {"current_steps": 704, "total_steps": 9134, "loss": 0.8269, "learning_rate": 4.927069344239447e-05, "epoch": 0.07706833794028299, "percentage": 7.71, "elapsed_time": "13:00:47", "remaining_time": "6 days, 11:49:27", "throughput": 2720.71, "total_tokens": 127457568} {"current_steps": 705, "total_steps": 9134, "loss": 0.7908, "learning_rate": 4.9268630246123495e-05, "epoch": 0.07717781001122088, "percentage": 7.72, "elapsed_time": "13:01:52", "remaining_time": "6 days, 11:48:10", "throughput": 2720.8, "total_tokens": 127640128} {"current_steps": 706, "total_steps": 9134, "loss": 0.8948, "learning_rate": 4.926656417891996e-05, "epoch": 0.07728728208215879, "percentage": 7.73, "elapsed_time": "13:02:56", "remaining_time": "6 days, 11:46:33", "throughput": 2720.24, "total_tokens": 127787968} {"current_steps": 707, "total_steps": 9134, "loss": 0.765, "learning_rate": 4.926449524102826e-05, "epoch": 0.07739675415309669, "percentage": 7.74, "elapsed_time": "13:03:56", "remaining_time": "6 days, 11:44:03", "throughput": 2720.06, "total_tokens": 127941632} {"current_steps": 708, "total_steps": 9134, "loss": 0.6304, "learning_rate": 4.9262423432693175e-05, "epoch": 0.0775062262240346, "percentage": 7.75, "elapsed_time": "13:05:03", "remaining_time": "6 days, 11:43:08", "throughput": 2720.17, "total_tokens": 128130464} {"current_steps": 709, "total_steps": 9134, "loss": 0.9715, "learning_rate": 4.926034875415977e-05, "epoch": 0.0776156982949725, "percentage": 7.76, "elapsed_time": "13:06:12", "remaining_time": "6 days, 11:42:25", "throughput": 2720.64, "total_tokens": 128338784} {"current_steps": 710, "total_steps": 9134, "loss": 0.748, "learning_rate": 4.925827120567349e-05, "epoch": 0.0777251703659104, "percentage": 7.77, "elapsed_time": "13:07:21", "remaining_time": "6 days, 11:41:52", "throughput": 2720.93, "total_tokens": 128541280} {"current_steps": 711, "total_steps": 9134, "loss": 0.7341, "learning_rate": 4.9256190787480104e-05, "epoch": 0.0778346424368483, "percentage": 7.78, "elapsed_time": "13:08:30", "remaining_time": "6 days, 11:41:18", "throughput": 2721.27, "total_tokens": 128745792} {"current_steps": 712, "total_steps": 9134, "loss": 0.7121, "learning_rate": 4.9254107499825705e-05, "epoch": 0.0779441145077862, "percentage": 7.8, "elapsed_time": "13:09:39", "remaining_time": "6 days, 11:40:39", "throughput": 2721.52, "total_tokens": 128944928} {"current_steps": 713, "total_steps": 9134, "loss": 1.073, "learning_rate": 4.925202134295677e-05, "epoch": 0.0780535865787241, "percentage": 7.81, "elapsed_time": "13:10:45", "remaining_time": "6 days, 11:39:27", "throughput": 2721.24, "total_tokens": 129112032} {"current_steps": 714, "total_steps": 9134, "loss": 0.7132, "learning_rate": 4.924993231712006e-05, "epoch": 0.078163058649662, "percentage": 7.82, "elapsed_time": "13:11:48", "remaining_time": "6 days, 11:37:37", "throughput": 2720.99, "total_tokens": 129271072} {"current_steps": 715, "total_steps": 9134, "loss": 0.7086, "learning_rate": 4.924784042256273e-05, "epoch": 0.0782725307205999, "percentage": 7.83, "elapsed_time": "13:12:57", "remaining_time": "6 days, 11:36:54", "throughput": 2721.27, "total_tokens": 129470432} {"current_steps": 716, "total_steps": 9134, "loss": 0.708, "learning_rate": 4.9245745659532214e-05, "epoch": 0.07838200279153781, "percentage": 7.84, "elapsed_time": "13:14:01", "remaining_time": "6 days, 11:35:17", "throughput": 2720.93, "total_tokens": 129628576} {"current_steps": 717, "total_steps": 9134, "loss": 0.8432, "learning_rate": 4.924364802827635e-05, "epoch": 0.07849147486247571, "percentage": 7.85, "elapsed_time": "13:15:10", "remaining_time": "6 days, 11:34:47", "throughput": 2721.42, "total_tokens": 129841376} {"current_steps": 718, "total_steps": 9134, "loss": 0.8947, "learning_rate": 4.924154752904326e-05, "epoch": 0.07860094693341362, "percentage": 7.86, "elapsed_time": "13:16:17", "remaining_time": "6 days, 11:33:44", "throughput": 2721.55, "total_tokens": 130029536} {"current_steps": 719, "total_steps": 9134, "loss": 0.7372, "learning_rate": 4.923944416208145e-05, "epoch": 0.07871041900435151, "percentage": 7.87, "elapsed_time": "13:17:23", "remaining_time": "6 days, 11:32:25", "throughput": 2721.34, "total_tokens": 130197536} {"current_steps": 720, "total_steps": 9134, "loss": 0.6077, "learning_rate": 4.9237337927639725e-05, "epoch": 0.07881989107528942, "percentage": 7.88, "elapsed_time": "13:18:28", "remaining_time": "6 days, 11:31:01", "throughput": 2721.08, "total_tokens": 130362400} {"current_steps": 721, "total_steps": 9134, "loss": 0.757, "learning_rate": 4.923522882596726e-05, "epoch": 0.07892936314622732, "percentage": 7.89, "elapsed_time": "13:19:36", "remaining_time": "6 days, 11:30:13", "throughput": 2721.59, "total_tokens": 130571840} {"current_steps": 722, "total_steps": 9134, "loss": 0.6372, "learning_rate": 4.9233116857313554e-05, "epoch": 0.07903883521716522, "percentage": 7.9, "elapsed_time": "13:20:42", "remaining_time": "6 days, 11:29:04", "throughput": 2721.62, "total_tokens": 130753952} {"current_steps": 723, "total_steps": 9134, "loss": 0.5178, "learning_rate": 4.923100202192845e-05, "epoch": 0.07914830728810313, "percentage": 7.92, "elapsed_time": "13:21:46", "remaining_time": "6 days, 11:27:29", "throughput": 2721.24, "total_tokens": 130910304} {"current_steps": 724, "total_steps": 9134, "loss": 0.6108, "learning_rate": 4.922888432006213e-05, "epoch": 0.07925777935904102, "percentage": 7.93, "elapsed_time": "13:22:50", "remaining_time": "6 days, 11:25:44", "throughput": 2721.28, "total_tokens": 131084352} {"current_steps": 725, "total_steps": 9134, "loss": 0.6605, "learning_rate": 4.922676375196511e-05, "epoch": 0.07936725142997893, "percentage": 7.94, "elapsed_time": "13:23:54", "remaining_time": "6 days, 11:24:16", "throughput": 2721.35, "total_tokens": 131263776} {"current_steps": 726, "total_steps": 9134, "loss": 0.7337, "learning_rate": 4.922464031788826e-05, "epoch": 0.07947672350091683, "percentage": 7.95, "elapsed_time": "13:25:02", "remaining_time": "6 days, 11:23:24", "throughput": 2721.99, "total_tokens": 131479264} {"current_steps": 727, "total_steps": 9134, "loss": 0.6106, "learning_rate": 4.922251401808276e-05, "epoch": 0.07958619557185473, "percentage": 7.96, "elapsed_time": "13:26:06", "remaining_time": "6 days, 11:21:45", "throughput": 2721.75, "total_tokens": 131640992} {"current_steps": 728, "total_steps": 9134, "loss": 0.6467, "learning_rate": 4.922038485280016e-05, "epoch": 0.07969566764279264, "percentage": 7.97, "elapsed_time": "13:27:12", "remaining_time": "6 days, 11:20:35", "throughput": 2722.07, "total_tokens": 131836768} {"current_steps": 729, "total_steps": 9134, "loss": 0.7412, "learning_rate": 4.921825282229233e-05, "epoch": 0.07980513971373053, "percentage": 7.98, "elapsed_time": "13:28:18", "remaining_time": "6 days, 11:19:20", "throughput": 2721.71, "total_tokens": 131998272} {"current_steps": 730, "total_steps": 9134, "loss": 0.54, "learning_rate": 4.92161179268115e-05, "epoch": 0.07991461178466844, "percentage": 7.99, "elapsed_time": "13:29:26", "remaining_time": "6 days, 11:18:38", "throughput": 2721.66, "total_tokens": 132182848} {"current_steps": 731, "total_steps": 9134, "loss": 0.7165, "learning_rate": 4.921398016661021e-05, "epoch": 0.08002408385560633, "percentage": 8.0, "elapsed_time": "13:30:29", "remaining_time": "6 days, 11:16:46", "throughput": 2721.64, "total_tokens": 132351968} {"current_steps": 732, "total_steps": 9134, "loss": 0.8466, "learning_rate": 4.9211839541941345e-05, "epoch": 0.08013355592654424, "percentage": 8.01, "elapsed_time": "13:31:38", "remaining_time": "6 days, 11:16:10", "throughput": 2721.82, "total_tokens": 132549088} {"current_steps": 733, "total_steps": 9134, "loss": 0.7257, "learning_rate": 4.920969605305815e-05, "epoch": 0.08024302799748215, "percentage": 8.02, "elapsed_time": "13:32:43", "remaining_time": "6 days, 11:14:44", "throughput": 2721.72, "total_tokens": 132720672} {"current_steps": 734, "total_steps": 9134, "loss": 0.7737, "learning_rate": 4.92075497002142e-05, "epoch": 0.08035250006842004, "percentage": 8.04, "elapsed_time": "13:33:49", "remaining_time": "6 days, 11:13:35", "throughput": 2721.8, "total_tokens": 132905024} {"current_steps": 735, "total_steps": 9134, "loss": 0.5127, "learning_rate": 4.92054004836634e-05, "epoch": 0.08046197213935795, "percentage": 8.05, "elapsed_time": "13:34:51", "remaining_time": "6 days, 11:11:28", "throughput": 2721.47, "total_tokens": 133055552} {"current_steps": 736, "total_steps": 9134, "loss": 0.5494, "learning_rate": 4.920324840365998e-05, "epoch": 0.08057144421029584, "percentage": 8.06, "elapsed_time": "13:35:58", "remaining_time": "6 days, 11:10:27", "throughput": 2721.23, "total_tokens": 133226464} {"current_steps": 737, "total_steps": 9134, "loss": 0.6358, "learning_rate": 4.9201093460458555e-05, "epoch": 0.08068091628123375, "percentage": 8.07, "elapsed_time": "13:37:06", "remaining_time": "6 days, 11:09:48", "throughput": 2721.43, "total_tokens": 133423584} {"current_steps": 738, "total_steps": 9134, "loss": 0.7337, "learning_rate": 4.9198935654314036e-05, "epoch": 0.08079038835217166, "percentage": 8.08, "elapsed_time": "13:38:12", "remaining_time": "6 days, 11:08:34", "throughput": 2721.25, "total_tokens": 133594048} {"current_steps": 739, "total_steps": 9134, "loss": 0.6787, "learning_rate": 4.919677498548169e-05, "epoch": 0.08089986042310955, "percentage": 8.09, "elapsed_time": "13:39:21", "remaining_time": "6 days, 11:07:49", "throughput": 2721.27, "total_tokens": 133781312} {"current_steps": 740, "total_steps": 9134, "loss": 0.9397, "learning_rate": 4.9194611454217124e-05, "epoch": 0.08100933249404746, "percentage": 8.1, "elapsed_time": "13:40:28", "remaining_time": "6 days, 11:06:54", "throughput": 2721.25, "total_tokens": 133964096} {"current_steps": 741, "total_steps": 9134, "loss": 0.7926, "learning_rate": 4.9192445060776264e-05, "epoch": 0.08111880456498535, "percentage": 8.11, "elapsed_time": "13:41:37", "remaining_time": "6 days, 11:06:17", "throughput": 2721.57, "total_tokens": 134168160} {"current_steps": 742, "total_steps": 9134, "loss": 0.7434, "learning_rate": 4.919027580541541e-05, "epoch": 0.08122827663592326, "percentage": 8.12, "elapsed_time": "13:42:46", "remaining_time": "6 days, 11:05:38", "throughput": 2721.7, "total_tokens": 134362144} {"current_steps": 743, "total_steps": 9134, "loss": 0.8817, "learning_rate": 4.918810368839117e-05, "epoch": 0.08133774870686117, "percentage": 8.13, "elapsed_time": "13:43:55", "remaining_time": "6 days, 11:04:58", "throughput": 2721.62, "total_tokens": 134545600} {"current_steps": 744, "total_steps": 9134, "loss": 0.6353, "learning_rate": 4.91859287099605e-05, "epoch": 0.08144722077779906, "percentage": 8.15, "elapsed_time": "13:44:57", "remaining_time": "6 days, 11:02:59", "throughput": 2721.2, "total_tokens": 134693216} {"current_steps": 745, "total_steps": 9134, "loss": 0.5205, "learning_rate": 4.9183750870380704e-05, "epoch": 0.08155669284873697, "percentage": 8.16, "elapsed_time": "13:46:04", "remaining_time": "6 days, 11:01:57", "throughput": 2721.34, "total_tokens": 134882048} {"current_steps": 746, "total_steps": 9134, "loss": 1.1545, "learning_rate": 4.918157016990941e-05, "epoch": 0.08166616491967486, "percentage": 8.17, "elapsed_time": "13:47:12", "remaining_time": "6 days, 11:01:07", "throughput": 2721.85, "total_tokens": 135092608} {"current_steps": 747, "total_steps": 9134, "loss": 0.8898, "learning_rate": 4.917938660880459e-05, "epoch": 0.08177563699061277, "percentage": 8.18, "elapsed_time": "13:48:16", "remaining_time": "6 days, 10:59:28", "throughput": 2721.64, "total_tokens": 135255008} {"current_steps": 748, "total_steps": 9134, "loss": 0.7135, "learning_rate": 4.9177200187324556e-05, "epoch": 0.08188510906155068, "percentage": 8.19, "elapsed_time": "13:49:21", "remaining_time": "6 days, 10:58:05", "throughput": 2721.62, "total_tokens": 135431296} {"current_steps": 749, "total_steps": 9134, "loss": 0.6785, "learning_rate": 4.917501090572797e-05, "epoch": 0.08199458113248857, "percentage": 8.2, "elapsed_time": "13:50:23", "remaining_time": "6 days, 10:56:14", "throughput": 2721.29, "total_tokens": 135585184} {"current_steps": 750, "total_steps": 9134, "loss": 0.6401, "learning_rate": 4.91728187642738e-05, "epoch": 0.08210405320342648, "percentage": 8.21, "elapsed_time": "13:51:27", "remaining_time": "6 days, 10:54:31", "throughput": 2721.13, "total_tokens": 135749152} {"current_steps": 751, "total_steps": 9134, "loss": 0.6404, "learning_rate": 4.917062376322138e-05, "epoch": 0.08221352527436437, "percentage": 8.22, "elapsed_time": "13:52:36", "remaining_time": "6 days, 10:53:57", "throughput": 2721.67, "total_tokens": 135965312} {"current_steps": 752, "total_steps": 9134, "loss": 0.9701, "learning_rate": 4.916842590283037e-05, "epoch": 0.08232299734530228, "percentage": 8.23, "elapsed_time": "13:53:45", "remaining_time": "6 days, 10:53:21", "throughput": 2721.71, "total_tokens": 136155936} {"current_steps": 753, "total_steps": 9134, "loss": 0.8394, "learning_rate": 4.916622518336079e-05, "epoch": 0.08243246941624018, "percentage": 8.24, "elapsed_time": "13:54:50", "remaining_time": "6 days, 10:51:55", "throughput": 2721.65, "total_tokens": 136329088} {"current_steps": 754, "total_steps": 9134, "loss": 0.9354, "learning_rate": 4.916402160507296e-05, "epoch": 0.08254194148717808, "percentage": 8.25, "elapsed_time": "13:55:59", "remaining_time": "6 days, 10:51:16", "throughput": 2721.92, "total_tokens": 136530240} {"current_steps": 755, "total_steps": 9134, "loss": 0.6836, "learning_rate": 4.9161815168227576e-05, "epoch": 0.08265141355811599, "percentage": 8.27, "elapsed_time": "13:57:06", "remaining_time": "6 days, 10:50:15", "throughput": 2721.97, "total_tokens": 136715264} {"current_steps": 756, "total_steps": 9134, "loss": 0.6397, "learning_rate": 4.915960587308564e-05, "epoch": 0.08276088562905388, "percentage": 8.28, "elapsed_time": "13:58:10", "remaining_time": "6 days, 10:48:36", "throughput": 2721.54, "total_tokens": 136866688} {"current_steps": 757, "total_steps": 9134, "loss": 0.5921, "learning_rate": 4.915739371990852e-05, "epoch": 0.08287035769999179, "percentage": 8.29, "elapsed_time": "13:59:15", "remaining_time": "6 days, 10:47:18", "throughput": 2721.37, "total_tokens": 137036256} {"current_steps": 758, "total_steps": 9134, "loss": 0.6946, "learning_rate": 4.9155178708957896e-05, "epoch": 0.08297982977092969, "percentage": 8.3, "elapsed_time": "14:00:23", "remaining_time": "6 days, 10:46:23", "throughput": 2721.75, "total_tokens": 137239424} {"current_steps": 759, "total_steps": 9134, "loss": 0.9498, "learning_rate": 4.915296084049582e-05, "epoch": 0.0830893018418676, "percentage": 8.31, "elapsed_time": "14:01:28", "remaining_time": "6 days, 10:45:05", "throughput": 2721.58, "total_tokens": 137408992} {"current_steps": 760, "total_steps": 9134, "loss": 0.673, "learning_rate": 4.915074011478463e-05, "epoch": 0.0831987739128055, "percentage": 8.32, "elapsed_time": "14:02:35", "remaining_time": "6 days, 10:43:57", "throughput": 2721.35, "total_tokens": 137578112} {"current_steps": 761, "total_steps": 9134, "loss": 0.7599, "learning_rate": 4.914851653208707e-05, "epoch": 0.0833082459837434, "percentage": 8.33, "elapsed_time": "14:03:38", "remaining_time": "6 days, 10:42:21", "throughput": 2721.22, "total_tokens": 137744992} {"current_steps": 762, "total_steps": 9134, "loss": 0.6717, "learning_rate": 4.9146290092666163e-05, "epoch": 0.0834177180546813, "percentage": 8.34, "elapsed_time": "14:04:43", "remaining_time": "6 days, 10:40:48", "throughput": 2721.19, "total_tokens": 137918144} {"current_steps": 763, "total_steps": 9134, "loss": 0.6558, "learning_rate": 4.91440607967853e-05, "epoch": 0.0835271901256192, "percentage": 8.35, "elapsed_time": "14:05:49", "remaining_time": "6 days, 10:39:44", "throughput": 2721.31, "total_tokens": 138106080} {"current_steps": 764, "total_steps": 9134, "loss": 0.5753, "learning_rate": 4.91418286447082e-05, "epoch": 0.0836366621965571, "percentage": 8.36, "elapsed_time": "14:06:58", "remaining_time": "6 days, 10:39:06", "throughput": 2721.08, "total_tokens": 138282144} {"current_steps": 765, "total_steps": 9134, "loss": 0.7834, "learning_rate": 4.913959363669892e-05, "epoch": 0.08374613426749501, "percentage": 8.38, "elapsed_time": "14:08:03", "remaining_time": "6 days, 10:37:34", "throughput": 2721.09, "total_tokens": 138457760} {"current_steps": 766, "total_steps": 9134, "loss": 0.8654, "learning_rate": 4.9137355773021856e-05, "epoch": 0.0838556063384329, "percentage": 8.39, "elapsed_time": "14:09:11", "remaining_time": "6 days, 10:36:53", "throughput": 2721.32, "total_tokens": 138656672} {"current_steps": 767, "total_steps": 9134, "loss": 0.7416, "learning_rate": 4.913511505394175e-05, "epoch": 0.08396507840937081, "percentage": 8.4, "elapsed_time": "14:10:19", "remaining_time": "6 days, 10:35:57", "throughput": 2721.59, "total_tokens": 138854016} {"current_steps": 768, "total_steps": 9134, "loss": 0.6422, "learning_rate": 4.9132871479723675e-05, "epoch": 0.08407455048030871, "percentage": 8.41, "elapsed_time": "14:11:24", "remaining_time": "6 days, 10:34:37", "throughput": 2721.48, "total_tokens": 139026048} {"current_steps": 769, "total_steps": 9134, "loss": 0.8059, "learning_rate": 4.9130625050633036e-05, "epoch": 0.08418402255124662, "percentage": 8.42, "elapsed_time": "14:12:31", "remaining_time": "6 days, 10:33:28", "throughput": 2721.48, "total_tokens": 139206592} {"current_steps": 770, "total_steps": 9134, "loss": 0.7513, "learning_rate": 4.912837576693559e-05, "epoch": 0.08429349462218451, "percentage": 8.43, "elapsed_time": "14:13:30", "remaining_time": "6 days, 10:31:01", "throughput": 2721.11, "total_tokens": 139348384} {"current_steps": 771, "total_steps": 9134, "loss": 0.8439, "learning_rate": 4.9126123628897406e-05, "epoch": 0.08440296669312242, "percentage": 8.44, "elapsed_time": "14:14:33", "remaining_time": "6 days, 10:29:20", "throughput": 2720.96, "total_tokens": 139513024} {"current_steps": 772, "total_steps": 9134, "loss": 0.6829, "learning_rate": 4.912386863678492e-05, "epoch": 0.08451243876406032, "percentage": 8.45, "elapsed_time": "14:15:34", "remaining_time": "6 days, 10:27:18", "throughput": 2720.37, "total_tokens": 139649888} {"current_steps": 773, "total_steps": 9134, "loss": 0.9824, "learning_rate": 4.91216107908649e-05, "epoch": 0.08462191083499822, "percentage": 8.46, "elapsed_time": "14:16:39", "remaining_time": "6 days, 10:25:50", "throughput": 2720.53, "total_tokens": 139833120} {"current_steps": 774, "total_steps": 9134, "loss": 0.7618, "learning_rate": 4.911935009140443e-05, "epoch": 0.08473138290593613, "percentage": 8.47, "elapsed_time": "14:17:48", "remaining_time": "6 days, 10:25:10", "throughput": 2721.04, "total_tokens": 140047040} {"current_steps": 775, "total_steps": 9134, "loss": 0.9318, "learning_rate": 4.911708653867095e-05, "epoch": 0.08484085497687402, "percentage": 8.48, "elapsed_time": "14:18:54", "remaining_time": "6 days, 10:24:00", "throughput": 2721.13, "total_tokens": 140231840} {"current_steps": 776, "total_steps": 9134, "loss": 0.768, "learning_rate": 4.911482013293224e-05, "epoch": 0.08495032704781193, "percentage": 8.5, "elapsed_time": "14:19:58", "remaining_time": "6 days, 10:22:27", "throughput": 2721.2, "total_tokens": 140409472} {"current_steps": 777, "total_steps": 9134, "loss": 0.8267, "learning_rate": 4.91125508744564e-05, "epoch": 0.08505979911874983, "percentage": 8.51, "elapsed_time": "14:21:07", "remaining_time": "6 days, 10:21:52", "throughput": 2721.45, "total_tokens": 140611744} {"current_steps": 778, "total_steps": 9134, "loss": 0.8866, "learning_rate": 4.9110278763511897e-05, "epoch": 0.08516927118968773, "percentage": 8.52, "elapsed_time": "14:22:14", "remaining_time": "6 days, 10:20:49", "throughput": 2721.08, "total_tokens": 140774368} {"current_steps": 779, "total_steps": 9134, "loss": 0.6919, "learning_rate": 4.910800380036751e-05, "epoch": 0.08527874326062564, "percentage": 8.53, "elapsed_time": "14:23:22", "remaining_time": "6 days, 10:19:53", "throughput": 2721.44, "total_tokens": 140976416} {"current_steps": 780, "total_steps": 9134, "loss": 0.6341, "learning_rate": 4.910572598529235e-05, "epoch": 0.08538821533156353, "percentage": 8.54, "elapsed_time": "14:24:25", "remaining_time": "6 days, 10:18:16", "throughput": 2721.32, "total_tokens": 141143296} {"current_steps": 781, "total_steps": 9134, "loss": 0.5611, "learning_rate": 4.910344531855589e-05, "epoch": 0.08549768740250144, "percentage": 8.55, "elapsed_time": "14:25:31", "remaining_time": "6 days, 10:17:03", "throughput": 2721.37, "total_tokens": 141325632} {"current_steps": 782, "total_steps": 9134, "loss": 0.7065, "learning_rate": 4.910116180042793e-05, "epoch": 0.08560715947343935, "percentage": 8.56, "elapsed_time": "14:26:37", "remaining_time": "6 days, 10:15:51", "throughput": 2721.52, "total_tokens": 141512896} {"current_steps": 783, "total_steps": 9134, "loss": 0.6342, "learning_rate": 4.90988754311786e-05, "epoch": 0.08571663154437724, "percentage": 8.57, "elapsed_time": "14:27:46", "remaining_time": "6 days, 10:15:07", "throughput": 2721.31, "total_tokens": 141688512} {"current_steps": 784, "total_steps": 9134, "loss": 0.615, "learning_rate": 4.9096586211078376e-05, "epoch": 0.08582610361531515, "percentage": 8.58, "elapsed_time": "14:28:51", "remaining_time": "6 days, 10:13:41", "throughput": 2720.94, "total_tokens": 141845536} {"current_steps": 785, "total_steps": 9134, "loss": 0.7083, "learning_rate": 4.9094294140398075e-05, "epoch": 0.08593557568625304, "percentage": 8.59, "elapsed_time": "14:29:55", "remaining_time": "6 days, 10:12:12", "throughput": 2720.64, "total_tokens": 142004800} {"current_steps": 786, "total_steps": 9134, "loss": 0.6695, "learning_rate": 4.909199921940883e-05, "epoch": 0.08604504775719095, "percentage": 8.61, "elapsed_time": "14:31:03", "remaining_time": "6 days, 10:11:22", "throughput": 2720.86, "total_tokens": 142201472} {"current_steps": 787, "total_steps": 9134, "loss": 0.9538, "learning_rate": 4.908970144838214e-05, "epoch": 0.08615451982812884, "percentage": 8.62, "elapsed_time": "14:32:10", "remaining_time": "6 days, 10:10:19", "throughput": 2720.88, "total_tokens": 142384256} {"current_steps": 788, "total_steps": 9134, "loss": 0.9346, "learning_rate": 4.9087400827589814e-05, "epoch": 0.08626399189906675, "percentage": 8.63, "elapsed_time": "14:33:14", "remaining_time": "6 days, 10:08:49", "throughput": 2720.73, "total_tokens": 142551360} {"current_steps": 789, "total_steps": 9134, "loss": 0.7631, "learning_rate": 4.908509735730402e-05, "epoch": 0.08637346397000466, "percentage": 8.64, "elapsed_time": "14:34:23", "remaining_time": "6 days, 10:08:08", "throughput": 2721.19, "total_tokens": 142762816} {"current_steps": 790, "total_steps": 9134, "loss": 0.6486, "learning_rate": 4.908279103779725e-05, "epoch": 0.08648293604094255, "percentage": 8.65, "elapsed_time": "14:35:29", "remaining_time": "6 days, 10:06:56", "throughput": 2721.21, "total_tokens": 142943360} {"current_steps": 791, "total_steps": 9134, "loss": 0.7172, "learning_rate": 4.908048186934234e-05, "epoch": 0.08659240811188046, "percentage": 8.66, "elapsed_time": "14:36:35", "remaining_time": "6 days, 10:05:43", "throughput": 2721.29, "total_tokens": 143127040} {"current_steps": 792, "total_steps": 9134, "loss": 0.7696, "learning_rate": 4.9078169852212454e-05, "epoch": 0.08670188018281835, "percentage": 8.67, "elapsed_time": "14:37:43", "remaining_time": "6 days, 10:04:58", "throughput": 2721.62, "total_tokens": 143330880} {"current_steps": 793, "total_steps": 9134, "loss": 0.81, "learning_rate": 4.907585498668111e-05, "epoch": 0.08681135225375626, "percentage": 8.68, "elapsed_time": "14:38:49", "remaining_time": "6 days, 10:03:48", "throughput": 2721.25, "total_tokens": 143491264} {"current_steps": 794, "total_steps": 9134, "loss": 0.6442, "learning_rate": 4.907353727302214e-05, "epoch": 0.08692082432469417, "percentage": 8.69, "elapsed_time": "14:39:51", "remaining_time": "6 days, 10:01:51", "throughput": 2721.05, "total_tokens": 143648288} {"current_steps": 795, "total_steps": 9134, "loss": 0.5882, "learning_rate": 4.907121671150974e-05, "epoch": 0.08703029639563206, "percentage": 8.7, "elapsed_time": "14:40:57", "remaining_time": "6 days, 10:00:34", "throughput": 2721.03, "total_tokens": 143825696} {"current_steps": 796, "total_steps": 9134, "loss": 0.627, "learning_rate": 4.906889330241842e-05, "epoch": 0.08713976846656997, "percentage": 8.71, "elapsed_time": "14:42:02", "remaining_time": "6 days, 9:59:12", "throughput": 2720.71, "total_tokens": 143986080} {"current_steps": 797, "total_steps": 9134, "loss": 0.8028, "learning_rate": 4.9066567046023025e-05, "epoch": 0.08724924053750786, "percentage": 8.73, "elapsed_time": "14:43:08", "remaining_time": "6 days, 9:58:00", "throughput": 2720.95, "total_tokens": 144177824} {"current_steps": 798, "total_steps": 9134, "loss": 0.879, "learning_rate": 4.906423794259876e-05, "epoch": 0.08735871260844577, "percentage": 8.74, "elapsed_time": "14:44:12", "remaining_time": "6 days, 9:56:36", "throughput": 2720.71, "total_tokens": 144341792} {"current_steps": 799, "total_steps": 9134, "loss": 0.8659, "learning_rate": 4.906190599242115e-05, "epoch": 0.08746818467938368, "percentage": 8.75, "elapsed_time": "14:45:18", "remaining_time": "6 days, 9:55:20", "throughput": 2720.98, "total_tokens": 144533984} {"current_steps": 800, "total_steps": 9134, "loss": 0.8295, "learning_rate": 4.9059571195766066e-05, "epoch": 0.08757765675032157, "percentage": 8.76, "elapsed_time": "14:46:24", "remaining_time": "6 days, 9:54:11", "throughput": 2721.11, "total_tokens": 144721024} {"current_steps": 801, "total_steps": 9134, "loss": 0.6388, "learning_rate": 4.90572335529097e-05, "epoch": 0.08768712882125948, "percentage": 8.77, "elapsed_time": "14:47:31", "remaining_time": "6 days, 9:53:11", "throughput": 2721.19, "total_tokens": 144908288} {"current_steps": 802, "total_steps": 9134, "loss": 0.5966, "learning_rate": 4.9054893064128584e-05, "epoch": 0.08779660089219737, "percentage": 8.78, "elapsed_time": "14:48:39", "remaining_time": "6 days, 9:52:21", "throughput": 2721.27, "total_tokens": 145097792} {"current_steps": 803, "total_steps": 9134, "loss": 0.6211, "learning_rate": 4.905254972969962e-05, "epoch": 0.08790607296313528, "percentage": 8.79, "elapsed_time": "14:49:46", "remaining_time": "6 days, 9:51:21", "throughput": 2721.7, "total_tokens": 145303424} {"current_steps": 804, "total_steps": 9134, "loss": 0.7511, "learning_rate": 4.9050203549899984e-05, "epoch": 0.08801554503407318, "percentage": 8.8, "elapsed_time": "14:50:54", "remaining_time": "6 days, 9:50:29", "throughput": 2722.07, "total_tokens": 145508160} {"current_steps": 805, "total_steps": 9134, "loss": 0.733, "learning_rate": 4.904785452500726e-05, "epoch": 0.08812501710501108, "percentage": 8.81, "elapsed_time": "14:52:00", "remaining_time": "6 days, 9:49:12", "throughput": 2721.84, "total_tokens": 145673920} {"current_steps": 806, "total_steps": 9134, "loss": 0.6224, "learning_rate": 4.904550265529932e-05, "epoch": 0.08823448917594899, "percentage": 8.82, "elapsed_time": "14:53:04", "remaining_time": "6 days, 9:47:46", "throughput": 2721.84, "total_tokens": 145849760} {"current_steps": 807, "total_steps": 9134, "loss": 0.798, "learning_rate": 4.904314794105437e-05, "epoch": 0.08834396124688688, "percentage": 8.84, "elapsed_time": "14:54:13", "remaining_time": "6 days, 9:46:58", "throughput": 2722.03, "total_tokens": 146045536} {"current_steps": 808, "total_steps": 9134, "loss": 0.8995, "learning_rate": 4.9040790382550985e-05, "epoch": 0.08845343331782479, "percentage": 8.85, "elapsed_time": "14:55:22", "remaining_time": "6 days, 9:46:17", "throughput": 2722.02, "total_tokens": 146232576} {"current_steps": 809, "total_steps": 9134, "loss": 0.6881, "learning_rate": 4.903842998006806e-05, "epoch": 0.08856290538876269, "percentage": 8.86, "elapsed_time": "14:56:30", "remaining_time": "6 days, 9:45:34", "throughput": 2722.16, "total_tokens": 146427456} {"current_steps": 810, "total_steps": 9134, "loss": 0.7038, "learning_rate": 4.903606673388482e-05, "epoch": 0.0886723774597006, "percentage": 8.87, "elapsed_time": "14:57:38", "remaining_time": "6 days, 9:44:38", "throughput": 2722.21, "total_tokens": 146614048} {"current_steps": 811, "total_steps": 9134, "loss": 1.0258, "learning_rate": 4.903370064428083e-05, "epoch": 0.0887818495306385, "percentage": 8.88, "elapsed_time": "14:58:45", "remaining_time": "6 days, 9:43:36", "throughput": 2722.11, "total_tokens": 146790784} {"current_steps": 812, "total_steps": 9134, "loss": 0.9551, "learning_rate": 4.903133171153601e-05, "epoch": 0.0888913216015764, "percentage": 8.89, "elapsed_time": "14:59:54", "remaining_time": "6 days, 9:42:59", "throughput": 2722.47, "total_tokens": 146999328} {"current_steps": 813, "total_steps": 9134, "loss": 0.5975, "learning_rate": 4.902895993593058e-05, "epoch": 0.0890007936725143, "percentage": 8.9, "elapsed_time": "15:01:00", "remaining_time": "6 days, 9:41:41", "throughput": 2722.6, "total_tokens": 147183904} {"current_steps": 814, "total_steps": 9134, "loss": 0.6499, "learning_rate": 4.902658531774512e-05, "epoch": 0.0891102657434522, "percentage": 8.91, "elapsed_time": "15:02:09", "remaining_time": "6 days, 9:41:02", "throughput": 2722.66, "total_tokens": 147375648} {"current_steps": 815, "total_steps": 9134, "loss": 0.8148, "learning_rate": 4.902420785726056e-05, "epoch": 0.0892197378143901, "percentage": 8.92, "elapsed_time": "15:03:14", "remaining_time": "6 days, 9:39:43", "throughput": 2722.56, "total_tokens": 147548128} {"current_steps": 816, "total_steps": 9134, "loss": 0.8289, "learning_rate": 4.902182755475813e-05, "epoch": 0.08932920988532801, "percentage": 8.93, "elapsed_time": "15:04:21", "remaining_time": "6 days, 9:38:43", "throughput": 2722.69, "total_tokens": 147737856} {"current_steps": 817, "total_steps": 9134, "loss": 0.9015, "learning_rate": 4.9019444410519425e-05, "epoch": 0.0894386819562659, "percentage": 8.94, "elapsed_time": "15:05:27", "remaining_time": "6 days, 9:37:30", "throughput": 2722.72, "total_tokens": 147918400} {"current_steps": 818, "total_steps": 9134, "loss": 0.6044, "learning_rate": 4.9017058424826366e-05, "epoch": 0.08954815402720381, "percentage": 8.96, "elapsed_time": "15:06:32", "remaining_time": "6 days, 9:36:04", "throughput": 2722.47, "total_tokens": 148081024} {"current_steps": 819, "total_steps": 9134, "loss": 0.6394, "learning_rate": 4.901466959796121e-05, "epoch": 0.08965762609814171, "percentage": 8.97, "elapsed_time": "15:07:41", "remaining_time": "6 days, 9:35:24", "throughput": 2722.6, "total_tokens": 148276352} {"current_steps": 820, "total_steps": 9134, "loss": 0.7425, "learning_rate": 4.9012277930206536e-05, "epoch": 0.08976709816907961, "percentage": 8.98, "elapsed_time": "15:08:45", "remaining_time": "6 days, 9:33:59", "throughput": 2722.84, "total_tokens": 148465632} {"current_steps": 821, "total_steps": 9134, "loss": 0.7632, "learning_rate": 4.900988342184529e-05, "epoch": 0.08987657024001751, "percentage": 8.99, "elapsed_time": "15:09:53", "remaining_time": "6 days, 9:33:01", "throughput": 2722.92, "total_tokens": 148653120} {"current_steps": 822, "total_steps": 9134, "loss": 0.6866, "learning_rate": 4.9007486073160746e-05, "epoch": 0.08998604231095542, "percentage": 9.0, "elapsed_time": "15:10:58", "remaining_time": "6 days, 9:31:41", "throughput": 2722.62, "total_tokens": 148813952} {"current_steps": 823, "total_steps": 9134, "loss": 0.707, "learning_rate": 4.900508588443649e-05, "epoch": 0.09009551438189332, "percentage": 9.01, "elapsed_time": "15:12:03", "remaining_time": "6 days, 9:30:24", "throughput": 2722.46, "total_tokens": 148983744} {"current_steps": 824, "total_steps": 9134, "loss": 0.7952, "learning_rate": 4.900268285595645e-05, "epoch": 0.09020498645283122, "percentage": 9.02, "elapsed_time": "15:13:13", "remaining_time": "6 days, 9:29:52", "throughput": 2722.95, "total_tokens": 149200800} {"current_steps": 825, "total_steps": 9134, "loss": 0.6926, "learning_rate": 4.9000276988004925e-05, "epoch": 0.09031445852376913, "percentage": 9.03, "elapsed_time": "15:14:21", "remaining_time": "6 days, 9:29:00", "throughput": 2722.95, "total_tokens": 149385824} {"current_steps": 826, "total_steps": 9134, "loss": 1.0813, "learning_rate": 4.899786828086651e-05, "epoch": 0.09042393059470702, "percentage": 9.04, "elapsed_time": "15:15:31", "remaining_time": "6 days, 9:28:22", "throughput": 2723.45, "total_tokens": 149601984} {"current_steps": 827, "total_steps": 9134, "loss": 0.7668, "learning_rate": 4.899545673482616e-05, "epoch": 0.09053340266564493, "percentage": 9.05, "elapsed_time": "15:16:32", "remaining_time": "6 days, 9:26:26", "throughput": 2723.0, "total_tokens": 149744672} {"current_steps": 828, "total_steps": 9134, "loss": 0.8394, "learning_rate": 4.8993042350169145e-05, "epoch": 0.09064287473658283, "percentage": 9.07, "elapsed_time": "15:17:42", "remaining_time": "6 days, 9:25:51", "throughput": 2723.54, "total_tokens": 149964192} {"current_steps": 829, "total_steps": 9134, "loss": 0.6735, "learning_rate": 4.899062512718109e-05, "epoch": 0.09075234680752073, "percentage": 9.08, "elapsed_time": "15:18:45", "remaining_time": "6 days, 9:24:16", "throughput": 2723.57, "total_tokens": 150138912} {"current_steps": 830, "total_steps": 9134, "loss": 0.6986, "learning_rate": 4.898820506614794e-05, "epoch": 0.09086181887845864, "percentage": 9.09, "elapsed_time": "15:19:46", "remaining_time": "6 days, 9:22:07", "throughput": 2723.02, "total_tokens": 150272864} {"current_steps": 831, "total_steps": 9134, "loss": 0.8561, "learning_rate": 4.898578216735599e-05, "epoch": 0.09097129094939653, "percentage": 9.1, "elapsed_time": "15:20:52", "remaining_time": "6 days, 9:21:02", "throughput": 2723.45, "total_tokens": 150478496} {"current_steps": 832, "total_steps": 9134, "loss": 0.7374, "learning_rate": 4.8983356431091864e-05, "epoch": 0.09108076302033444, "percentage": 9.11, "elapsed_time": "15:21:56", "remaining_time": "6 days, 9:19:26", "throughput": 2723.43, "total_tokens": 150650304} {"current_steps": 833, "total_steps": 9134, "loss": 0.7869, "learning_rate": 4.8980927857642514e-05, "epoch": 0.09119023509127235, "percentage": 9.12, "elapsed_time": "15:22:59", "remaining_time": "6 days, 9:17:46", "throughput": 2723.11, "total_tokens": 150804192} {"current_steps": 834, "total_steps": 9134, "loss": 0.6249, "learning_rate": 4.897849644729525e-05, "epoch": 0.09129970716221024, "percentage": 9.13, "elapsed_time": "15:24:01", "remaining_time": "6 days, 9:15:57", "throughput": 2722.61, "total_tokens": 150946208} {"current_steps": 835, "total_steps": 9134, "loss": 0.5683, "learning_rate": 4.8976062200337695e-05, "epoch": 0.09140917923314815, "percentage": 9.14, "elapsed_time": "15:25:06", "remaining_time": "6 days, 9:14:35", "throughput": 2722.38, "total_tokens": 151109952} {"current_steps": 836, "total_steps": 9134, "loss": 0.7016, "learning_rate": 4.897362511705781e-05, "epoch": 0.09151865130408604, "percentage": 9.15, "elapsed_time": "15:26:14", "remaining_time": "6 days, 9:13:42", "throughput": 2722.37, "total_tokens": 151293856} {"current_steps": 837, "total_steps": 9134, "loss": 0.7584, "learning_rate": 4.897118519774391e-05, "epoch": 0.09162812337502395, "percentage": 9.16, "elapsed_time": "15:27:22", "remaining_time": "6 days, 9:12:47", "throughput": 2722.31, "total_tokens": 151474848} {"current_steps": 838, "total_steps": 9134, "loss": 0.873, "learning_rate": 4.8968742442684625e-05, "epoch": 0.09173759544596186, "percentage": 9.17, "elapsed_time": "15:28:27", "remaining_time": "6 days, 9:11:29", "throughput": 2721.98, "total_tokens": 151634112} {"current_steps": 839, "total_steps": 9134, "loss": 0.7044, "learning_rate": 4.896629685216892e-05, "epoch": 0.09184706751689975, "percentage": 9.19, "elapsed_time": "15:29:30", "remaining_time": "6 days, 9:09:54", "throughput": 2721.74, "total_tokens": 151794048} {"current_steps": 840, "total_steps": 9134, "loss": 0.5683, "learning_rate": 4.896384842648612e-05, "epoch": 0.09195653958783766, "percentage": 9.2, "elapsed_time": "15:30:33", "remaining_time": "6 days, 9:08:10", "throughput": 2721.44, "total_tokens": 151947936} {"current_steps": 841, "total_steps": 9134, "loss": 0.6199, "learning_rate": 4.8961397165925874e-05, "epoch": 0.09206601165877555, "percentage": 9.21, "elapsed_time": "15:31:37", "remaining_time": "6 days, 9:06:42", "throughput": 2721.67, "total_tokens": 152135648} {"current_steps": 842, "total_steps": 9134, "loss": 0.6604, "learning_rate": 4.895894307077814e-05, "epoch": 0.09217548372971346, "percentage": 9.22, "elapsed_time": "15:32:46", "remaining_time": "6 days, 9:05:57", "throughput": 2721.72, "total_tokens": 152325152} {"current_steps": 843, "total_steps": 9134, "loss": 0.7524, "learning_rate": 4.895648614133324e-05, "epoch": 0.09228495580065135, "percentage": 9.23, "elapsed_time": "15:33:54", "remaining_time": "6 days, 9:05:09", "throughput": 2721.96, "total_tokens": 152524512} {"current_steps": 844, "total_steps": 9134, "loss": 0.6847, "learning_rate": 4.895402637788183e-05, "epoch": 0.09239442787158926, "percentage": 9.24, "elapsed_time": "15:35:00", "remaining_time": "6 days, 9:03:54", "throughput": 2721.97, "total_tokens": 152703936} {"current_steps": 845, "total_steps": 9134, "loss": 0.6819, "learning_rate": 4.895156378071489e-05, "epoch": 0.09250389994252717, "percentage": 9.25, "elapsed_time": "15:36:09", "remaining_time": "6 days, 9:03:09", "throughput": 2722.32, "total_tokens": 152910688} {"current_steps": 846, "total_steps": 9134, "loss": 0.7543, "learning_rate": 4.894909835012374e-05, "epoch": 0.09261337201346506, "percentage": 9.26, "elapsed_time": "15:37:12", "remaining_time": "6 days, 9:01:31", "throughput": 2722.14, "total_tokens": 153072416} {"current_steps": 847, "total_steps": 9134, "loss": 0.5573, "learning_rate": 4.894663008640004e-05, "epoch": 0.09272284408440297, "percentage": 9.27, "elapsed_time": "15:38:17", "remaining_time": "6 days, 9:00:08", "throughput": 2722.0, "total_tokens": 153241088} {"current_steps": 848, "total_steps": 9134, "loss": 0.8251, "learning_rate": 4.894415898983578e-05, "epoch": 0.09283231615534086, "percentage": 9.28, "elapsed_time": "15:39:25", "remaining_time": "6 days, 8:59:23", "throughput": 2722.06, "total_tokens": 153431264} {"current_steps": 849, "total_steps": 9134, "loss": 0.6088, "learning_rate": 4.894168506072329e-05, "epoch": 0.09294178822627877, "percentage": 9.29, "elapsed_time": "15:40:33", "remaining_time": "6 days, 8:58:30", "throughput": 2722.06, "total_tokens": 153616064} {"current_steps": 850, "total_steps": 9134, "loss": 0.7778, "learning_rate": 4.8939208299355215e-05, "epoch": 0.09305126029721668, "percentage": 9.31, "elapsed_time": "15:41:42", "remaining_time": "6 days, 8:57:46", "throughput": 2721.93, "total_tokens": 153795936} {"current_steps": 851, "total_steps": 9134, "loss": 0.659, "learning_rate": 4.893672870602457e-05, "epoch": 0.09316073236815457, "percentage": 9.32, "elapsed_time": "15:42:45", "remaining_time": "6 days, 8:56:10", "throughput": 2721.61, "total_tokens": 153950272} {"current_steps": 852, "total_steps": 9134, "loss": 0.7125, "learning_rate": 4.893424628102468e-05, "epoch": 0.09327020443909248, "percentage": 9.33, "elapsed_time": "15:43:54", "remaining_time": "6 days, 8:55:23", "throughput": 2721.39, "total_tokens": 154124544} {"current_steps": 853, "total_steps": 9134, "loss": 0.706, "learning_rate": 4.8931761024649206e-05, "epoch": 0.09337967651003037, "percentage": 9.34, "elapsed_time": "15:45:01", "remaining_time": "6 days, 8:54:20", "throughput": 2721.82, "total_tokens": 154330176} {"current_steps": 854, "total_steps": 9134, "loss": 0.8021, "learning_rate": 4.8929272937192147e-05, "epoch": 0.09348914858096828, "percentage": 9.35, "elapsed_time": "15:46:04", "remaining_time": "6 days, 8:52:46", "throughput": 2721.54, "total_tokens": 154488096} {"current_steps": 855, "total_steps": 9134, "loss": 0.8338, "learning_rate": 4.892678201894785e-05, "epoch": 0.09359862065190619, "percentage": 9.36, "elapsed_time": "15:47:11", "remaining_time": "6 days, 8:51:39", "throughput": 2721.26, "total_tokens": 154652512} {"current_steps": 856, "total_steps": 9134, "loss": 0.7688, "learning_rate": 4.892428827021098e-05, "epoch": 0.09370809272284408, "percentage": 9.37, "elapsed_time": "15:48:18", "remaining_time": "6 days, 8:50:36", "throughput": 2721.1, "total_tokens": 154825216} {"current_steps": 857, "total_steps": 9134, "loss": 0.6916, "learning_rate": 4.892179169127654e-05, "epoch": 0.09381756479378199, "percentage": 9.38, "elapsed_time": "15:49:23", "remaining_time": "6 days, 8:49:16", "throughput": 2721.36, "total_tokens": 155017184} {"current_steps": 858, "total_steps": 9134, "loss": 0.7637, "learning_rate": 4.891929228243988e-05, "epoch": 0.09392703686471988, "percentage": 9.39, "elapsed_time": "15:50:32", "remaining_time": "6 days, 8:48:34", "throughput": 2721.47, "total_tokens": 155211168} {"current_steps": 859, "total_steps": 9134, "loss": 0.6796, "learning_rate": 4.8916790043996665e-05, "epoch": 0.09403650893565779, "percentage": 9.4, "elapsed_time": "15:51:36", "remaining_time": "6 days, 8:47:05", "throughput": 2721.44, "total_tokens": 155384320} {"current_steps": 860, "total_steps": 9134, "loss": 0.5568, "learning_rate": 4.891428497624291e-05, "epoch": 0.09414598100659569, "percentage": 9.42, "elapsed_time": "15:52:36", "remaining_time": "6 days, 8:45:00", "throughput": 2721.07, "total_tokens": 155527680} {"current_steps": 861, "total_steps": 9134, "loss": 0.6695, "learning_rate": 4.891177707947496e-05, "epoch": 0.0942554530775336, "percentage": 9.43, "elapsed_time": "15:53:45", "remaining_time": "6 days, 8:44:17", "throughput": 2721.31, "total_tokens": 155728384} {"current_steps": 862, "total_steps": 9134, "loss": 0.6203, "learning_rate": 4.890926635398949e-05, "epoch": 0.0943649251484715, "percentage": 9.44, "elapsed_time": "15:54:47", "remaining_time": "6 days, 8:42:32", "throughput": 2720.88, "total_tokens": 155873984} {"current_steps": 863, "total_steps": 9134, "loss": 0.7613, "learning_rate": 4.890675280008352e-05, "epoch": 0.0944743972194094, "percentage": 9.45, "elapsed_time": "15:55:56", "remaining_time": "6 days, 8:41:47", "throughput": 2721.09, "total_tokens": 156072672} {"current_steps": 864, "total_steps": 9134, "loss": 0.7572, "learning_rate": 4.8904236418054395e-05, "epoch": 0.0945838692903473, "percentage": 9.46, "elapsed_time": "15:57:01", "remaining_time": "6 days, 8:40:29", "throughput": 2720.9, "total_tokens": 156239552} {"current_steps": 865, "total_steps": 9134, "loss": 0.6268, "learning_rate": 4.890171720819979e-05, "epoch": 0.0946933413612852, "percentage": 9.47, "elapsed_time": "15:58:10", "remaining_time": "6 days, 8:39:47", "throughput": 2721.02, "total_tokens": 156433984} {"current_steps": 866, "total_steps": 9134, "loss": 0.8435, "learning_rate": 4.889919517081775e-05, "epoch": 0.0948028134322231, "percentage": 9.48, "elapsed_time": "15:59:14", "remaining_time": "6 days, 8:38:08", "throughput": 2720.73, "total_tokens": 156588992} {"current_steps": 867, "total_steps": 9134, "loss": 0.8546, "learning_rate": 4.889667030620659e-05, "epoch": 0.09491228550316101, "percentage": 9.49, "elapsed_time": "16:00:19", "remaining_time": "6 days, 8:36:54", "throughput": 2720.8, "total_tokens": 156771776} {"current_steps": 868, "total_steps": 9134, "loss": 0.8201, "learning_rate": 4.889414261466503e-05, "epoch": 0.0950217575740989, "percentage": 9.5, "elapsed_time": "16:01:27", "remaining_time": "6 days, 8:36:03", "throughput": 2720.65, "total_tokens": 156948512} {"current_steps": 869, "total_steps": 9134, "loss": 0.553, "learning_rate": 4.8891612096492066e-05, "epoch": 0.09513122964503681, "percentage": 9.51, "elapsed_time": "16:02:30", "remaining_time": "6 days, 8:34:21", "throughput": 2720.3, "total_tokens": 157098816} {"current_steps": 870, "total_steps": 9134, "loss": 0.5557, "learning_rate": 4.8889078751987074e-05, "epoch": 0.09524070171597471, "percentage": 9.52, "elapsed_time": "16:03:38", "remaining_time": "6 days, 8:33:31", "throughput": 2720.5, "total_tokens": 157295712} {"current_steps": 871, "total_steps": 9134, "loss": 0.7024, "learning_rate": 4.8886542581449726e-05, "epoch": 0.09535017378691261, "percentage": 9.54, "elapsed_time": "16:04:43", "remaining_time": "6 days, 8:32:05", "throughput": 2720.49, "total_tokens": 157470656} {"current_steps": 872, "total_steps": 9134, "loss": 0.7516, "learning_rate": 4.8884003585180053e-05, "epoch": 0.09545964585785052, "percentage": 9.55, "elapsed_time": "16:05:52", "remaining_time": "6 days, 8:31:28", "throughput": 2720.81, "total_tokens": 157678304} {"current_steps": 873, "total_steps": 9134, "loss": 0.7469, "learning_rate": 4.888146176347842e-05, "epoch": 0.09556911792878842, "percentage": 9.56, "elapsed_time": "16:06:57", "remaining_time": "6 days, 8:30:04", "throughput": 2720.79, "total_tokens": 157853024} {"current_steps": 874, "total_steps": 9134, "loss": 0.7961, "learning_rate": 4.8878917116645514e-05, "epoch": 0.09567858999972632, "percentage": 9.57, "elapsed_time": "16:08:03", "remaining_time": "6 days, 8:28:56", "throughput": 2720.72, "total_tokens": 158029088} {"current_steps": 875, "total_steps": 9134, "loss": 0.9732, "learning_rate": 4.887636964498236e-05, "epoch": 0.09578806207066422, "percentage": 9.58, "elapsed_time": "16:09:08", "remaining_time": "6 days, 8:27:37", "throughput": 2720.64, "total_tokens": 158202016} {"current_steps": 876, "total_steps": 9134, "loss": 0.605, "learning_rate": 4.887381934879032e-05, "epoch": 0.09589753414160213, "percentage": 9.59, "elapsed_time": "16:10:09", "remaining_time": "6 days, 8:25:41", "throughput": 2720.45, "total_tokens": 158357248} {"current_steps": 877, "total_steps": 9134, "loss": 0.624, "learning_rate": 4.887126622837109e-05, "epoch": 0.09600700621254002, "percentage": 9.6, "elapsed_time": "16:11:17", "remaining_time": "6 days, 8:24:45", "throughput": 2720.72, "total_tokens": 158556384} {"current_steps": 878, "total_steps": 9134, "loss": 0.7061, "learning_rate": 4.88687102840267e-05, "epoch": 0.09611647828347793, "percentage": 9.61, "elapsed_time": "16:12:20", "remaining_time": "6 days, 8:23:04", "throughput": 2720.27, "total_tokens": 158700864} {"current_steps": 879, "total_steps": 9134, "loss": 0.8227, "learning_rate": 4.886615151605951e-05, "epoch": 0.09622595035441583, "percentage": 9.62, "elapsed_time": "16:13:23", "remaining_time": "6 days, 8:21:31", "throughput": 2720.2, "total_tokens": 158870432} {"current_steps": 880, "total_steps": 9134, "loss": 0.738, "learning_rate": 4.886358992477222e-05, "epoch": 0.09633542242535373, "percentage": 9.63, "elapsed_time": "16:14:33", "remaining_time": "6 days, 8:20:53", "throughput": 2720.37, "total_tokens": 159068896} {"current_steps": 881, "total_steps": 9134, "loss": 0.6958, "learning_rate": 4.886102551046786e-05, "epoch": 0.09644489449629164, "percentage": 9.65, "elapsed_time": "16:15:39", "remaining_time": "6 days, 8:19:40", "throughput": 2720.27, "total_tokens": 159242048} {"current_steps": 882, "total_steps": 9134, "loss": 0.5828, "learning_rate": 4.8858458273449806e-05, "epoch": 0.09655436656722953, "percentage": 9.66, "elapsed_time": "16:16:45", "remaining_time": "6 days, 8:18:29", "throughput": 2720.11, "total_tokens": 159412064} {"current_steps": 883, "total_steps": 9134, "loss": 0.898, "learning_rate": 4.885588821402174e-05, "epoch": 0.09666383863816744, "percentage": 9.67, "elapsed_time": "16:17:54", "remaining_time": "6 days, 8:17:46", "throughput": 2720.54, "total_tokens": 159625312} {"current_steps": 884, "total_steps": 9134, "loss": 0.8381, "learning_rate": 4.88533153324877e-05, "epoch": 0.09677331070910535, "percentage": 9.68, "elapsed_time": "16:19:01", "remaining_time": "6 days, 8:16:48", "throughput": 2720.63, "total_tokens": 159813472} {"current_steps": 885, "total_steps": 9134, "loss": 0.555, "learning_rate": 4.885073962915207e-05, "epoch": 0.09688278278004324, "percentage": 9.69, "elapsed_time": "16:20:09", "remaining_time": "6 days, 8:15:54", "throughput": 2720.81, "total_tokens": 160008800} {"current_steps": 886, "total_steps": 9134, "loss": 0.6893, "learning_rate": 4.8848161104319525e-05, "epoch": 0.09699225485098115, "percentage": 9.7, "elapsed_time": "16:21:15", "remaining_time": "6 days, 8:14:45", "throughput": 2720.88, "total_tokens": 160192704} {"current_steps": 887, "total_steps": 9134, "loss": 0.6842, "learning_rate": 4.8845579758295114e-05, "epoch": 0.09710172692191904, "percentage": 9.71, "elapsed_time": "16:22:18", "remaining_time": "6 days, 8:13:12", "throughput": 2720.6, "total_tokens": 160349280} {"current_steps": 888, "total_steps": 9134, "loss": 0.8236, "learning_rate": 4.88429955913842e-05, "epoch": 0.09721119899285695, "percentage": 9.72, "elapsed_time": "16:23:27", "remaining_time": "6 days, 8:12:27", "throughput": 2721.22, "total_tokens": 160572608} {"current_steps": 889, "total_steps": 9134, "loss": 0.7238, "learning_rate": 4.8840408603892495e-05, "epoch": 0.09732067106379486, "percentage": 9.73, "elapsed_time": "16:24:30", "remaining_time": "6 days, 8:10:49", "throughput": 2721.0, "total_tokens": 160731648} {"current_steps": 890, "total_steps": 9134, "loss": 0.7868, "learning_rate": 4.883781879612602e-05, "epoch": 0.09743014313473275, "percentage": 9.74, "elapsed_time": "16:25:36", "remaining_time": "6 days, 8:09:37", "throughput": 2721.31, "total_tokens": 160928992} {"current_steps": 891, "total_steps": 9134, "loss": 0.8868, "learning_rate": 4.883522616839116e-05, "epoch": 0.09753961520567066, "percentage": 9.75, "elapsed_time": "16:26:45", "remaining_time": "6 days, 8:08:52", "throughput": 2721.35, "total_tokens": 161118720} {"current_steps": 892, "total_steps": 9134, "loss": 0.6829, "learning_rate": 4.88326307209946e-05, "epoch": 0.09764908727660855, "percentage": 9.77, "elapsed_time": "16:27:49", "remaining_time": "6 days, 8:07:25", "throughput": 2721.27, "total_tokens": 161288736} {"current_steps": 893, "total_steps": 9134, "loss": 0.6839, "learning_rate": 4.883003245424339e-05, "epoch": 0.09775855934754646, "percentage": 9.78, "elapsed_time": "16:28:54", "remaining_time": "6 days, 8:06:02", "throughput": 2721.47, "total_tokens": 161476224} {"current_steps": 894, "total_steps": 9134, "loss": 0.879, "learning_rate": 4.8827431368444896e-05, "epoch": 0.09786803141848435, "percentage": 9.79, "elapsed_time": "16:30:03", "remaining_time": "6 days, 8:05:20", "throughput": 2721.77, "total_tokens": 161682080} {"current_steps": 895, "total_steps": 9134, "loss": 0.9603, "learning_rate": 4.882482746390682e-05, "epoch": 0.09797750348942226, "percentage": 9.8, "elapsed_time": "16:31:09", "remaining_time": "6 days, 8:04:09", "throughput": 2721.52, "total_tokens": 161846720} {"current_steps": 896, "total_steps": 9134, "loss": 0.6528, "learning_rate": 4.8822220740937195e-05, "epoch": 0.09808697556036017, "percentage": 9.81, "elapsed_time": "16:32:06", "remaining_time": "6 days, 8:01:35", "throughput": 2720.8, "total_tokens": 161958720} {"current_steps": 897, "total_steps": 9134, "loss": 0.7086, "learning_rate": 4.8819611199844406e-05, "epoch": 0.09819644763129806, "percentage": 9.82, "elapsed_time": "16:33:14", "remaining_time": "6 days, 8:00:50", "throughput": 2721.25, "total_tokens": 162172416} {"current_steps": 898, "total_steps": 9134, "loss": 0.8896, "learning_rate": 4.881699884093715e-05, "epoch": 0.09830591970223597, "percentage": 9.83, "elapsed_time": "16:34:22", "remaining_time": "6 days, 7:59:52", "throughput": 2721.33, "total_tokens": 162360800} {"current_steps": 899, "total_steps": 9134, "loss": 0.7655, "learning_rate": 4.881438366452446e-05, "epoch": 0.09841539177317386, "percentage": 9.84, "elapsed_time": "16:35:24", "remaining_time": "6 days, 7:58:09", "throughput": 2721.24, "total_tokens": 162525216} {"current_steps": 900, "total_steps": 9134, "loss": 0.9436, "learning_rate": 4.88117656709157e-05, "epoch": 0.09852486384411177, "percentage": 9.85, "elapsed_time": "16:36:31", "remaining_time": "6 days, 7:57:06", "throughput": 2721.41, "total_tokens": 162717184} {"current_steps": 901, "total_steps": 9134, "loss": 0.6904, "learning_rate": 4.880914486042059e-05, "epoch": 0.09863433591504968, "percentage": 9.86, "elapsed_time": "16:37:38", "remaining_time": "6 days, 7:56:05", "throughput": 2721.48, "total_tokens": 162904000} {"current_steps": 902, "total_steps": 9134, "loss": 0.8643, "learning_rate": 4.8806521233349146e-05, "epoch": 0.09874380798598757, "percentage": 9.88, "elapsed_time": "16:38:47", "remaining_time": "6 days, 7:55:19", "throughput": 2721.57, "total_tokens": 163096416} {"current_steps": 903, "total_steps": 9134, "loss": 0.7828, "learning_rate": 4.880389479001176e-05, "epoch": 0.09885328005692548, "percentage": 9.89, "elapsed_time": "16:39:51", "remaining_time": "6 days, 7:53:57", "throughput": 2721.65, "total_tokens": 163276960} {"current_steps": 904, "total_steps": 9134, "loss": 0.8228, "learning_rate": 4.880126553071912e-05, "epoch": 0.09896275212786337, "percentage": 9.9, "elapsed_time": "16:41:01", "remaining_time": "6 days, 7:53:17", "throughput": 2722.15, "total_tokens": 163496256} {"current_steps": 905, "total_steps": 9134, "loss": 0.752, "learning_rate": 4.879863345578227e-05, "epoch": 0.09907222419880128, "percentage": 9.91, "elapsed_time": "16:42:07", "remaining_time": "6 days, 7:52:05", "throughput": 2721.8, "total_tokens": 163654176} {"current_steps": 906, "total_steps": 9134, "loss": 0.8627, "learning_rate": 4.879599856551258e-05, "epoch": 0.09918169626973919, "percentage": 9.92, "elapsed_time": "16:43:14", "remaining_time": "6 days, 7:51:05", "throughput": 2721.76, "total_tokens": 163834496} {"current_steps": 907, "total_steps": 9134, "loss": 0.6578, "learning_rate": 4.879336086022175e-05, "epoch": 0.09929116834067708, "percentage": 9.93, "elapsed_time": "16:44:20", "remaining_time": "6 days, 7:49:52", "throughput": 2721.65, "total_tokens": 164006528} {"current_steps": 908, "total_steps": 9134, "loss": 0.8276, "learning_rate": 4.879072034022182e-05, "epoch": 0.09940064041161499, "percentage": 9.94, "elapsed_time": "16:45:29", "remaining_time": "6 days, 7:49:09", "throughput": 2721.99, "total_tokens": 164215520} {"current_steps": 909, "total_steps": 9134, "loss": 0.7947, "learning_rate": 4.8788077005825146e-05, "epoch": 0.09951011248255288, "percentage": 9.95, "elapsed_time": "16:46:38", "remaining_time": "6 days, 7:48:27", "throughput": 2721.85, "total_tokens": 164395168} {"current_steps": 910, "total_steps": 9134, "loss": 0.6657, "learning_rate": 4.878543085734444e-05, "epoch": 0.09961958455349079, "percentage": 9.96, "elapsed_time": "16:47:41", "remaining_time": "6 days, 7:46:49", "throughput": 2721.86, "total_tokens": 164566528} {"current_steps": 911, "total_steps": 9134, "loss": 0.9609, "learning_rate": 4.8782781895092734e-05, "epoch": 0.09972905662442869, "percentage": 9.97, "elapsed_time": "16:48:50", "remaining_time": "6 days, 7:46:08", "throughput": 2721.98, "total_tokens": 164762528} {"current_steps": 912, "total_steps": 9134, "loss": 0.6463, "learning_rate": 4.878013011938339e-05, "epoch": 0.0998385286953666, "percentage": 9.98, "elapsed_time": "16:49:57", "remaining_time": "6 days, 7:45:05", "throughput": 2721.8, "total_tokens": 164933664} {"current_steps": 913, "total_steps": 9134, "loss": 0.8373, "learning_rate": 4.877747553053012e-05, "epoch": 0.0999480007663045, "percentage": 10.0, "elapsed_time": "16:51:05", "remaining_time": "6 days, 7:44:12", "throughput": 2721.9, "total_tokens": 165124512} {"current_steps": 914, "total_steps": 9134, "loss": 0.7064, "learning_rate": 4.877481812884695e-05, "epoch": 0.1000574728372424, "percentage": 10.01, "elapsed_time": "16:52:14", "remaining_time": "6 days, 7:43:32", "throughput": 2721.87, "total_tokens": 165311776} {"current_steps": 915, "total_steps": 9134, "loss": 0.8218, "learning_rate": 4.877215791464824e-05, "epoch": 0.1001669449081803, "percentage": 10.02, "elapsed_time": "16:53:18", "remaining_time": "6 days, 7:42:03", "throughput": 2721.84, "total_tokens": 165483584} {"current_steps": 916, "total_steps": 9134, "loss": 0.7181, "learning_rate": 4.876949488824869e-05, "epoch": 0.1002764169791182, "percentage": 10.03, "elapsed_time": "16:54:20", "remaining_time": "6 days, 7:40:18", "throughput": 2721.63, "total_tokens": 165640384} {"current_steps": 917, "total_steps": 9134, "loss": 0.7043, "learning_rate": 4.8766829049963344e-05, "epoch": 0.1003858890500561, "percentage": 10.04, "elapsed_time": "16:55:30", "remaining_time": "6 days, 7:39:39", "throughput": 2721.99, "total_tokens": 165851168} {"current_steps": 918, "total_steps": 9134, "loss": 0.7461, "learning_rate": 4.876416040010755e-05, "epoch": 0.10049536112099401, "percentage": 10.05, "elapsed_time": "16:56:37", "remaining_time": "6 days, 7:38:43", "throughput": 2722.08, "total_tokens": 166040672} {"current_steps": 919, "total_steps": 9134, "loss": 0.6692, "learning_rate": 4.876148893899701e-05, "epoch": 0.1006048331919319, "percentage": 10.06, "elapsed_time": "16:57:43", "remaining_time": "6 days, 7:37:27", "throughput": 2722.09, "total_tokens": 166219424} {"current_steps": 920, "total_steps": 9134, "loss": 0.8863, "learning_rate": 4.8758814666947756e-05, "epoch": 0.10071430526286981, "percentage": 10.07, "elapsed_time": "16:58:50", "remaining_time": "6 days, 7:36:27", "throughput": 2722.4, "total_tokens": 166421248} {"current_steps": 921, "total_steps": 9134, "loss": 0.7305, "learning_rate": 4.875613758427614e-05, "epoch": 0.10082377733380771, "percentage": 10.08, "elapsed_time": "16:59:57", "remaining_time": "6 days, 7:35:26", "throughput": 2722.31, "total_tokens": 166598208} {"current_steps": 922, "total_steps": 9134, "loss": 0.6228, "learning_rate": 4.875345769129887e-05, "epoch": 0.10093324940474561, "percentage": 10.09, "elapsed_time": "17:01:05", "remaining_time": "6 days, 7:34:38", "throughput": 2722.45, "total_tokens": 166793536} {"current_steps": 923, "total_steps": 9134, "loss": 0.8925, "learning_rate": 4.875077498833296e-05, "epoch": 0.10104272147568352, "percentage": 10.11, "elapsed_time": "17:02:11", "remaining_time": "6 days, 7:33:22", "throughput": 2722.43, "total_tokens": 166970496} {"current_steps": 924, "total_steps": 9134, "loss": 0.8568, "learning_rate": 4.874808947569577e-05, "epoch": 0.10115219354662142, "percentage": 10.12, "elapsed_time": "17:03:17", "remaining_time": "6 days, 7:32:12", "throughput": 2722.59, "total_tokens": 167159552} {"current_steps": 925, "total_steps": 9134, "loss": 0.624, "learning_rate": 4.8745401153704996e-05, "epoch": 0.10126166561755932, "percentage": 10.13, "elapsed_time": "17:04:22", "remaining_time": "6 days, 7:30:58", "throughput": 2722.58, "total_tokens": 167337632} {"current_steps": 926, "total_steps": 9134, "loss": 0.6356, "learning_rate": 4.874271002267866e-05, "epoch": 0.10137113768849722, "percentage": 10.14, "elapsed_time": "17:05:29", "remaining_time": "6 days, 7:29:52", "throughput": 2722.36, "total_tokens": 167505408} {"current_steps": 927, "total_steps": 9134, "loss": 0.7896, "learning_rate": 4.874001608293511e-05, "epoch": 0.10148060975943513, "percentage": 10.15, "elapsed_time": "17:06:38", "remaining_time": "6 days, 7:29:08", "throughput": 2722.6, "total_tokens": 167707456} {"current_steps": 928, "total_steps": 9134, "loss": 0.7985, "learning_rate": 4.873731933479305e-05, "epoch": 0.10159008183037303, "percentage": 10.16, "elapsed_time": "17:07:44", "remaining_time": "6 days, 7:27:55", "throughput": 2722.59, "total_tokens": 167886208} {"current_steps": 929, "total_steps": 9134, "loss": 0.8132, "learning_rate": 4.873461977857149e-05, "epoch": 0.10169955390131093, "percentage": 10.17, "elapsed_time": "17:08:46", "remaining_time": "6 days, 7:26:16", "throughput": 2722.08, "total_tokens": 168025536} {"current_steps": 930, "total_steps": 9134, "loss": 0.7088, "learning_rate": 4.8731917414589776e-05, "epoch": 0.10180902597224883, "percentage": 10.18, "elapsed_time": "17:09:53", "remaining_time": "6 days, 7:25:13", "throughput": 2722.11, "total_tokens": 168209216} {"current_steps": 931, "total_steps": 9134, "loss": 0.5851, "learning_rate": 4.872921224316761e-05, "epoch": 0.10191849804318673, "percentage": 10.19, "elapsed_time": "17:11:02", "remaining_time": "6 days, 7:24:24", "throughput": 2722.04, "total_tokens": 168390880} {"current_steps": 932, "total_steps": 9134, "loss": 0.6904, "learning_rate": 4.872650426462499e-05, "epoch": 0.10202797011412464, "percentage": 10.2, "elapsed_time": "17:12:10", "remaining_time": "6 days, 7:23:38", "throughput": 2722.23, "total_tokens": 168590240} {"current_steps": 933, "total_steps": 9134, "loss": 0.7619, "learning_rate": 4.8723793479282274e-05, "epoch": 0.10213744218506253, "percentage": 10.21, "elapsed_time": "17:13:19", "remaining_time": "6 days, 7:22:53", "throughput": 2722.53, "total_tokens": 168796544} {"current_steps": 934, "total_steps": 9134, "loss": 0.6939, "learning_rate": 4.872107988746014e-05, "epoch": 0.10224691425600044, "percentage": 10.23, "elapsed_time": "17:14:23", "remaining_time": "6 days, 7:21:24", "throughput": 2722.31, "total_tokens": 168956704} {"current_steps": 935, "total_steps": 9134, "loss": 0.6586, "learning_rate": 4.871836348947961e-05, "epoch": 0.10235638632693835, "percentage": 10.24, "elapsed_time": "17:15:27", "remaining_time": "6 days, 7:19:52", "throughput": 2722.38, "total_tokens": 169133664} {"current_steps": 936, "total_steps": 9134, "loss": 0.579, "learning_rate": 4.871564428566201e-05, "epoch": 0.10246585839787624, "percentage": 10.25, "elapsed_time": "17:16:35", "remaining_time": "6 days, 7:18:59", "throughput": 2722.56, "total_tokens": 169330112} {"current_steps": 937, "total_steps": 9134, "loss": 0.6513, "learning_rate": 4.8712922276329035e-05, "epoch": 0.10257533046881415, "percentage": 10.26, "elapsed_time": "17:17:41", "remaining_time": "6 days, 7:17:52", "throughput": 2722.71, "total_tokens": 169520512} {"current_steps": 938, "total_steps": 9134, "loss": 0.7276, "learning_rate": 4.8710197461802686e-05, "epoch": 0.10268480253975204, "percentage": 10.27, "elapsed_time": "17:18:48", "remaining_time": "6 days, 7:16:49", "throughput": 2722.91, "total_tokens": 169714272} {"current_steps": 939, "total_steps": 9134, "loss": 0.5897, "learning_rate": 4.8707469842405304e-05, "epoch": 0.10279427461068995, "percentage": 10.28, "elapsed_time": "17:19:54", "remaining_time": "6 days, 7:15:43", "throughput": 2722.74, "total_tokens": 169885408} {"current_steps": 940, "total_steps": 9134, "loss": 0.7027, "learning_rate": 4.870473941845955e-05, "epoch": 0.10290374668162786, "percentage": 10.29, "elapsed_time": "17:21:01", "remaining_time": "6 days, 7:14:35", "throughput": 2722.48, "total_tokens": 170049376} {"current_steps": 941, "total_steps": 9134, "loss": 0.6164, "learning_rate": 4.870200619028845e-05, "epoch": 0.10301321875256575, "percentage": 10.3, "elapsed_time": "17:22:08", "remaining_time": "6 days, 7:13:37", "throughput": 2722.67, "total_tokens": 170244928} {"current_steps": 942, "total_steps": 9134, "loss": 0.9216, "learning_rate": 4.869927015821533e-05, "epoch": 0.10312269082350366, "percentage": 10.31, "elapsed_time": "17:23:09", "remaining_time": "6 days, 7:11:44", "throughput": 2722.1, "total_tokens": 170375296} {"current_steps": 943, "total_steps": 9134, "loss": 0.6821, "learning_rate": 4.8696531322563857e-05, "epoch": 0.10323216289444155, "percentage": 10.32, "elapsed_time": "17:24:18", "remaining_time": "6 days, 7:11:00", "throughput": 2722.23, "total_tokens": 170571744} {"current_steps": 944, "total_steps": 9134, "loss": 0.6696, "learning_rate": 4.869378968365802e-05, "epoch": 0.10334163496537946, "percentage": 10.34, "elapsed_time": "17:25:21", "remaining_time": "6 days, 7:09:18", "throughput": 2721.71, "total_tokens": 170708384} {"current_steps": 945, "total_steps": 9134, "loss": 0.7371, "learning_rate": 4.869104524182216e-05, "epoch": 0.10345110703631737, "percentage": 10.35, "elapsed_time": "17:26:30", "remaining_time": "6 days, 7:08:34", "throughput": 2721.81, "total_tokens": 170902816} {"current_steps": 946, "total_steps": 9134, "loss": 0.6522, "learning_rate": 4.868829799738094e-05, "epoch": 0.10356057910725526, "percentage": 10.36, "elapsed_time": "17:27:35", "remaining_time": "6 days, 7:07:17", "throughput": 2721.61, "total_tokens": 171067680} {"current_steps": 947, "total_steps": 9134, "loss": 0.6111, "learning_rate": 4.8685547950659346e-05, "epoch": 0.10367005117819317, "percentage": 10.37, "elapsed_time": "17:28:37", "remaining_time": "6 days, 7:05:36", "throughput": 2721.43, "total_tokens": 171226272} {"current_steps": 948, "total_steps": 9134, "loss": 0.5951, "learning_rate": 4.868279510198271e-05, "epoch": 0.10377952324913106, "percentage": 10.38, "elapsed_time": "17:29:43", "remaining_time": "6 days, 7:04:27", "throughput": 2721.46, "total_tokens": 171408160} {"current_steps": 949, "total_steps": 9134, "loss": 0.7885, "learning_rate": 4.8680039451676695e-05, "epoch": 0.10388899532006897, "percentage": 10.39, "elapsed_time": "17:30:53", "remaining_time": "6 days, 7:03:46", "throughput": 2721.33, "total_tokens": 171588704} {"current_steps": 950, "total_steps": 9134, "loss": 0.6358, "learning_rate": 4.867728100006728e-05, "epoch": 0.10399846739100686, "percentage": 10.4, "elapsed_time": "17:32:02", "remaining_time": "6 days, 7:03:02", "throughput": 2721.3, "total_tokens": 171774848} {"current_steps": 951, "total_steps": 9134, "loss": 0.7533, "learning_rate": 4.8674519747480774e-05, "epoch": 0.10410793946194477, "percentage": 10.41, "elapsed_time": "17:33:11", "remaining_time": "6 days, 7:02:19", "throughput": 2721.41, "total_tokens": 171970400} {"current_steps": 952, "total_steps": 9134, "loss": 0.6149, "learning_rate": 4.867175569424385e-05, "epoch": 0.10421741153288268, "percentage": 10.42, "elapsed_time": "17:34:13", "remaining_time": "6 days, 7:00:36", "throughput": 2721.06, "total_tokens": 172117120} {"current_steps": 953, "total_steps": 9134, "loss": 0.715, "learning_rate": 4.866898884068348e-05, "epoch": 0.10432688360382057, "percentage": 10.43, "elapsed_time": "17:35:14", "remaining_time": "6 days, 6:58:38", "throughput": 2720.84, "total_tokens": 172268096} {"current_steps": 954, "total_steps": 9134, "loss": 0.7553, "learning_rate": 4.866621918712697e-05, "epoch": 0.10443635567475848, "percentage": 10.44, "elapsed_time": "17:36:15", "remaining_time": "6 days, 6:56:50", "throughput": 2720.53, "total_tokens": 172415488} {"current_steps": 955, "total_steps": 9134, "loss": 0.6576, "learning_rate": 4.866344673390198e-05, "epoch": 0.10454582774569637, "percentage": 10.46, "elapsed_time": "17:37:24", "remaining_time": "6 days, 6:56:04", "throughput": 2720.88, "total_tokens": 172624928} {"current_steps": 956, "total_steps": 9134, "loss": 0.6706, "learning_rate": 4.8660671481336475e-05, "epoch": 0.10465529981663428, "percentage": 10.47, "elapsed_time": "17:38:32", "remaining_time": "6 days, 6:55:13", "throughput": 2720.9, "total_tokens": 172812192} {"current_steps": 957, "total_steps": 9134, "loss": 0.6402, "learning_rate": 4.865789342975877e-05, "epoch": 0.10476477188757219, "percentage": 10.48, "elapsed_time": "17:39:41", "remaining_time": "6 days, 6:54:28", "throughput": 2721.21, "total_tokens": 173019168} {"current_steps": 958, "total_steps": 9134, "loss": 0.8545, "learning_rate": 4.865511257949749e-05, "epoch": 0.10487424395851008, "percentage": 10.49, "elapsed_time": "17:40:50", "remaining_time": "6 days, 6:53:45", "throughput": 2721.45, "total_tokens": 173223008} {"current_steps": 959, "total_steps": 9134, "loss": 0.7539, "learning_rate": 4.865232893088162e-05, "epoch": 0.10498371602944799, "percentage": 10.5, "elapsed_time": "17:41:57", "remaining_time": "6 days, 6:52:37", "throughput": 2721.68, "total_tokens": 173417888} {"current_steps": 960, "total_steps": 9134, "loss": 0.6802, "learning_rate": 4.864954248424045e-05, "epoch": 0.10509318810038588, "percentage": 10.51, "elapsed_time": "17:43:07", "remaining_time": "6 days, 6:51:59", "throughput": 2721.96, "total_tokens": 173625536} {"current_steps": 961, "total_steps": 9134, "loss": 0.7212, "learning_rate": 4.864675323990361e-05, "epoch": 0.10520266017132379, "percentage": 10.52, "elapsed_time": "17:44:16", "remaining_time": "6 days, 6:51:17", "throughput": 2721.99, "total_tokens": 173815712} {"current_steps": 962, "total_steps": 9134, "loss": 0.6268, "learning_rate": 4.864396119820108e-05, "epoch": 0.1053121322422617, "percentage": 10.53, "elapsed_time": "17:45:22", "remaining_time": "6 days, 6:50:07", "throughput": 2722.07, "total_tokens": 174001184} {"current_steps": 963, "total_steps": 9134, "loss": 0.6949, "learning_rate": 4.864116635946313e-05, "epoch": 0.1054216043131996, "percentage": 10.54, "elapsed_time": "17:46:31", "remaining_time": "6 days, 6:49:25", "throughput": 2722.54, "total_tokens": 174220032} {"current_steps": 964, "total_steps": 9134, "loss": 0.5744, "learning_rate": 4.863836872402039e-05, "epoch": 0.1055310763841375, "percentage": 10.55, "elapsed_time": "17:47:36", "remaining_time": "6 days, 6:48:06", "throughput": 2722.63, "total_tokens": 174402368} {"current_steps": 965, "total_steps": 9134, "loss": 0.9442, "learning_rate": 4.863556829220383e-05, "epoch": 0.1056405484550754, "percentage": 10.56, "elapsed_time": "17:48:45", "remaining_time": "6 days, 6:47:22", "throughput": 2722.67, "total_tokens": 174593440} {"current_steps": 966, "total_steps": 9134, "loss": 0.6836, "learning_rate": 4.863276506434471e-05, "epoch": 0.1057500205260133, "percentage": 10.58, "elapsed_time": "17:49:48", "remaining_time": "6 days, 6:45:46", "throughput": 2722.42, "total_tokens": 174748224} {"current_steps": 967, "total_steps": 9134, "loss": 0.7871, "learning_rate": 4.862995904077468e-05, "epoch": 0.1058594925969512, "percentage": 10.59, "elapsed_time": "17:50:54", "remaining_time": "6 days, 6:44:34", "throughput": 2722.22, "total_tokens": 174914432} {"current_steps": 968, "total_steps": 9134, "loss": 0.7583, "learning_rate": 4.8627150221825654e-05, "epoch": 0.1059689646678891, "percentage": 10.6, "elapsed_time": "17:51:57", "remaining_time": "6 days, 6:42:57", "throughput": 2721.92, "total_tokens": 175066752} {"current_steps": 969, "total_steps": 9134, "loss": 0.6804, "learning_rate": 4.862433860782993e-05, "epoch": 0.10607843673882701, "percentage": 10.61, "elapsed_time": "17:53:06", "remaining_time": "6 days, 6:42:13", "throughput": 2721.93, "total_tokens": 175255584} {"current_steps": 970, "total_steps": 9134, "loss": 0.7711, "learning_rate": 4.8621524199120106e-05, "epoch": 0.1061879088097649, "percentage": 10.62, "elapsed_time": "17:54:12", "remaining_time": "6 days, 6:41:05", "throughput": 2722.2, "total_tokens": 175453152} {"current_steps": 971, "total_steps": 9134, "loss": 0.7371, "learning_rate": 4.861870699602913e-05, "epoch": 0.10629738088070281, "percentage": 10.63, "elapsed_time": "17:55:21", "remaining_time": "6 days, 6:40:21", "throughput": 2722.24, "total_tokens": 175644000} {"current_steps": 972, "total_steps": 9134, "loss": 0.8159, "learning_rate": 4.8615886998890266e-05, "epoch": 0.1064068529516407, "percentage": 10.64, "elapsed_time": "17:56:30", "remaining_time": "6 days, 6:39:34", "throughput": 2722.23, "total_tokens": 175830592} {"current_steps": 973, "total_steps": 9134, "loss": 0.6739, "learning_rate": 4.861306420803712e-05, "epoch": 0.10651632502257861, "percentage": 10.65, "elapsed_time": "17:57:39", "remaining_time": "6 days, 6:38:52", "throughput": 2722.61, "total_tokens": 176043616} {"current_steps": 974, "total_steps": 9134, "loss": 0.8644, "learning_rate": 4.861023862380361e-05, "epoch": 0.10662579709351652, "percentage": 10.66, "elapsed_time": "17:58:49", "remaining_time": "6 days, 6:38:10", "throughput": 2722.95, "total_tokens": 176254624} {"current_steps": 975, "total_steps": 9134, "loss": 0.7162, "learning_rate": 4.860741024652401e-05, "epoch": 0.10673526916445442, "percentage": 10.67, "elapsed_time": "17:59:55", "remaining_time": "6 days, 6:37:04", "throughput": 2722.75, "total_tokens": 176423072} {"current_steps": 976, "total_steps": 9134, "loss": 0.9685, "learning_rate": 4.860457907653291e-05, "epoch": 0.10684474123539232, "percentage": 10.69, "elapsed_time": "18:01:05", "remaining_time": "6 days, 6:36:22", "throughput": 2723.15, "total_tokens": 176637440} {"current_steps": 977, "total_steps": 9134, "loss": 0.7168, "learning_rate": 4.860174511416523e-05, "epoch": 0.10695421330633022, "percentage": 10.7, "elapsed_time": "18:02:10", "remaining_time": "6 days, 6:35:09", "throughput": 2723.09, "total_tokens": 176812384} {"current_steps": 978, "total_steps": 9134, "loss": 0.7853, "learning_rate": 4.8598908359756226e-05, "epoch": 0.10706368537726813, "percentage": 10.71, "elapsed_time": "18:03:18", "remaining_time": "6 days, 6:34:11", "throughput": 2723.17, "total_tokens": 177001664} {"current_steps": 979, "total_steps": 9134, "loss": 0.7571, "learning_rate": 4.859606881364146e-05, "epoch": 0.10717315744820603, "percentage": 10.72, "elapsed_time": "18:04:23", "remaining_time": "6 days, 6:32:53", "throughput": 2722.78, "total_tokens": 177153536} {"current_steps": 980, "total_steps": 9134, "loss": 0.6039, "learning_rate": 4.859322647615687e-05, "epoch": 0.10728262951914393, "percentage": 10.73, "elapsed_time": "18:05:31", "remaining_time": "6 days, 6:31:59", "throughput": 2722.75, "total_tokens": 177336544} {"current_steps": 981, "total_steps": 9134, "loss": 0.8699, "learning_rate": 4.85903813476387e-05, "epoch": 0.10739210159008183, "percentage": 10.74, "elapsed_time": "18:06:40", "remaining_time": "6 days, 6:31:15", "throughput": 2722.62, "total_tokens": 177516640} {"current_steps": 982, "total_steps": 9134, "loss": 0.7725, "learning_rate": 4.8587533428423504e-05, "epoch": 0.10750157366101973, "percentage": 10.75, "elapsed_time": "18:07:43", "remaining_time": "6 days, 6:29:39", "throughput": 2722.37, "total_tokens": 177671424} {"current_steps": 983, "total_steps": 9134, "loss": 0.818, "learning_rate": 4.85846827188482e-05, "epoch": 0.10761104573195764, "percentage": 10.76, "elapsed_time": "18:08:52", "remaining_time": "6 days, 6:28:54", "throughput": 2722.65, "total_tokens": 177877728} {"current_steps": 984, "total_steps": 9134, "loss": 0.6957, "learning_rate": 4.858182921925001e-05, "epoch": 0.10772051780289553, "percentage": 10.77, "elapsed_time": "18:10:01", "remaining_time": "6 days, 6:28:09", "throughput": 2722.66, "total_tokens": 178066560} {"current_steps": 985, "total_steps": 9134, "loss": 0.8008, "learning_rate": 4.857897292996651e-05, "epoch": 0.10782998987383344, "percentage": 10.78, "elapsed_time": "18:11:07", "remaining_time": "6 days, 6:26:56", "throughput": 2722.79, "total_tokens": 178253376} {"current_steps": 986, "total_steps": 9134, "loss": 0.6187, "learning_rate": 4.857611385133559e-05, "epoch": 0.10793946194477134, "percentage": 10.79, "elapsed_time": "18:12:14", "remaining_time": "6 days, 6:25:59", "throughput": 2722.75, "total_tokens": 178434816} {"current_steps": 987, "total_steps": 9134, "loss": 0.7601, "learning_rate": 4.857325198369546e-05, "epoch": 0.10804893401570924, "percentage": 10.81, "elapsed_time": "18:13:21", "remaining_time": "6 days, 6:24:51", "throughput": 2723.05, "total_tokens": 178634848} {"current_steps": 988, "total_steps": 9134, "loss": 0.8135, "learning_rate": 4.8570387327384695e-05, "epoch": 0.10815840608664715, "percentage": 10.82, "elapsed_time": "18:14:28", "remaining_time": "6 days, 6:23:50", "throughput": 2723.07, "total_tokens": 178818752} {"current_steps": 989, "total_steps": 9134, "loss": 0.7095, "learning_rate": 4.856751988274216e-05, "epoch": 0.10826787815758504, "percentage": 10.83, "elapsed_time": "18:15:35", "remaining_time": "6 days, 6:22:49", "throughput": 2723.34, "total_tokens": 179019680} {"current_steps": 990, "total_steps": 9134, "loss": 0.6195, "learning_rate": 4.8564649650107084e-05, "epoch": 0.10837735022852295, "percentage": 10.84, "elapsed_time": "18:16:40", "remaining_time": "6 days, 6:21:34", "throughput": 2723.06, "total_tokens": 179179840} {"current_steps": 991, "total_steps": 9134, "loss": 0.6993, "learning_rate": 4.8561776629819e-05, "epoch": 0.10848682229946086, "percentage": 10.85, "elapsed_time": "18:17:47", "remaining_time": "6 days, 6:20:30", "throughput": 2722.9, "total_tokens": 179350528} {"current_steps": 992, "total_steps": 9134, "loss": 0.5838, "learning_rate": 4.855890082221778e-05, "epoch": 0.10859629437039875, "percentage": 10.86, "elapsed_time": "18:18:52", "remaining_time": "6 days, 6:19:15", "throughput": 2722.84, "total_tokens": 179524576} {"current_steps": 993, "total_steps": 9134, "loss": 0.7074, "learning_rate": 4.8556022227643636e-05, "epoch": 0.10870576644133666, "percentage": 10.87, "elapsed_time": "18:20:01", "remaining_time": "6 days, 6:18:27", "throughput": 2723.14, "total_tokens": 179731776} {"current_steps": 994, "total_steps": 9134, "loss": 0.7154, "learning_rate": 4.8553140846437094e-05, "epoch": 0.10881523851227455, "percentage": 10.88, "elapsed_time": "18:21:02", "remaining_time": "6 days, 6:16:31", "throughput": 2722.75, "total_tokens": 179870880} {"current_steps": 995, "total_steps": 9134, "loss": 0.7043, "learning_rate": 4.855025667893901e-05, "epoch": 0.10892471058321246, "percentage": 10.89, "elapsed_time": "18:22:10", "remaining_time": "6 days, 6:15:43", "throughput": 2722.54, "total_tokens": 180044032} {"current_steps": 996, "total_steps": 9134, "loss": 0.9028, "learning_rate": 4.854736972549058e-05, "epoch": 0.10903418265415037, "percentage": 10.9, "elapsed_time": "18:23:17", "remaining_time": "6 days, 6:14:38", "throughput": 2722.38, "total_tokens": 180214720} {"current_steps": 997, "total_steps": 9134, "loss": 0.8202, "learning_rate": 4.854447998643333e-05, "epoch": 0.10914365472508826, "percentage": 10.92, "elapsed_time": "18:24:21", "remaining_time": "6 days, 6:13:14", "throughput": 2722.43, "total_tokens": 180392800} {"current_steps": 998, "total_steps": 9134, "loss": 0.8383, "learning_rate": 4.8541587462109105e-05, "epoch": 0.10925312679602617, "percentage": 10.93, "elapsed_time": "18:25:24", "remaining_time": "6 days, 6:11:41", "throughput": 2722.5, "total_tokens": 180569312} {"current_steps": 999, "total_steps": 9134, "loss": 0.8878, "learning_rate": 4.8538692152860094e-05, "epoch": 0.10936259886696406, "percentage": 10.94, "elapsed_time": "18:26:31", "remaining_time": "6 days, 6:10:38", "throughput": 2722.65, "total_tokens": 180761952} {"current_steps": 1000, "total_steps": 9134, "loss": 0.6891, "learning_rate": 4.853579405902879e-05, "epoch": 0.10947207093790197, "percentage": 10.95, "elapsed_time": "18:27:37", "remaining_time": "6 days, 6:09:26", "throughput": 2722.77, "total_tokens": 180949216} {"current_steps": 1001, "total_steps": 9134, "loss": 0.6913, "learning_rate": 4.853289318095805e-05, "epoch": 0.10958154300883986, "percentage": 10.96, "elapsed_time": "18:28:42", "remaining_time": "6 days, 6:08:04", "throughput": 2722.56, "total_tokens": 181110944} {"current_steps": 1002, "total_steps": 9134, "loss": 0.6892, "learning_rate": 4.8529989518991033e-05, "epoch": 0.10969101507977777, "percentage": 10.97, "elapsed_time": "18:29:46", "remaining_time": "6 days, 6:06:40", "throughput": 2722.46, "total_tokens": 181279392} {"current_steps": 1003, "total_steps": 9134, "loss": 0.7772, "learning_rate": 4.8527083073471236e-05, "epoch": 0.10980048715071568, "percentage": 10.98, "elapsed_time": "18:30:53", "remaining_time": "6 days, 6:05:36", "throughput": 2722.27, "total_tokens": 181448064} {"current_steps": 1004, "total_steps": 9134, "loss": 0.6991, "learning_rate": 4.852417384474248e-05, "epoch": 0.10990995922165357, "percentage": 10.99, "elapsed_time": "18:31:58", "remaining_time": "6 days, 6:04:20", "throughput": 2722.02, "total_tokens": 181609344} {"current_steps": 1005, "total_steps": 9134, "loss": 0.6477, "learning_rate": 4.852126183314894e-05, "epoch": 0.11001943129259148, "percentage": 11.0, "elapsed_time": "18:33:06", "remaining_time": "6 days, 6:03:22", "throughput": 2722.21, "total_tokens": 181806016} {"current_steps": 1006, "total_steps": 9134, "loss": 0.6692, "learning_rate": 4.851834703903508e-05, "epoch": 0.11012890336352937, "percentage": 11.01, "elapsed_time": "18:34:11", "remaining_time": "6 days, 6:02:09", "throughput": 2722.31, "total_tokens": 181990816} {"current_steps": 1007, "total_steps": 9134, "loss": 0.616, "learning_rate": 4.851542946274573e-05, "epoch": 0.11023837543446728, "percentage": 11.02, "elapsed_time": "18:35:15", "remaining_time": "6 days, 6:00:41", "throughput": 2722.01, "total_tokens": 182144480} {"current_steps": 1008, "total_steps": 9134, "loss": 0.7609, "learning_rate": 4.8512509104626036e-05, "epoch": 0.11034784750540519, "percentage": 11.04, "elapsed_time": "18:36:21", "remaining_time": "6 days, 5:59:29", "throughput": 2721.94, "total_tokens": 182318528} {"current_steps": 1009, "total_steps": 9134, "loss": 0.6533, "learning_rate": 4.850958596502145e-05, "epoch": 0.11045731957634308, "percentage": 11.05, "elapsed_time": "18:37:26", "remaining_time": "6 days, 5:58:13", "throughput": 2721.65, "total_tokens": 182477120} {"current_steps": 1010, "total_steps": 9134, "loss": 0.6286, "learning_rate": 4.85066600442778e-05, "epoch": 0.11056679164728099, "percentage": 11.06, "elapsed_time": "18:38:31", "remaining_time": "6 days, 5:56:54", "throughput": 2721.45, "total_tokens": 182640416} {"current_steps": 1011, "total_steps": 9134, "loss": 0.6152, "learning_rate": 4.8503731342741195e-05, "epoch": 0.11067626371821888, "percentage": 11.07, "elapsed_time": "18:39:38", "remaining_time": "6 days, 5:55:55", "throughput": 2721.66, "total_tokens": 182837760} {"current_steps": 1012, "total_steps": 9134, "loss": 0.8555, "learning_rate": 4.8500799860758105e-05, "epoch": 0.11078573578915679, "percentage": 11.08, "elapsed_time": "18:40:48", "remaining_time": "6 days, 5:55:11", "throughput": 2721.99, "total_tokens": 183048096} {"current_steps": 1013, "total_steps": 9134, "loss": 0.7277, "learning_rate": 4.849786559867532e-05, "epoch": 0.1108952078600947, "percentage": 11.09, "elapsed_time": "18:41:55", "remaining_time": "6 days, 5:54:10", "throughput": 2721.95, "total_tokens": 183228416} {"current_steps": 1014, "total_steps": 9134, "loss": 0.8214, "learning_rate": 4.8494928556839946e-05, "epoch": 0.1110046799310326, "percentage": 11.1, "elapsed_time": "18:43:00", "remaining_time": "6 days, 5:52:55", "throughput": 2721.61, "total_tokens": 183383200} {"current_steps": 1015, "total_steps": 9134, "loss": 0.7543, "learning_rate": 4.849198873559945e-05, "epoch": 0.1111141520019705, "percentage": 11.11, "elapsed_time": "18:44:09", "remaining_time": "6 days, 5:52:11", "throughput": 2721.96, "total_tokens": 183595552} {"current_steps": 1016, "total_steps": 9134, "loss": 0.6592, "learning_rate": 4.848904613530159e-05, "epoch": 0.1112236240729084, "percentage": 11.12, "elapsed_time": "18:45:16", "remaining_time": "6 days, 5:51:05", "throughput": 2721.75, "total_tokens": 183762432} {"current_steps": 1017, "total_steps": 9134, "loss": 0.8744, "learning_rate": 4.848610075629447e-05, "epoch": 0.1113330961438463, "percentage": 11.13, "elapsed_time": "18:46:23", "remaining_time": "6 days, 5:50:03", "throughput": 2722.12, "total_tokens": 183970080} {"current_steps": 1018, "total_steps": 9134, "loss": 0.6931, "learning_rate": 4.848315259892654e-05, "epoch": 0.11144256821478421, "percentage": 11.15, "elapsed_time": "18:47:32", "remaining_time": "6 days, 5:49:19", "throughput": 2722.42, "total_tokens": 184178624} {"current_steps": 1019, "total_steps": 9134, "loss": 0.8305, "learning_rate": 4.848020166354654e-05, "epoch": 0.1115520402857221, "percentage": 11.16, "elapsed_time": "18:48:35", "remaining_time": "6 days, 5:47:45", "throughput": 2722.22, "total_tokens": 184336320} {"current_steps": 1020, "total_steps": 9134, "loss": 0.5545, "learning_rate": 4.847724795050358e-05, "epoch": 0.11166151235666001, "percentage": 11.17, "elapsed_time": "18:49:41", "remaining_time": "6 days, 5:46:35", "throughput": 2721.94, "total_tokens": 184497376} {"current_steps": 1021, "total_steps": 9134, "loss": 0.8031, "learning_rate": 4.847429146014706e-05, "epoch": 0.1117709844275979, "percentage": 11.18, "elapsed_time": "18:50:50", "remaining_time": "6 days, 5:45:49", "throughput": 2722.21, "total_tokens": 184703680} {"current_steps": 1022, "total_steps": 9134, "loss": 0.6681, "learning_rate": 4.847133219282674e-05, "epoch": 0.11188045649853581, "percentage": 11.19, "elapsed_time": "18:51:59", "remaining_time": "6 days, 5:45:03", "throughput": 2722.26, "total_tokens": 184894752} {"current_steps": 1023, "total_steps": 9134, "loss": 0.7536, "learning_rate": 4.846837014889269e-05, "epoch": 0.1119899285694737, "percentage": 11.2, "elapsed_time": "18:53:05", "remaining_time": "6 days, 5:43:51", "throughput": 2722.25, "total_tokens": 185073504} {"current_steps": 1024, "total_steps": 9134, "loss": 0.8242, "learning_rate": 4.8465405328695315e-05, "epoch": 0.11209940064041161, "percentage": 11.21, "elapsed_time": "18:54:14", "remaining_time": "6 days, 5:43:04", "throughput": 2722.17, "total_tokens": 185254944} {"current_steps": 1025, "total_steps": 9134, "loss": 0.8374, "learning_rate": 4.8462437732585345e-05, "epoch": 0.11220887271134952, "percentage": 11.22, "elapsed_time": "18:55:23", "remaining_time": "6 days, 5:42:21", "throughput": 2722.35, "total_tokens": 185456320} {"current_steps": 1026, "total_steps": 9134, "loss": 0.6488, "learning_rate": 4.845946736091384e-05, "epoch": 0.11231834478228742, "percentage": 11.23, "elapsed_time": "18:56:28", "remaining_time": "6 days, 5:41:00", "throughput": 2722.41, "total_tokens": 185636640} {"current_steps": 1027, "total_steps": 9134, "loss": 0.5977, "learning_rate": 4.8456494214032205e-05, "epoch": 0.11242781685322532, "percentage": 11.24, "elapsed_time": "18:57:34", "remaining_time": "6 days, 5:39:52", "throughput": 2722.57, "total_tokens": 185827936} {"current_steps": 1028, "total_steps": 9134, "loss": 0.7064, "learning_rate": 4.8453518292292146e-05, "epoch": 0.11253728892416322, "percentage": 11.25, "elapsed_time": "18:58:41", "remaining_time": "6 days, 5:38:52", "throughput": 2722.6, "total_tokens": 186013184} {"current_steps": 1029, "total_steps": 9134, "loss": 0.7034, "learning_rate": 4.8450539596045694e-05, "epoch": 0.11264676099510113, "percentage": 11.27, "elapsed_time": "18:59:48", "remaining_time": "6 days, 5:37:48", "throughput": 2722.19, "total_tokens": 186166624} {"current_steps": 1030, "total_steps": 9134, "loss": 0.6872, "learning_rate": 4.844755812564525e-05, "epoch": 0.11275623306603903, "percentage": 11.28, "elapsed_time": "19:00:53", "remaining_time": "6 days, 5:36:28", "throughput": 2722.18, "total_tokens": 186342240} {"current_steps": 1031, "total_steps": 9134, "loss": 0.7132, "learning_rate": 4.84445738814435e-05, "epoch": 0.11286570513697693, "percentage": 11.29, "elapsed_time": "19:02:00", "remaining_time": "6 days, 5:35:24", "throughput": 2722.36, "total_tokens": 186536896} {"current_steps": 1032, "total_steps": 9134, "loss": 0.7331, "learning_rate": 4.8441586863793475e-05, "epoch": 0.11297517720791483, "percentage": 11.3, "elapsed_time": "19:03:09", "remaining_time": "6 days, 5:34:37", "throughput": 2722.64, "total_tokens": 186743200} {"current_steps": 1033, "total_steps": 9134, "loss": 0.6708, "learning_rate": 4.843859707304854e-05, "epoch": 0.11308464927885273, "percentage": 11.31, "elapsed_time": "19:04:18", "remaining_time": "6 days, 5:33:57", "throughput": 2722.93, "total_tokens": 186953536} {"current_steps": 1034, "total_steps": 9134, "loss": 1.0204, "learning_rate": 4.843560450956238e-05, "epoch": 0.11319412134979064, "percentage": 11.32, "elapsed_time": "19:05:28", "remaining_time": "6 days, 5:33:15", "throughput": 2723.32, "total_tokens": 187169472} {"current_steps": 1035, "total_steps": 9134, "loss": 0.7375, "learning_rate": 4.8432609173689004e-05, "epoch": 0.11330359342072854, "percentage": 11.33, "elapsed_time": "19:06:33", "remaining_time": "6 days, 5:31:56", "throughput": 2723.36, "total_tokens": 187349120} {"current_steps": 1036, "total_steps": 9134, "loss": 0.7696, "learning_rate": 4.8429611065782765e-05, "epoch": 0.11341306549166644, "percentage": 11.34, "elapsed_time": "19:07:41", "remaining_time": "6 days, 5:30:59", "throughput": 2723.41, "total_tokens": 187537056} {"current_steps": 1037, "total_steps": 9134, "loss": 0.6767, "learning_rate": 4.8426610186198315e-05, "epoch": 0.11352253756260434, "percentage": 11.35, "elapsed_time": "19:08:46", "remaining_time": "6 days, 5:29:44", "throughput": 2723.45, "total_tokens": 187717824} {"current_steps": 1038, "total_steps": 9134, "loss": 0.5902, "learning_rate": 4.8423606535290675e-05, "epoch": 0.11363200963354224, "percentage": 11.36, "elapsed_time": "19:09:48", "remaining_time": "6 days, 5:28:05", "throughput": 2722.97, "total_tokens": 187853792} {"current_steps": 1039, "total_steps": 9134, "loss": 0.7321, "learning_rate": 4.842060011341516e-05, "epoch": 0.11374148170448015, "percentage": 11.38, "elapsed_time": "19:10:56", "remaining_time": "6 days, 5:27:08", "throughput": 2722.99, "total_tokens": 188039936} {"current_steps": 1040, "total_steps": 9134, "loss": 0.8522, "learning_rate": 4.841759092092741e-05, "epoch": 0.11385095377541804, "percentage": 11.39, "elapsed_time": "19:12:02", "remaining_time": "6 days, 5:25:57", "throughput": 2723.08, "total_tokens": 188225856} {"current_steps": 1041, "total_steps": 9134, "loss": 0.6799, "learning_rate": 4.841457895818344e-05, "epoch": 0.11396042584635595, "percentage": 11.4, "elapsed_time": "19:13:03", "remaining_time": "6 days, 5:24:10", "throughput": 2722.57, "total_tokens": 188357120} {"current_steps": 1042, "total_steps": 9134, "loss": 0.7518, "learning_rate": 4.841156422553953e-05, "epoch": 0.11406989791729386, "percentage": 11.41, "elapsed_time": "19:14:07", "remaining_time": "6 days, 5:22:41", "throughput": 2722.56, "total_tokens": 188529376} {"current_steps": 1043, "total_steps": 9134, "loss": 0.6675, "learning_rate": 4.840854672335233e-05, "epoch": 0.11417936998823175, "percentage": 11.42, "elapsed_time": "19:15:16", "remaining_time": "6 days, 5:21:54", "throughput": 2722.51, "total_tokens": 188713280} {"current_steps": 1044, "total_steps": 9134, "loss": 0.632, "learning_rate": 4.84055264519788e-05, "epoch": 0.11428884205916966, "percentage": 11.43, "elapsed_time": "19:16:18", "remaining_time": "6 days, 5:20:16", "throughput": 2722.19, "total_tokens": 188861120} {"current_steps": 1045, "total_steps": 9134, "loss": 0.5964, "learning_rate": 4.8402503411776235e-05, "epoch": 0.11439831413010755, "percentage": 11.44, "elapsed_time": "19:17:22", "remaining_time": "6 days, 5:18:50", "throughput": 2722.28, "total_tokens": 189041440} {"current_steps": 1046, "total_steps": 9134, "loss": 0.9238, "learning_rate": 4.839947760310226e-05, "epoch": 0.11450778620104546, "percentage": 11.45, "elapsed_time": "19:18:31", "remaining_time": "6 days, 5:18:01", "throughput": 2722.41, "total_tokens": 189237888} {"current_steps": 1047, "total_steps": 9134, "loss": 0.5199, "learning_rate": 4.8396449026314803e-05, "epoch": 0.11461725827198337, "percentage": 11.46, "elapsed_time": "19:19:34", "remaining_time": "6 days, 5:16:32", "throughput": 2722.51, "total_tokens": 189417760} {"current_steps": 1048, "total_steps": 9134, "loss": 0.7467, "learning_rate": 4.839341768177217e-05, "epoch": 0.11472673034292126, "percentage": 11.47, "elapsed_time": "19:20:41", "remaining_time": "6 days, 5:15:29", "throughput": 2722.51, "total_tokens": 189599872} {"current_steps": 1049, "total_steps": 9134, "loss": 0.5758, "learning_rate": 4.839038356983293e-05, "epoch": 0.11483620241385917, "percentage": 11.48, "elapsed_time": "19:21:48", "remaining_time": "6 days, 5:14:30", "throughput": 2722.52, "total_tokens": 189784000} {"current_steps": 1050, "total_steps": 9134, "loss": 0.6175, "learning_rate": 4.838734669085604e-05, "epoch": 0.11494567448479706, "percentage": 11.5, "elapsed_time": "19:22:53", "remaining_time": "6 days, 5:13:09", "throughput": 2722.65, "total_tokens": 189969024} {"current_steps": 1051, "total_steps": 9134, "loss": 0.7275, "learning_rate": 4.838430704520074e-05, "epoch": 0.11505514655573497, "percentage": 11.51, "elapsed_time": "19:23:59", "remaining_time": "6 days, 5:11:57", "throughput": 2722.66, "total_tokens": 190148672} {"current_steps": 1052, "total_steps": 9134, "loss": 0.6634, "learning_rate": 4.838126463322662e-05, "epoch": 0.11516461862667288, "percentage": 11.52, "elapsed_time": "19:25:04", "remaining_time": "6 days, 5:10:39", "throughput": 2722.67, "total_tokens": 190325632} {"current_steps": 1053, "total_steps": 9134, "loss": 0.7543, "learning_rate": 4.8378219455293595e-05, "epoch": 0.11527409069761077, "percentage": 11.53, "elapsed_time": "19:26:08", "remaining_time": "6 days, 5:09:16", "throughput": 2722.69, "total_tokens": 190502368} {"current_steps": 1054, "total_steps": 9134, "loss": 0.8233, "learning_rate": 4.8375171511761895e-05, "epoch": 0.11538356276854868, "percentage": 11.54, "elapsed_time": "19:27:14", "remaining_time": "6 days, 5:08:10", "throughput": 2722.83, "total_tokens": 190693216} {"current_steps": 1055, "total_steps": 9134, "loss": 0.5905, "learning_rate": 4.837212080299209e-05, "epoch": 0.11549303483948657, "percentage": 11.55, "elapsed_time": "19:28:16", "remaining_time": "6 days, 5:06:24", "throughput": 2722.48, "total_tokens": 190835232} {"current_steps": 1056, "total_steps": 9134, "loss": 0.7737, "learning_rate": 4.836906732934508e-05, "epoch": 0.11560250691042448, "percentage": 11.56, "elapsed_time": "19:29:23", "remaining_time": "6 days, 5:05:22", "throughput": 2722.56, "total_tokens": 191023616} {"current_steps": 1057, "total_steps": 9134, "loss": 1.0295, "learning_rate": 4.836601109118208e-05, "epoch": 0.11571197898136237, "percentage": 11.57, "elapsed_time": "19:30:24", "remaining_time": "6 days, 5:03:37", "throughput": 2722.41, "total_tokens": 191180640} {"current_steps": 1058, "total_steps": 9134, "loss": 0.6463, "learning_rate": 4.836295208886463e-05, "epoch": 0.11582145105230028, "percentage": 11.58, "elapsed_time": "19:31:33", "remaining_time": "6 days, 5:02:49", "throughput": 2722.45, "total_tokens": 191370144} {"current_steps": 1059, "total_steps": 9134, "loss": 0.7186, "learning_rate": 4.835989032275461e-05, "epoch": 0.11593092312323819, "percentage": 11.59, "elapsed_time": "19:32:39", "remaining_time": "6 days, 5:01:37", "throughput": 2722.43, "total_tokens": 191548224} {"current_steps": 1060, "total_steps": 9134, "loss": 0.5458, "learning_rate": 4.835682579321423e-05, "epoch": 0.11604039519417608, "percentage": 11.6, "elapsed_time": "19:33:43", "remaining_time": "6 days, 5:00:17", "throughput": 2722.43, "total_tokens": 191724512} {"current_steps": 1061, "total_steps": 9134, "loss": 0.8529, "learning_rate": 4.8353758500606e-05, "epoch": 0.11614986726511399, "percentage": 11.62, "elapsed_time": "19:34:52", "remaining_time": "6 days, 4:59:29", "throughput": 2722.49, "total_tokens": 191916032} {"current_steps": 1062, "total_steps": 9134, "loss": 0.7331, "learning_rate": 4.8350688445292794e-05, "epoch": 0.11625933933605188, "percentage": 11.63, "elapsed_time": "19:36:00", "remaining_time": "6 days, 4:58:33", "throughput": 2722.49, "total_tokens": 192100832} {"current_steps": 1063, "total_steps": 9134, "loss": 0.6914, "learning_rate": 4.834761562763777e-05, "epoch": 0.11636881140698979, "percentage": 11.64, "elapsed_time": "19:37:08", "remaining_time": "6 days, 4:57:37", "throughput": 2722.21, "total_tokens": 192265472} {"current_steps": 1064, "total_steps": 9134, "loss": 0.5881, "learning_rate": 4.834454004800446e-05, "epoch": 0.1164782834779277, "percentage": 11.65, "elapsed_time": "19:38:16", "remaining_time": "6 days, 4:56:47", "throughput": 2722.18, "total_tokens": 192450048} {"current_steps": 1065, "total_steps": 9134, "loss": 0.6059, "learning_rate": 4.8341461706756686e-05, "epoch": 0.1165877555488656, "percentage": 11.66, "elapsed_time": "19:39:22", "remaining_time": "6 days, 4:55:31", "throughput": 2722.36, "total_tokens": 192640224} {"current_steps": 1066, "total_steps": 9134, "loss": 0.6311, "learning_rate": 4.833838060425862e-05, "epoch": 0.1166972276198035, "percentage": 11.67, "elapsed_time": "19:40:29", "remaining_time": "6 days, 4:54:27", "throughput": 2722.59, "total_tokens": 192838464} {"current_steps": 1067, "total_steps": 9134, "loss": 0.7326, "learning_rate": 4.8335296740874735e-05, "epoch": 0.1168066996907414, "percentage": 11.68, "elapsed_time": "19:41:37", "remaining_time": "6 days, 4:53:33", "throughput": 2722.53, "total_tokens": 193019232} {"current_steps": 1068, "total_steps": 9134, "loss": 0.7613, "learning_rate": 4.8332210116969855e-05, "epoch": 0.1169161717616793, "percentage": 11.69, "elapsed_time": "19:42:44", "remaining_time": "6 days, 4:52:33", "throughput": 2722.74, "total_tokens": 193217472} {"current_steps": 1069, "total_steps": 9134, "loss": 0.7442, "learning_rate": 4.832912073290913e-05, "epoch": 0.11702564383261721, "percentage": 11.7, "elapsed_time": "19:43:46", "remaining_time": "6 days, 4:50:57", "throughput": 2722.65, "total_tokens": 193380992} {"current_steps": 1070, "total_steps": 9134, "loss": 0.7619, "learning_rate": 4.832602858905801e-05, "epoch": 0.1171351159035551, "percentage": 11.71, "elapsed_time": "19:44:56", "remaining_time": "6 days, 4:50:12", "throughput": 2722.6, "total_tokens": 193566240} {"current_steps": 1071, "total_steps": 9134, "loss": 0.6023, "learning_rate": 4.8322933685782304e-05, "epoch": 0.11724458797449301, "percentage": 11.73, "elapsed_time": "19:46:04", "remaining_time": "6 days, 4:49:18", "throughput": 2722.42, "total_tokens": 193738720} {"current_steps": 1072, "total_steps": 9134, "loss": 0.7588, "learning_rate": 4.831983602344813e-05, "epoch": 0.1173540600454309, "percentage": 11.74, "elapsed_time": "19:47:07", "remaining_time": "6 days, 4:47:44", "throughput": 2722.42, "total_tokens": 193910080} {"current_steps": 1073, "total_steps": 9134, "loss": 0.7136, "learning_rate": 4.8316735602421935e-05, "epoch": 0.11746353211636881, "percentage": 11.75, "elapsed_time": "19:48:13", "remaining_time": "6 days, 4:46:39", "throughput": 2722.51, "total_tokens": 194097568} {"current_steps": 1074, "total_steps": 9134, "loss": 0.7162, "learning_rate": 4.831363242307049e-05, "epoch": 0.1175730041873067, "percentage": 11.76, "elapsed_time": "19:49:19", "remaining_time": "6 days, 4:45:30", "throughput": 2722.23, "total_tokens": 194257728} {"current_steps": 1075, "total_steps": 9134, "loss": 0.8369, "learning_rate": 4.83105264857609e-05, "epoch": 0.11768247625824461, "percentage": 11.77, "elapsed_time": "19:50:29", "remaining_time": "6 days, 4:44:47", "throughput": 2722.49, "total_tokens": 194465600} {"current_steps": 1076, "total_steps": 9134, "loss": 0.5408, "learning_rate": 4.8307417790860586e-05, "epoch": 0.11779194832918252, "percentage": 11.78, "elapsed_time": "19:51:35", "remaining_time": "6 days, 4:43:38", "throughput": 2722.17, "total_tokens": 194622624} {"current_steps": 1077, "total_steps": 9134, "loss": 0.6627, "learning_rate": 4.830430633873731e-05, "epoch": 0.11790142040012042, "percentage": 11.79, "elapsed_time": "19:52:41", "remaining_time": "6 days, 4:42:27", "throughput": 2722.01, "total_tokens": 194790848} {"current_steps": 1078, "total_steps": 9134, "loss": 0.8924, "learning_rate": 4.830119212975914e-05, "epoch": 0.11801089247105832, "percentage": 11.8, "elapsed_time": "19:53:47", "remaining_time": "6 days, 4:41:18", "throughput": 2722.28, "total_tokens": 194989984} {"current_steps": 1079, "total_steps": 9134, "loss": 0.7917, "learning_rate": 4.8298075164294484e-05, "epoch": 0.11812036454199622, "percentage": 11.81, "elapsed_time": "19:54:56", "remaining_time": "6 days, 4:40:28", "throughput": 2722.55, "total_tokens": 195196064} {"current_steps": 1080, "total_steps": 9134, "loss": 0.728, "learning_rate": 4.829495544271208e-05, "epoch": 0.11822983661293412, "percentage": 11.82, "elapsed_time": "19:55:59", "remaining_time": "6 days, 4:38:57", "throughput": 2722.53, "total_tokens": 195366304} {"current_steps": 1081, "total_steps": 9134, "loss": 0.7152, "learning_rate": 4.829183296538097e-05, "epoch": 0.11833930868387203, "percentage": 11.83, "elapsed_time": "19:57:07", "remaining_time": "6 days, 4:38:08", "throughput": 2722.33, "total_tokens": 195539456} {"current_steps": 1082, "total_steps": 9134, "loss": 0.5901, "learning_rate": 4.828870773267056e-05, "epoch": 0.11844878075480993, "percentage": 11.85, "elapsed_time": "19:58:16", "remaining_time": "6 days, 4:37:13", "throughput": 2722.32, "total_tokens": 195724256} {"current_steps": 1083, "total_steps": 9134, "loss": 0.7107, "learning_rate": 4.8285579744950535e-05, "epoch": 0.11855825282574783, "percentage": 11.86, "elapsed_time": "19:59:17", "remaining_time": "6 days, 4:35:34", "throughput": 2721.97, "total_tokens": 195867616} {"current_steps": 1084, "total_steps": 9134, "loss": 0.6382, "learning_rate": 4.828244900259094e-05, "epoch": 0.11866772489668573, "percentage": 11.87, "elapsed_time": "20:00:27", "remaining_time": "6 days, 4:34:47", "throughput": 2721.89, "total_tokens": 196049728} {"current_steps": 1085, "total_steps": 9134, "loss": 0.6994, "learning_rate": 4.827931550596214e-05, "epoch": 0.11877719696762364, "percentage": 11.88, "elapsed_time": "20:01:28", "remaining_time": "6 days, 4:33:06", "throughput": 2721.59, "total_tokens": 196196224} {"current_steps": 1086, "total_steps": 9134, "loss": 0.751, "learning_rate": 4.827617925543482e-05, "epoch": 0.11888666903856154, "percentage": 11.89, "elapsed_time": "20:02:36", "remaining_time": "6 days, 4:32:07", "throughput": 2721.6, "total_tokens": 196380352} {"current_steps": 1087, "total_steps": 9134, "loss": 0.5442, "learning_rate": 4.8273040251379985e-05, "epoch": 0.11899614110949944, "percentage": 11.9, "elapsed_time": "20:03:41", "remaining_time": "6 days, 4:30:49", "throughput": 2721.6, "total_tokens": 196557312} {"current_steps": 1088, "total_steps": 9134, "loss": 0.6971, "learning_rate": 4.826989849416899e-05, "epoch": 0.11910561318043734, "percentage": 11.91, "elapsed_time": "20:04:43", "remaining_time": "6 days, 4:29:15", "throughput": 2721.34, "total_tokens": 196709408} {"current_steps": 1089, "total_steps": 9134, "loss": 0.8622, "learning_rate": 4.826675398417347e-05, "epoch": 0.11921508525137524, "percentage": 11.92, "elapsed_time": "20:05:53", "remaining_time": "6 days, 4:28:31", "throughput": 2721.57, "total_tokens": 196915040} {"current_steps": 1090, "total_steps": 9134, "loss": 0.7381, "learning_rate": 4.826360672176544e-05, "epoch": 0.11932455732231315, "percentage": 11.93, "elapsed_time": "20:07:01", "remaining_time": "6 days, 4:27:36", "throughput": 2721.73, "total_tokens": 197111488} {"current_steps": 1091, "total_steps": 9134, "loss": 0.8174, "learning_rate": 4.826045670731722e-05, "epoch": 0.11943402939325104, "percentage": 11.94, "elapsed_time": "20:08:05", "remaining_time": "6 days, 4:26:11", "throughput": 2721.61, "total_tokens": 197276576} {"current_steps": 1092, "total_steps": 9134, "loss": 0.7172, "learning_rate": 4.825730394120142e-05, "epoch": 0.11954350146418895, "percentage": 11.96, "elapsed_time": "20:09:14", "remaining_time": "6 days, 4:25:24", "throughput": 2721.53, "total_tokens": 197459136} {"current_steps": 1093, "total_steps": 9134, "loss": 0.5935, "learning_rate": 4.8254148423791035e-05, "epoch": 0.11965297353512686, "percentage": 11.97, "elapsed_time": "20:10:23", "remaining_time": "6 days, 4:24:37", "throughput": 2721.62, "total_tokens": 197653792} {"current_steps": 1094, "total_steps": 9134, "loss": 0.8727, "learning_rate": 4.825099015545934e-05, "epoch": 0.11976244560606475, "percentage": 11.98, "elapsed_time": "20:11:30", "remaining_time": "6 days, 4:23:37", "throughput": 2721.57, "total_tokens": 197833216} {"current_steps": 1095, "total_steps": 9134, "loss": 0.813, "learning_rate": 4.824782913657996e-05, "epoch": 0.11987191767700266, "percentage": 11.99, "elapsed_time": "20:12:36", "remaining_time": "6 days, 4:22:29", "throughput": 2721.64, "total_tokens": 198018688} {"current_steps": 1096, "total_steps": 9134, "loss": 0.7642, "learning_rate": 4.824466536752683e-05, "epoch": 0.11998138974794055, "percentage": 12.0, "elapsed_time": "20:13:43", "remaining_time": "6 days, 4:21:21", "throughput": 2721.61, "total_tokens": 198196544} {"current_steps": 1097, "total_steps": 9134, "loss": 0.7276, "learning_rate": 4.8241498848674236e-05, "epoch": 0.12009086181887846, "percentage": 12.01, "elapsed_time": "20:14:49", "remaining_time": "6 days, 4:20:14", "throughput": 2721.39, "total_tokens": 198361408} {"current_steps": 1098, "total_steps": 9134, "loss": 0.7087, "learning_rate": 4.823832958039675e-05, "epoch": 0.12020033388981637, "percentage": 12.02, "elapsed_time": "20:15:53", "remaining_time": "6 days, 4:18:46", "throughput": 2721.47, "total_tokens": 198539712} {"current_steps": 1099, "total_steps": 9134, "loss": 0.5878, "learning_rate": 4.82351575630693e-05, "epoch": 0.12030980596075426, "percentage": 12.03, "elapsed_time": "20:16:57", "remaining_time": "6 days, 4:17:25", "throughput": 2721.46, "total_tokens": 198714656} {"current_steps": 1100, "total_steps": 9134, "loss": 0.7793, "learning_rate": 4.823198279706713e-05, "epoch": 0.12041927803169217, "percentage": 12.04, "elapsed_time": "20:18:03", "remaining_time": "6 days, 4:16:12", "throughput": 2721.5, "total_tokens": 198896096} {"current_steps": 1101, "total_steps": 9134, "loss": 0.6473, "learning_rate": 4.8228805282765803e-05, "epoch": 0.12052875010263006, "percentage": 12.05, "elapsed_time": "20:19:10", "remaining_time": "6 days, 4:15:13", "throughput": 2721.4, "total_tokens": 199071936} {"current_steps": 1102, "total_steps": 9134, "loss": 0.8471, "learning_rate": 4.822562502054122e-05, "epoch": 0.12063822217356797, "percentage": 12.06, "elapsed_time": "20:20:19", "remaining_time": "6 days, 4:14:22", "throughput": 2721.5, "total_tokens": 199265920} {"current_steps": 1103, "total_steps": 9134, "loss": 0.7165, "learning_rate": 4.82224420107696e-05, "epoch": 0.12074769424450588, "percentage": 12.08, "elapsed_time": "20:21:28", "remaining_time": "6 days, 4:13:36", "throughput": 2721.5, "total_tokens": 199454752} {"current_steps": 1104, "total_steps": 9134, "loss": 0.7643, "learning_rate": 4.821925625382748e-05, "epoch": 0.12085716631544377, "percentage": 12.09, "elapsed_time": "20:22:35", "remaining_time": "6 days, 4:12:36", "throughput": 2721.52, "total_tokens": 199638880} {"current_steps": 1105, "total_steps": 9134, "loss": 0.6976, "learning_rate": 4.821606775009173e-05, "epoch": 0.12096663838638168, "percentage": 12.1, "elapsed_time": "20:23:42", "remaining_time": "6 days, 4:11:30", "throughput": 2721.37, "total_tokens": 199809120} {"current_steps": 1106, "total_steps": 9134, "loss": 0.6002, "learning_rate": 4.8212876499939555e-05, "epoch": 0.12107611045731957, "percentage": 12.11, "elapsed_time": "20:24:43", "remaining_time": "6 days, 4:09:48", "throughput": 2721.04, "total_tokens": 199952256} {"current_steps": 1107, "total_steps": 9134, "loss": 0.668, "learning_rate": 4.8209682503748455e-05, "epoch": 0.12118558252825748, "percentage": 12.12, "elapsed_time": "20:25:51", "remaining_time": "6 days, 4:08:52", "throughput": 2720.82, "total_tokens": 200120480} {"current_steps": 1108, "total_steps": 9134, "loss": 0.7596, "learning_rate": 4.820648576189629e-05, "epoch": 0.12129505459919539, "percentage": 12.13, "elapsed_time": "20:26:58", "remaining_time": "6 days, 4:07:47", "throughput": 2720.56, "total_tokens": 200282880} {"current_steps": 1109, "total_steps": 9134, "loss": 0.8501, "learning_rate": 4.820328627476122e-05, "epoch": 0.12140452667013328, "percentage": 12.14, "elapsed_time": "20:28:04", "remaining_time": "6 days, 4:06:41", "throughput": 2720.62, "total_tokens": 200468576} {"current_steps": 1110, "total_steps": 9134, "loss": 0.7494, "learning_rate": 4.820008404272175e-05, "epoch": 0.12151399874107119, "percentage": 12.15, "elapsed_time": "20:29:14", "remaining_time": "6 days, 4:05:56", "throughput": 2721.03, "total_tokens": 200686976} {"current_steps": 1111, "total_steps": 9134, "loss": 0.6706, "learning_rate": 4.819687906615668e-05, "epoch": 0.12162347081200908, "percentage": 12.16, "elapsed_time": "20:30:19", "remaining_time": "6 days, 4:04:43", "throughput": 2720.99, "total_tokens": 200863264} {"current_steps": 1112, "total_steps": 9134, "loss": 0.648, "learning_rate": 4.819367134544516e-05, "epoch": 0.12173294288294699, "percentage": 12.17, "elapsed_time": "20:31:29", "remaining_time": "6 days, 4:04:01", "throughput": 2721.34, "total_tokens": 201078976} {"current_steps": 1113, "total_steps": 9134, "loss": 0.7267, "learning_rate": 4.819046088096666e-05, "epoch": 0.12184241495388488, "percentage": 12.19, "elapsed_time": "20:32:32", "remaining_time": "6 days, 4:02:31", "throughput": 2721.32, "total_tokens": 201249216} {"current_steps": 1114, "total_steps": 9134, "loss": 0.7926, "learning_rate": 4.818724767310098e-05, "epoch": 0.12195188702482279, "percentage": 12.2, "elapsed_time": "20:33:40", "remaining_time": "6 days, 4:01:33", "throughput": 2721.47, "total_tokens": 201444320} {"current_steps": 1115, "total_steps": 9134, "loss": 0.5634, "learning_rate": 4.8184031722228216e-05, "epoch": 0.1220613590957607, "percentage": 12.21, "elapsed_time": "20:34:45", "remaining_time": "6 days, 4:00:14", "throughput": 2721.59, "total_tokens": 201629344} {"current_steps": 1116, "total_steps": 9134, "loss": 0.6993, "learning_rate": 4.818081302872882e-05, "epoch": 0.12217083116669859, "percentage": 12.22, "elapsed_time": "20:35:54", "remaining_time": "6 days, 3:59:29", "throughput": 2721.63, "total_tokens": 201821088} {"current_steps": 1117, "total_steps": 9134, "loss": 0.6645, "learning_rate": 4.817759159298356e-05, "epoch": 0.1222803032376365, "percentage": 12.23, "elapsed_time": "20:37:02", "remaining_time": "6 days, 3:58:32", "throughput": 2721.46, "total_tokens": 201992896} {"current_steps": 1118, "total_steps": 9134, "loss": 0.6137, "learning_rate": 4.817436741537352e-05, "epoch": 0.1223897753085744, "percentage": 12.24, "elapsed_time": "20:38:08", "remaining_time": "6 days, 3:57:21", "throughput": 2721.3, "total_tokens": 202160224} {"current_steps": 1119, "total_steps": 9134, "loss": 0.5721, "learning_rate": 4.817114049628012e-05, "epoch": 0.1224992473795123, "percentage": 12.25, "elapsed_time": "20:39:10", "remaining_time": "6 days, 3:55:48", "throughput": 2721.21, "total_tokens": 202324416} {"current_steps": 1120, "total_steps": 9134, "loss": 0.7126, "learning_rate": 4.81679108360851e-05, "epoch": 0.12260871945045021, "percentage": 12.26, "elapsed_time": "20:40:16", "remaining_time": "6 days, 3:54:37", "throughput": 2721.2, "total_tokens": 202502720} {"current_steps": 1121, "total_steps": 9134, "loss": 0.8152, "learning_rate": 4.8164678435170505e-05, "epoch": 0.1227181915213881, "percentage": 12.27, "elapsed_time": "20:41:23", "remaining_time": "6 days, 3:53:31", "throughput": 2721.29, "total_tokens": 202690208} {"current_steps": 1122, "total_steps": 9134, "loss": 0.7046, "learning_rate": 4.8161443293918746e-05, "epoch": 0.12282766359232601, "percentage": 12.28, "elapsed_time": "20:42:26", "remaining_time": "6 days, 3:52:01", "throughput": 2721.01, "total_tokens": 202841408} {"current_steps": 1123, "total_steps": 9134, "loss": 0.7138, "learning_rate": 4.815820541271252e-05, "epoch": 0.1229371356632639, "percentage": 12.29, "elapsed_time": "20:43:32", "remaining_time": "6 days, 3:50:50", "throughput": 2720.67, "total_tokens": 202994400} {"current_steps": 1124, "total_steps": 9134, "loss": 0.826, "learning_rate": 4.815496479193486e-05, "epoch": 0.12304660773420181, "percentage": 12.31, "elapsed_time": "20:44:38", "remaining_time": "6 days, 3:49:43", "throughput": 2720.19, "total_tokens": 203139552} {"current_steps": 1125, "total_steps": 9134, "loss": 0.6858, "learning_rate": 4.815172143196913e-05, "epoch": 0.12315607980513972, "percentage": 12.32, "elapsed_time": "20:45:47", "remaining_time": "6 days, 3:48:56", "throughput": 2720.25, "total_tokens": 203332192} {"current_steps": 1126, "total_steps": 9134, "loss": 0.7775, "learning_rate": 4.814847533319902e-05, "epoch": 0.12326555187607761, "percentage": 12.33, "elapsed_time": "20:46:57", "remaining_time": "6 days, 3:48:12", "throughput": 2720.01, "total_tokens": 203503328} {"current_steps": 1127, "total_steps": 9134, "loss": 0.7706, "learning_rate": 4.814522649600852e-05, "epoch": 0.12337502394701552, "percentage": 12.34, "elapsed_time": "20:48:06", "remaining_time": "6 days, 3:47:29", "throughput": 2720.41, "total_tokens": 203723520} {"current_steps": 1128, "total_steps": 9134, "loss": 0.8207, "learning_rate": 4.814197492078198e-05, "epoch": 0.12348449601795342, "percentage": 12.35, "elapsed_time": "20:49:12", "remaining_time": "6 days, 3:46:15", "throughput": 2720.35, "total_tokens": 203896448} {"current_steps": 1129, "total_steps": 9134, "loss": 0.7653, "learning_rate": 4.813872060790404e-05, "epoch": 0.12359396808889132, "percentage": 12.36, "elapsed_time": "20:50:17", "remaining_time": "6 days, 3:45:00", "throughput": 2720.56, "total_tokens": 204089760} {"current_steps": 1130, "total_steps": 9134, "loss": 0.6552, "learning_rate": 4.813546355775969e-05, "epoch": 0.12370344015982922, "percentage": 12.37, "elapsed_time": "20:51:20", "remaining_time": "6 days, 3:43:32", "throughput": 2720.35, "total_tokens": 204246336} {"current_steps": 1131, "total_steps": 9134, "loss": 0.6613, "learning_rate": 4.813220377073423e-05, "epoch": 0.12381291223076712, "percentage": 12.38, "elapsed_time": "20:52:26", "remaining_time": "6 days, 3:42:20", "throughput": 2720.34, "total_tokens": 204424416} {"current_steps": 1132, "total_steps": 9134, "loss": 0.6629, "learning_rate": 4.8128941247213286e-05, "epoch": 0.12392238430170503, "percentage": 12.39, "elapsed_time": "20:53:32", "remaining_time": "6 days, 3:41:07", "throughput": 2720.23, "total_tokens": 204594656} {"current_steps": 1133, "total_steps": 9134, "loss": 0.8369, "learning_rate": 4.812567598758281e-05, "epoch": 0.12403185637264293, "percentage": 12.4, "elapsed_time": "20:54:40", "remaining_time": "6 days, 3:40:13", "throughput": 2720.43, "total_tokens": 204794912} {"current_steps": 1134, "total_steps": 9134, "loss": 0.6613, "learning_rate": 4.812240799222906e-05, "epoch": 0.12414132844358083, "percentage": 12.42, "elapsed_time": "20:55:46", "remaining_time": "6 days, 3:39:07", "throughput": 2720.29, "total_tokens": 204964928} {"current_steps": 1135, "total_steps": 9134, "loss": 0.5747, "learning_rate": 4.811913726153866e-05, "epoch": 0.12425080051451873, "percentage": 12.43, "elapsed_time": "20:56:48", "remaining_time": "6 days, 3:37:24", "throughput": 2719.99, "total_tokens": 205109632} {"current_steps": 1136, "total_steps": 9134, "loss": 0.6956, "learning_rate": 4.8115863795898514e-05, "epoch": 0.12436027258545664, "percentage": 12.44, "elapsed_time": "20:57:56", "remaining_time": "6 days, 3:36:31", "throughput": 2720.19, "total_tokens": 205309888} {"current_steps": 1137, "total_steps": 9134, "loss": 0.8307, "learning_rate": 4.811258759569587e-05, "epoch": 0.12446974465639454, "percentage": 12.45, "elapsed_time": "20:59:05", "remaining_time": "6 days, 3:35:42", "throughput": 2720.17, "total_tokens": 205496256} {"current_steps": 1138, "total_steps": 9134, "loss": 0.9829, "learning_rate": 4.8109308661318296e-05, "epoch": 0.12457921672733244, "percentage": 12.46, "elapsed_time": "21:00:10", "remaining_time": "6 days, 3:34:25", "throughput": 2720.13, "total_tokens": 205669632} {"current_steps": 1139, "total_steps": 9134, "loss": 0.8558, "learning_rate": 4.810602699315369e-05, "epoch": 0.12468868879827034, "percentage": 12.47, "elapsed_time": "21:01:12", "remaining_time": "6 days, 3:32:50", "throughput": 2719.82, "total_tokens": 205815904} {"current_steps": 1140, "total_steps": 9134, "loss": 0.8638, "learning_rate": 4.810274259159026e-05, "epoch": 0.12479816086920824, "percentage": 12.48, "elapsed_time": "21:02:19", "remaining_time": "6 days, 3:31:45", "throughput": 2719.95, "total_tokens": 206006976} {"current_steps": 1141, "total_steps": 9134, "loss": 0.6241, "learning_rate": 4.809945545701654e-05, "epoch": 0.12490763294014615, "percentage": 12.49, "elapsed_time": "21:03:25", "remaining_time": "6 days, 3:30:38", "throughput": 2719.91, "total_tokens": 206184832} {"current_steps": 1142, "total_steps": 9134, "loss": 0.6551, "learning_rate": 4.8096165589821404e-05, "epoch": 0.12501710501108404, "percentage": 12.5, "elapsed_time": "21:04:29", "remaining_time": "6 days, 3:29:10", "throughput": 2719.85, "total_tokens": 206352832} {"current_steps": 1143, "total_steps": 9134, "loss": 0.7376, "learning_rate": 4.809287299039403e-05, "epoch": 0.12512657708202196, "percentage": 12.51, "elapsed_time": "21:05:37", "remaining_time": "6 days, 3:28:15", "throughput": 2719.87, "total_tokens": 206538752} {"current_steps": 1144, "total_steps": 9134, "loss": 0.7462, "learning_rate": 4.808957765912393e-05, "epoch": 0.12523604915295986, "percentage": 12.52, "elapsed_time": "21:06:46", "remaining_time": "6 days, 3:27:30", "throughput": 2719.93, "total_tokens": 206732288} {"current_steps": 1145, "total_steps": 9134, "loss": 0.8108, "learning_rate": 4.808627959640093e-05, "epoch": 0.12534552122389775, "percentage": 12.54, "elapsed_time": "21:07:56", "remaining_time": "6 days, 3:26:45", "throughput": 2719.88, "total_tokens": 206917760} {"current_steps": 1146, "total_steps": 9134, "loss": 0.6857, "learning_rate": 4.808297880261518e-05, "epoch": 0.12545499329483564, "percentage": 12.55, "elapsed_time": "21:09:05", "remaining_time": "6 days, 3:25:58", "throughput": 2719.98, "total_tokens": 207113984} {"current_steps": 1147, "total_steps": 9134, "loss": 0.5671, "learning_rate": 4.807967527815718e-05, "epoch": 0.12556446536577356, "percentage": 12.56, "elapsed_time": "21:10:14", "remaining_time": "6 days, 3:25:12", "throughput": 2720.21, "total_tokens": 207319840} {"current_steps": 1148, "total_steps": 9134, "loss": 0.5684, "learning_rate": 4.807636902341771e-05, "epoch": 0.12567393743671146, "percentage": 12.57, "elapsed_time": "21:11:21", "remaining_time": "6 days, 3:24:05", "throughput": 2720.08, "total_tokens": 207490752} {"current_steps": 1149, "total_steps": 9134, "loss": 0.6801, "learning_rate": 4.80730600387879e-05, "epoch": 0.12578340950764935, "percentage": 12.58, "elapsed_time": "21:12:28", "remaining_time": "6 days, 3:23:07", "throughput": 2720.17, "total_tokens": 207681824} {"current_steps": 1150, "total_steps": 9134, "loss": 0.7386, "learning_rate": 4.8069748324659193e-05, "epoch": 0.12589288157858727, "percentage": 12.59, "elapsed_time": "21:13:36", "remaining_time": "6 days, 3:22:06", "throughput": 2720.29, "total_tokens": 207873568} {"current_steps": 1151, "total_steps": 9134, "loss": 0.6109, "learning_rate": 4.8066433881423354e-05, "epoch": 0.12600235364952517, "percentage": 12.6, "elapsed_time": "21:14:41", "remaining_time": "6 days, 3:20:56", "throughput": 2720.07, "total_tokens": 208036192} {"current_steps": 1152, "total_steps": 9134, "loss": 0.6863, "learning_rate": 4.806311670947249e-05, "epoch": 0.12611182572046306, "percentage": 12.61, "elapsed_time": "21:15:44", "remaining_time": "6 days, 3:19:26", "throughput": 2719.83, "total_tokens": 208189184} {"current_steps": 1153, "total_steps": 9134, "loss": 0.6409, "learning_rate": 4.805979680919901e-05, "epoch": 0.12622129779140098, "percentage": 12.62, "elapsed_time": "21:16:52", "remaining_time": "6 days, 3:18:24", "throughput": 2719.55, "total_tokens": 208350688} {"current_steps": 1154, "total_steps": 9134, "loss": 0.5998, "learning_rate": 4.8056474180995645e-05, "epoch": 0.12633076986233888, "percentage": 12.63, "elapsed_time": "21:17:54", "remaining_time": "6 days, 3:16:48", "throughput": 2719.3, "total_tokens": 208500096} {"current_steps": 1155, "total_steps": 9134, "loss": 0.7037, "learning_rate": 4.8053148825255466e-05, "epoch": 0.12644024193327677, "percentage": 12.65, "elapsed_time": "21:19:00", "remaining_time": "6 days, 3:15:42", "throughput": 2719.24, "total_tokens": 208676384} {"current_steps": 1156, "total_steps": 9134, "loss": 0.6879, "learning_rate": 4.804982074237185e-05, "epoch": 0.12654971400421466, "percentage": 12.66, "elapsed_time": "21:20:06", "remaining_time": "6 days, 3:14:28", "throughput": 2719.22, "total_tokens": 208852448} {"current_steps": 1157, "total_steps": 9134, "loss": 0.6181, "learning_rate": 4.8046489932738504e-05, "epoch": 0.12665918607515259, "percentage": 12.67, "elapsed_time": "21:21:11", "remaining_time": "6 days, 3:13:17", "throughput": 2719.16, "total_tokens": 209027168} {"current_steps": 1158, "total_steps": 9134, "loss": 1.3005, "learning_rate": 4.8043156396749454e-05, "epoch": 0.12676865814609048, "percentage": 12.68, "elapsed_time": "21:22:17", "remaining_time": "6 days, 3:12:02", "throughput": 2719.15, "total_tokens": 209203008} {"current_steps": 1159, "total_steps": 9134, "loss": 0.7303, "learning_rate": 4.8039820134799054e-05, "epoch": 0.12687813021702837, "percentage": 12.69, "elapsed_time": "21:23:23", "remaining_time": "6 days, 3:10:55", "throughput": 2719.19, "total_tokens": 209386912} {"current_steps": 1160, "total_steps": 9134, "loss": 0.7447, "learning_rate": 4.8036481147281975e-05, "epoch": 0.1269876022879663, "percentage": 12.7, "elapsed_time": "21:24:30", "remaining_time": "6 days, 3:09:54", "throughput": 2719.42, "total_tokens": 209587840} {"current_steps": 1161, "total_steps": 9134, "loss": 0.693, "learning_rate": 4.8033139434593224e-05, "epoch": 0.1270970743589042, "percentage": 12.71, "elapsed_time": "21:25:34", "remaining_time": "6 days, 3:08:30", "throughput": 2719.26, "total_tokens": 209749120} {"current_steps": 1162, "total_steps": 9134, "loss": 0.9108, "learning_rate": 4.8029794997128096e-05, "epoch": 0.12720654642984208, "percentage": 12.72, "elapsed_time": "21:26:41", "remaining_time": "6 days, 3:07:26", "throughput": 2719.33, "total_tokens": 209935712} {"current_steps": 1163, "total_steps": 9134, "loss": 0.6871, "learning_rate": 4.8026447835282256e-05, "epoch": 0.12731601850077998, "percentage": 12.73, "elapsed_time": "21:27:45", "remaining_time": "6 days, 3:06:01", "throughput": 2719.13, "total_tokens": 210093408} {"current_steps": 1164, "total_steps": 9134, "loss": 0.8759, "learning_rate": 4.802309794945165e-05, "epoch": 0.1274254905717179, "percentage": 12.74, "elapsed_time": "21:28:53", "remaining_time": "6 days, 3:05:10", "throughput": 2719.45, "total_tokens": 210305536} {"current_steps": 1165, "total_steps": 9134, "loss": 0.7458, "learning_rate": 4.8019745340032574e-05, "epoch": 0.1275349626426558, "percentage": 12.75, "elapsed_time": "21:30:02", "remaining_time": "6 days, 3:04:22", "throughput": 2719.62, "total_tokens": 210506240} {"current_steps": 1166, "total_steps": 9134, "loss": 0.7389, "learning_rate": 4.801639000742163e-05, "epoch": 0.12764443471359369, "percentage": 12.77, "elapsed_time": "21:31:09", "remaining_time": "6 days, 3:03:17", "throughput": 2719.75, "total_tokens": 210697760} {"current_steps": 1167, "total_steps": 9134, "loss": 0.7821, "learning_rate": 4.801303195201574e-05, "epoch": 0.1277539067845316, "percentage": 12.78, "elapsed_time": "21:32:17", "remaining_time": "6 days, 3:02:19", "throughput": 2719.78, "total_tokens": 210884352} {"current_steps": 1168, "total_steps": 9134, "loss": 0.6153, "learning_rate": 4.8009671174212176e-05, "epoch": 0.1278633788554695, "percentage": 12.79, "elapsed_time": "21:33:16", "remaining_time": "6 days, 3:00:23", "throughput": 2719.49, "total_tokens": 211022336} {"current_steps": 1169, "total_steps": 9134, "loss": 0.6053, "learning_rate": 4.8006307674408494e-05, "epoch": 0.1279728509264074, "percentage": 12.8, "elapsed_time": "21:34:21", "remaining_time": "6 days, 2:59:07", "throughput": 2719.4, "total_tokens": 211192352} {"current_steps": 1170, "total_steps": 9134, "loss": 0.7252, "learning_rate": 4.800294145300259e-05, "epoch": 0.12808232299734532, "percentage": 12.81, "elapsed_time": "21:35:26", "remaining_time": "6 days, 2:57:48", "throughput": 2719.55, "total_tokens": 211379840} {"current_steps": 1171, "total_steps": 9134, "loss": 0.8351, "learning_rate": 4.799957251039269e-05, "epoch": 0.1281917950682832, "percentage": 12.82, "elapsed_time": "21:36:35", "remaining_time": "6 days, 2:57:02", "throughput": 2719.53, "total_tokens": 211567328} {"current_steps": 1172, "total_steps": 9134, "loss": 0.697, "learning_rate": 4.799620084697732e-05, "epoch": 0.1283012671392211, "percentage": 12.83, "elapsed_time": "21:37:42", "remaining_time": "6 days, 2:55:57", "throughput": 2719.61, "total_tokens": 211754592} {"current_steps": 1173, "total_steps": 9134, "loss": 0.8519, "learning_rate": 4.799282646315537e-05, "epoch": 0.128410739210159, "percentage": 12.84, "elapsed_time": "21:38:50", "remaining_time": "6 days, 2:55:05", "throughput": 2719.81, "total_tokens": 211957088} {"current_steps": 1174, "total_steps": 9134, "loss": 0.7239, "learning_rate": 4.798944935932599e-05, "epoch": 0.12852021128109692, "percentage": 12.85, "elapsed_time": "21:39:58", "remaining_time": "6 days, 2:54:07", "throughput": 2719.79, "total_tokens": 212139648} {"current_steps": 1175, "total_steps": 9134, "loss": 0.7863, "learning_rate": 4.798606953588871e-05, "epoch": 0.1286296833520348, "percentage": 12.86, "elapsed_time": "21:41:07", "remaining_time": "6 days, 2:53:19", "throughput": 2719.92, "total_tokens": 212337440} {"current_steps": 1176, "total_steps": 9134, "loss": 0.7712, "learning_rate": 4.7982686993243335e-05, "epoch": 0.1287391554229727, "percentage": 12.87, "elapsed_time": "21:42:13", "remaining_time": "6 days, 2:52:11", "throughput": 2719.86, "total_tokens": 212512384} {"current_steps": 1177, "total_steps": 9134, "loss": 0.8943, "learning_rate": 4.797930173179003e-05, "epoch": 0.12884862749391063, "percentage": 12.89, "elapsed_time": "21:43:22", "remaining_time": "6 days, 2:51:19", "throughput": 2719.9, "total_tokens": 212702784} {"current_steps": 1178, "total_steps": 9134, "loss": 0.6998, "learning_rate": 4.797591375192926e-05, "epoch": 0.12895809956484852, "percentage": 12.9, "elapsed_time": "21:44:28", "remaining_time": "6 days, 2:50:10", "throughput": 2719.86, "total_tokens": 212879296} {"current_steps": 1179, "total_steps": 9134, "loss": 0.7541, "learning_rate": 4.7972523054061815e-05, "epoch": 0.12906757163578642, "percentage": 12.91, "elapsed_time": "21:45:33", "remaining_time": "6 days, 2:48:52", "throughput": 2719.82, "total_tokens": 213052000} {"current_steps": 1180, "total_steps": 9134, "loss": 0.6441, "learning_rate": 4.7969129638588805e-05, "epoch": 0.1291770437067243, "percentage": 12.92, "elapsed_time": "21:46:38", "remaining_time": "6 days, 2:47:35", "throughput": 2719.86, "total_tokens": 213231872} {"current_steps": 1181, "total_steps": 9134, "loss": 0.6092, "learning_rate": 4.796573350591167e-05, "epoch": 0.12928651577766223, "percentage": 12.93, "elapsed_time": "21:47:45", "remaining_time": "6 days, 2:46:33", "throughput": 2720.09, "total_tokens": 213431904} {"current_steps": 1182, "total_steps": 9134, "loss": 0.6959, "learning_rate": 4.796233465643216e-05, "epoch": 0.12939598784860012, "percentage": 12.94, "elapsed_time": "21:48:51", "remaining_time": "6 days, 2:45:25", "throughput": 2720.19, "total_tokens": 213620288} {"current_steps": 1183, "total_steps": 9134, "loss": 0.6207, "learning_rate": 4.7958933090552365e-05, "epoch": 0.12950545991953802, "percentage": 12.95, "elapsed_time": "21:50:00", "remaining_time": "6 days, 2:44:37", "throughput": 2719.97, "total_tokens": 213790752} {"current_steps": 1184, "total_steps": 9134, "loss": 0.8396, "learning_rate": 4.795552880867467e-05, "epoch": 0.12961493199047594, "percentage": 12.96, "elapsed_time": "21:51:09", "remaining_time": "6 days, 2:43:48", "throughput": 2720.35, "total_tokens": 214008256} {"current_steps": 1185, "total_steps": 9134, "loss": 0.5226, "learning_rate": 4.795212181120181e-05, "epoch": 0.12972440406141383, "percentage": 12.97, "elapsed_time": "21:52:18", "remaining_time": "6 days, 2:43:01", "throughput": 2720.53, "total_tokens": 214210976} {"current_steps": 1186, "total_steps": 9134, "loss": 0.8702, "learning_rate": 4.79487120985368e-05, "epoch": 0.12983387613235173, "percentage": 12.98, "elapsed_time": "21:53:26", "remaining_time": "6 days, 2:42:02", "throughput": 2720.56, "total_tokens": 214397344} {"current_steps": 1187, "total_steps": 9134, "loss": 0.8755, "learning_rate": 4.7945299671083036e-05, "epoch": 0.12994334820328965, "percentage": 13.0, "elapsed_time": "21:54:33", "remaining_time": "6 days, 2:41:03", "throughput": 2720.66, "total_tokens": 214589088} {"current_steps": 1188, "total_steps": 9134, "loss": 0.8339, "learning_rate": 4.7941884529244175e-05, "epoch": 0.13005282027422754, "percentage": 13.01, "elapsed_time": "21:55:39", "remaining_time": "6 days, 2:39:50", "throughput": 2720.74, "total_tokens": 214773888} {"current_steps": 1189, "total_steps": 9134, "loss": 0.7587, "learning_rate": 4.793846667342423e-05, "epoch": 0.13016229234516544, "percentage": 13.02, "elapsed_time": "21:56:44", "remaining_time": "6 days, 2:38:34", "throughput": 2720.81, "total_tokens": 214955552} {"current_steps": 1190, "total_steps": 9134, "loss": 0.7152, "learning_rate": 4.793504610402754e-05, "epoch": 0.13027176441610333, "percentage": 13.03, "elapsed_time": "21:57:50", "remaining_time": "6 days, 2:37:28", "throughput": 2720.66, "total_tokens": 215124896} {"current_steps": 1191, "total_steps": 9134, "loss": 0.717, "learning_rate": 4.7931622821458726e-05, "epoch": 0.13038123648704125, "percentage": 13.04, "elapsed_time": "21:58:57", "remaining_time": "6 days, 2:36:20", "throughput": 2720.69, "total_tokens": 215307904} {"current_steps": 1192, "total_steps": 9134, "loss": 0.8882, "learning_rate": 4.7928196826122775e-05, "epoch": 0.13049070855797915, "percentage": 13.05, "elapsed_time": "22:00:02", "remaining_time": "6 days, 2:35:08", "throughput": 2720.55, "total_tokens": 215475456} {"current_steps": 1193, "total_steps": 9134, "loss": 0.7955, "learning_rate": 4.7924768118424975e-05, "epoch": 0.13060018062891704, "percentage": 13.06, "elapsed_time": "22:01:11", "remaining_time": "6 days, 2:34:16", "throughput": 2720.61, "total_tokens": 215666528} {"current_steps": 1194, "total_steps": 9134, "loss": 0.9059, "learning_rate": 4.7921336698770926e-05, "epoch": 0.13070965269985496, "percentage": 13.07, "elapsed_time": "22:02:19", "remaining_time": "6 days, 2:33:21", "throughput": 2720.86, "total_tokens": 215871712} {"current_steps": 1195, "total_steps": 9134, "loss": 0.7021, "learning_rate": 4.791790256756657e-05, "epoch": 0.13081912477079286, "percentage": 13.08, "elapsed_time": "22:03:28", "remaining_time": "6 days, 2:32:28", "throughput": 2721.1, "total_tokens": 216077568} {"current_steps": 1196, "total_steps": 9134, "loss": 0.7179, "learning_rate": 4.791446572521815e-05, "epoch": 0.13092859684173075, "percentage": 13.09, "elapsed_time": "22:04:33", "remaining_time": "6 days, 2:31:13", "throughput": 2720.91, "total_tokens": 216239744} {"current_steps": 1197, "total_steps": 9134, "loss": 0.7936, "learning_rate": 4.791102617213223e-05, "epoch": 0.13103806891266864, "percentage": 13.1, "elapsed_time": "22:05:42", "remaining_time": "6 days, 2:30:25", "throughput": 2721.01, "total_tokens": 216435744} {"current_steps": 1198, "total_steps": 9134, "loss": 0.5434, "learning_rate": 4.7907583908715725e-05, "epoch": 0.13114754098360656, "percentage": 13.12, "elapsed_time": "22:06:45", "remaining_time": "6 days, 2:28:53", "throughput": 2720.66, "total_tokens": 216578208} {"current_steps": 1199, "total_steps": 9134, "loss": 0.7392, "learning_rate": 4.790413893537583e-05, "epoch": 0.13125701305454446, "percentage": 13.13, "elapsed_time": "22:07:52", "remaining_time": "6 days, 2:27:50", "throughput": 2720.6, "total_tokens": 216755840} {"current_steps": 1200, "total_steps": 9134, "loss": 0.8309, "learning_rate": 4.790069125252009e-05, "epoch": 0.13136648512548235, "percentage": 13.14, "elapsed_time": "22:09:01", "remaining_time": "6 days, 2:27:03", "throughput": 2720.86, "total_tokens": 216965504} {"current_steps": 1201, "total_steps": 9134, "loss": 0.7778, "learning_rate": 4.7897240860556345e-05, "epoch": 0.13147595719642027, "percentage": 13.15, "elapsed_time": "22:10:10", "remaining_time": "6 days, 2:26:13", "throughput": 2720.96, "total_tokens": 217160832} {"current_steps": 1202, "total_steps": 9134, "loss": 0.6507, "learning_rate": 4.789378775989278e-05, "epoch": 0.13158542926735817, "percentage": 13.16, "elapsed_time": "22:11:14", "remaining_time": "6 days, 2:24:52", "throughput": 2720.96, "total_tokens": 217335552} {"current_steps": 1203, "total_steps": 9134, "loss": 0.6143, "learning_rate": 4.789033195093789e-05, "epoch": 0.13169490133829606, "percentage": 13.17, "elapsed_time": "22:12:20", "remaining_time": "6 days, 2:23:40", "throughput": 2720.97, "total_tokens": 217514752} {"current_steps": 1204, "total_steps": 9134, "loss": 0.6973, "learning_rate": 4.7886873434100486e-05, "epoch": 0.13180437340923398, "percentage": 13.18, "elapsed_time": "22:13:23", "remaining_time": "6 days, 2:22:15", "throughput": 2720.85, "total_tokens": 217678272} {"current_steps": 1205, "total_steps": 9134, "loss": 0.6889, "learning_rate": 4.7883412209789714e-05, "epoch": 0.13191384548017188, "percentage": 13.19, "elapsed_time": "22:14:33", "remaining_time": "6 days, 2:21:28", "throughput": 2720.75, "total_tokens": 217859488} {"current_steps": 1206, "total_steps": 9134, "loss": 0.6443, "learning_rate": 4.787994827841502e-05, "epoch": 0.13202331755110977, "percentage": 13.2, "elapsed_time": "22:15:39", "remaining_time": "6 days, 2:20:18", "throughput": 2720.64, "total_tokens": 218029504} {"current_steps": 1207, "total_steps": 9134, "loss": 0.8995, "learning_rate": 4.7876481640386184e-05, "epoch": 0.13213278962204766, "percentage": 13.21, "elapsed_time": "22:16:48", "remaining_time": "6 days, 2:19:31", "throughput": 2720.95, "total_tokens": 218243424} {"current_steps": 1208, "total_steps": 9134, "loss": 0.7954, "learning_rate": 4.78730122961133e-05, "epoch": 0.13224226169298559, "percentage": 13.23, "elapsed_time": "22:17:54", "remaining_time": "6 days, 2:18:18", "throughput": 2720.79, "total_tokens": 218408512} {"current_steps": 1209, "total_steps": 9134, "loss": 0.5628, "learning_rate": 4.78695402460068e-05, "epoch": 0.13235173376392348, "percentage": 13.24, "elapsed_time": "22:19:00", "remaining_time": "6 days, 2:17:11", "throughput": 2720.8, "total_tokens": 218589728} {"current_steps": 1210, "total_steps": 9134, "loss": 0.6415, "learning_rate": 4.7866065490477386e-05, "epoch": 0.13246120583486137, "percentage": 13.25, "elapsed_time": "22:20:06", "remaining_time": "6 days, 2:16:02", "throughput": 2720.68, "total_tokens": 218760416} {"current_steps": 1211, "total_steps": 9134, "loss": 0.8429, "learning_rate": 4.786258802993615e-05, "epoch": 0.1325706779057993, "percentage": 13.26, "elapsed_time": "22:21:15", "remaining_time": "6 days, 2:15:15", "throughput": 2720.74, "total_tokens": 218953952} {"current_steps": 1212, "total_steps": 9134, "loss": 0.8278, "learning_rate": 4.785910786479445e-05, "epoch": 0.1326801499767372, "percentage": 13.27, "elapsed_time": "22:22:24", "remaining_time": "6 days, 2:14:22", "throughput": 2720.52, "total_tokens": 219122176} {"current_steps": 1213, "total_steps": 9134, "loss": 0.6846, "learning_rate": 4.7855624995464e-05, "epoch": 0.13278962204767508, "percentage": 13.28, "elapsed_time": "22:23:33", "remaining_time": "6 days, 2:13:30", "throughput": 2720.44, "total_tokens": 219303168} {"current_steps": 1214, "total_steps": 9134, "loss": 0.6599, "learning_rate": 4.785213942235679e-05, "epoch": 0.13289909411861298, "percentage": 13.29, "elapsed_time": "22:24:42", "remaining_time": "6 days, 2:12:41", "throughput": 2720.7, "total_tokens": 219511712} {"current_steps": 1215, "total_steps": 9134, "loss": 0.668, "learning_rate": 4.784865114588518e-05, "epoch": 0.1330085661895509, "percentage": 13.3, "elapsed_time": "22:25:49", "remaining_time": "6 days, 2:11:39", "throughput": 2720.71, "total_tokens": 219695168} {"current_steps": 1216, "total_steps": 9134, "loss": 0.7701, "learning_rate": 4.784516016646182e-05, "epoch": 0.1331180382604888, "percentage": 13.31, "elapsed_time": "22:26:49", "remaining_time": "6 days, 2:09:53", "throughput": 2720.41, "total_tokens": 219835616} {"current_steps": 1217, "total_steps": 9134, "loss": 0.7214, "learning_rate": 4.784166648449969e-05, "epoch": 0.13322751033142669, "percentage": 13.32, "elapsed_time": "22:27:52", "remaining_time": "6 days, 2:08:25", "throughput": 2720.44, "total_tokens": 220009440} {"current_steps": 1218, "total_steps": 9134, "loss": 0.7259, "learning_rate": 4.783817010041207e-05, "epoch": 0.1333369824023646, "percentage": 13.33, "elapsed_time": "22:29:00", "remaining_time": "6 days, 2:07:27", "throughput": 2720.42, "total_tokens": 220192000} {"current_steps": 1219, "total_steps": 9134, "loss": 0.71, "learning_rate": 4.783467101461259e-05, "epoch": 0.1334464544733025, "percentage": 13.35, "elapsed_time": "22:30:09", "remaining_time": "6 days, 2:06:40", "throughput": 2720.49, "total_tokens": 220387104} {"current_steps": 1220, "total_steps": 9134, "loss": 0.7189, "learning_rate": 4.783116922751518e-05, "epoch": 0.1335559265442404, "percentage": 13.36, "elapsed_time": "22:31:16", "remaining_time": "6 days, 2:05:34", "throughput": 2720.3, "total_tokens": 220552864} {"current_steps": 1221, "total_steps": 9134, "loss": 0.6644, "learning_rate": 4.78276647395341e-05, "epoch": 0.13366539861517832, "percentage": 13.37, "elapsed_time": "22:32:24", "remaining_time": "6 days, 2:04:39", "throughput": 2720.36, "total_tokens": 220743264} {"current_steps": 1222, "total_steps": 9134, "loss": 0.7144, "learning_rate": 4.782415755108392e-05, "epoch": 0.1337748706861162, "percentage": 13.38, "elapsed_time": "22:33:32", "remaining_time": "6 days, 2:03:44", "throughput": 2720.21, "total_tokens": 220916192} {"current_steps": 1223, "total_steps": 9134, "loss": 0.6621, "learning_rate": 4.782064766257953e-05, "epoch": 0.1338843427570541, "percentage": 13.39, "elapsed_time": "22:34:39", "remaining_time": "6 days, 2:02:38", "throughput": 2720.21, "total_tokens": 221097408} {"current_steps": 1224, "total_steps": 9134, "loss": 0.8934, "learning_rate": 4.781713507443615e-05, "epoch": 0.133993814827992, "percentage": 13.4, "elapsed_time": "22:35:48", "remaining_time": "6 days, 2:01:51", "throughput": 2720.5, "total_tokens": 221309984} {"current_steps": 1225, "total_steps": 9134, "loss": 0.7203, "learning_rate": 4.7813619787069314e-05, "epoch": 0.13410328689892992, "percentage": 13.41, "elapsed_time": "22:36:56", "remaining_time": "6 days, 2:00:50", "throughput": 2720.58, "total_tokens": 221499488} {"current_steps": 1226, "total_steps": 9134, "loss": 0.6175, "learning_rate": 4.781010180089487e-05, "epoch": 0.1342127589698678, "percentage": 13.42, "elapsed_time": "22:37:55", "remaining_time": "6 days, 1:58:59", "throughput": 2720.28, "total_tokens": 221637248} {"current_steps": 1227, "total_steps": 9134, "loss": 0.7926, "learning_rate": 4.7806581116328976e-05, "epoch": 0.1343222310408057, "percentage": 13.43, "elapsed_time": "22:39:04", "remaining_time": "6 days, 1:58:09", "throughput": 2720.53, "total_tokens": 221845120} {"current_steps": 1228, "total_steps": 9134, "loss": 0.7109, "learning_rate": 4.780305773378815e-05, "epoch": 0.13443170311174363, "percentage": 13.44, "elapsed_time": "22:40:09", "remaining_time": "6 days, 1:56:51", "throughput": 2720.74, "total_tokens": 222038208} {"current_steps": 1229, "total_steps": 9134, "loss": 0.6611, "learning_rate": 4.779953165368917e-05, "epoch": 0.13454117518268152, "percentage": 13.46, "elapsed_time": "22:41:16", "remaining_time": "6 days, 1:55:49", "throughput": 2720.52, "total_tokens": 222203072} {"current_steps": 1230, "total_steps": 9134, "loss": 0.7126, "learning_rate": 4.779600287644919e-05, "epoch": 0.13465064725361942, "percentage": 13.47, "elapsed_time": "22:42:24", "remaining_time": "6 days, 1:54:50", "throughput": 2720.65, "total_tokens": 222397728} {"current_steps": 1231, "total_steps": 9134, "loss": 0.7454, "learning_rate": 4.779247140248565e-05, "epoch": 0.1347601193245573, "percentage": 13.48, "elapsed_time": "22:43:30", "remaining_time": "6 days, 1:53:41", "throughput": 2720.54, "total_tokens": 222568640} {"current_steps": 1232, "total_steps": 9134, "loss": 0.8002, "learning_rate": 4.778893723221631e-05, "epoch": 0.13486959139549523, "percentage": 13.49, "elapsed_time": "22:44:37", "remaining_time": "6 days, 1:52:40", "throughput": 2720.45, "total_tokens": 222744480} {"current_steps": 1233, "total_steps": 9134, "loss": 0.6589, "learning_rate": 4.7785400366059266e-05, "epoch": 0.13497906346643312, "percentage": 13.5, "elapsed_time": "22:45:43", "remaining_time": "6 days, 1:51:30", "throughput": 2720.16, "total_tokens": 222900160} {"current_steps": 1234, "total_steps": 9134, "loss": 0.616, "learning_rate": 4.778186080443291e-05, "epoch": 0.13508853553737102, "percentage": 13.51, "elapsed_time": "22:46:51", "remaining_time": "6 days, 1:50:32", "throughput": 2720.04, "total_tokens": 223074208} {"current_steps": 1235, "total_steps": 9134, "loss": 0.6828, "learning_rate": 4.777831854775598e-05, "epoch": 0.13519800760830894, "percentage": 13.52, "elapsed_time": "22:47:58", "remaining_time": "6 days, 1:49:27", "throughput": 2719.74, "total_tokens": 223231008} {"current_steps": 1236, "total_steps": 9134, "loss": 0.8746, "learning_rate": 4.777477359644751e-05, "epoch": 0.13530747967924683, "percentage": 13.53, "elapsed_time": "22:49:03", "remaining_time": "6 days, 1:48:15", "throughput": 2719.62, "total_tokens": 223399680} {"current_steps": 1237, "total_steps": 9134, "loss": 0.6213, "learning_rate": 4.7771225950926854e-05, "epoch": 0.13541695175018473, "percentage": 13.54, "elapsed_time": "22:50:09", "remaining_time": "6 days, 1:47:04", "throughput": 2719.66, "total_tokens": 223582016} {"current_steps": 1238, "total_steps": 9134, "loss": 0.7855, "learning_rate": 4.7767675611613704e-05, "epoch": 0.13552642382112265, "percentage": 13.55, "elapsed_time": "22:51:15", "remaining_time": "6 days, 1:45:57", "throughput": 2719.69, "total_tokens": 223764576} {"current_steps": 1239, "total_steps": 9134, "loss": 0.7594, "learning_rate": 4.776412257892805e-05, "epoch": 0.13563589589206054, "percentage": 13.56, "elapsed_time": "22:52:20", "remaining_time": "6 days, 1:44:42", "throughput": 2719.64, "total_tokens": 223937280} {"current_steps": 1240, "total_steps": 9134, "loss": 0.6476, "learning_rate": 4.7760566853290215e-05, "epoch": 0.13574536796299844, "percentage": 13.58, "elapsed_time": "22:53:30", "remaining_time": "6 days, 1:43:55", "throughput": 2720.02, "total_tokens": 224157920} {"current_steps": 1241, "total_steps": 9134, "loss": 0.6917, "learning_rate": 4.775700843512084e-05, "epoch": 0.13585484003393633, "percentage": 13.59, "elapsed_time": "22:54:37", "remaining_time": "6 days, 1:42:52", "throughput": 2719.84, "total_tokens": 224325248} {"current_steps": 1242, "total_steps": 9134, "loss": 0.8417, "learning_rate": 4.775344732484086e-05, "epoch": 0.13596431210487425, "percentage": 13.6, "elapsed_time": "22:55:46", "remaining_time": "6 days, 1:42:01", "throughput": 2720.02, "total_tokens": 224527296} {"current_steps": 1243, "total_steps": 9134, "loss": 0.6032, "learning_rate": 4.774988352287156e-05, "epoch": 0.13607378417581215, "percentage": 13.61, "elapsed_time": "22:56:53", "remaining_time": "6 days, 1:41:02", "throughput": 2720.05, "total_tokens": 224714112} {"current_steps": 1244, "total_steps": 9134, "loss": 0.6384, "learning_rate": 4.774631702963453e-05, "epoch": 0.13618325624675004, "percentage": 13.62, "elapsed_time": "22:58:03", "remaining_time": "6 days, 1:40:14", "throughput": 2720.08, "total_tokens": 224904960} {"current_steps": 1245, "total_steps": 9134, "loss": 0.8046, "learning_rate": 4.7742747845551685e-05, "epoch": 0.13629272831768796, "percentage": 13.63, "elapsed_time": "22:59:06", "remaining_time": "6 days, 1:38:45", "throughput": 2719.81, "total_tokens": 225053696} {"current_steps": 1246, "total_steps": 9134, "loss": 0.695, "learning_rate": 4.773917597104525e-05, "epoch": 0.13640220038862585, "percentage": 13.64, "elapsed_time": "23:00:12", "remaining_time": "6 days, 1:37:40", "throughput": 2719.85, "total_tokens": 225238944} {"current_steps": 1247, "total_steps": 9134, "loss": 0.6213, "learning_rate": 4.773560140653775e-05, "epoch": 0.13651167245956375, "percentage": 13.65, "elapsed_time": "23:01:18", "remaining_time": "6 days, 1:36:29", "throughput": 2719.83, "total_tokens": 225415680} {"current_steps": 1248, "total_steps": 9134, "loss": 0.7096, "learning_rate": 4.773202415245208e-05, "epoch": 0.13662114453050164, "percentage": 13.66, "elapsed_time": "23:02:23", "remaining_time": "6 days, 1:35:11", "throughput": 2719.78, "total_tokens": 225587040} {"current_steps": 1249, "total_steps": 9134, "loss": 0.5362, "learning_rate": 4.772844420921141e-05, "epoch": 0.13673061660143956, "percentage": 13.67, "elapsed_time": "23:03:26", "remaining_time": "6 days, 1:33:46", "throughput": 2719.67, "total_tokens": 225751680} {"current_steps": 1250, "total_steps": 9134, "loss": 0.5776, "learning_rate": 4.772486157723923e-05, "epoch": 0.13684008867237746, "percentage": 13.69, "elapsed_time": "23:04:34", "remaining_time": "6 days, 1:32:50", "throughput": 2719.88, "total_tokens": 225953728} {"current_steps": 1251, "total_steps": 9134, "loss": 0.801, "learning_rate": 4.772127625695937e-05, "epoch": 0.13694956074331535, "percentage": 13.7, "elapsed_time": "23:05:38", "remaining_time": "6 days, 1:31:23", "throughput": 2719.55, "total_tokens": 226098656} {"current_steps": 1252, "total_steps": 9134, "loss": 0.645, "learning_rate": 4.771768824879597e-05, "epoch": 0.13705903281425327, "percentage": 13.71, "elapsed_time": "23:06:44", "remaining_time": "6 days, 1:30:14", "throughput": 2719.35, "total_tokens": 226261504} {"current_steps": 1253, "total_steps": 9134, "loss": 0.5859, "learning_rate": 4.771409755317348e-05, "epoch": 0.13716850488519117, "percentage": 13.72, "elapsed_time": "23:07:50", "remaining_time": "6 days, 1:29:08", "throughput": 2719.26, "total_tokens": 226434656} {"current_steps": 1254, "total_steps": 9134, "loss": 0.6591, "learning_rate": 4.771050417051667e-05, "epoch": 0.13727797695612906, "percentage": 13.73, "elapsed_time": "23:08:52", "remaining_time": "6 days, 1:27:32", "throughput": 2719.16, "total_tokens": 226594368} {"current_steps": 1255, "total_steps": 9134, "loss": 0.6216, "learning_rate": 4.770690810125062e-05, "epoch": 0.13738744902706698, "percentage": 13.74, "elapsed_time": "23:10:00", "remaining_time": "6 days, 1:26:33", "throughput": 2719.26, "total_tokens": 226786336} {"current_steps": 1256, "total_steps": 9134, "loss": 0.7215, "learning_rate": 4.7703309345800766e-05, "epoch": 0.13749692109800488, "percentage": 13.75, "elapsed_time": "23:11:09", "remaining_time": "6 days, 1:25:45", "throughput": 2719.03, "total_tokens": 226956576} {"current_steps": 1257, "total_steps": 9134, "loss": 0.9164, "learning_rate": 4.769970790459282e-05, "epoch": 0.13760639316894277, "percentage": 13.76, "elapsed_time": "23:12:16", "remaining_time": "6 days, 1:24:43", "throughput": 2719.04, "total_tokens": 227139808} {"current_steps": 1258, "total_steps": 9134, "loss": 0.7662, "learning_rate": 4.769610377805281e-05, "epoch": 0.13771586523988066, "percentage": 13.77, "elapsed_time": "23:13:25", "remaining_time": "6 days, 1:23:50", "throughput": 2719.0, "total_tokens": 227322592} {"current_steps": 1259, "total_steps": 9134, "loss": 0.806, "learning_rate": 4.769249696660711e-05, "epoch": 0.13782533731081859, "percentage": 13.78, "elapsed_time": "23:14:35", "remaining_time": "6 days, 1:23:04", "throughput": 2719.07, "total_tokens": 227517920} {"current_steps": 1260, "total_steps": 9134, "loss": 0.6878, "learning_rate": 4.768888747068241e-05, "epoch": 0.13793480938175648, "percentage": 13.79, "elapsed_time": "23:15:41", "remaining_time": "6 days, 1:21:55", "throughput": 2718.9, "total_tokens": 227684128} {"current_steps": 1261, "total_steps": 9134, "loss": 0.577, "learning_rate": 4.7685275290705686e-05, "epoch": 0.13804428145269437, "percentage": 13.81, "elapsed_time": "23:16:48", "remaining_time": "6 days, 1:20:56", "throughput": 2718.91, "total_tokens": 227868256} {"current_steps": 1262, "total_steps": 9134, "loss": 0.6753, "learning_rate": 4.7681660427104266e-05, "epoch": 0.1381537535236323, "percentage": 13.82, "elapsed_time": "23:17:53", "remaining_time": "6 days, 1:19:37", "throughput": 2718.73, "total_tokens": 228028192} {"current_steps": 1263, "total_steps": 9134, "loss": 0.7942, "learning_rate": 4.7678042880305785e-05, "epoch": 0.1382632255945702, "percentage": 13.83, "elapsed_time": "23:18:59", "remaining_time": "6 days, 1:18:30", "throughput": 2718.73, "total_tokens": 228209184} {"current_steps": 1264, "total_steps": 9134, "loss": 0.6687, "learning_rate": 4.767442265073818e-05, "epoch": 0.13837269766550808, "percentage": 13.84, "elapsed_time": "23:20:04", "remaining_time": "6 days, 1:17:17", "throughput": 2718.43, "total_tokens": 228361504} {"current_steps": 1265, "total_steps": 9134, "loss": 0.6364, "learning_rate": 4.767079973882972e-05, "epoch": 0.13848216973644598, "percentage": 13.85, "elapsed_time": "23:21:12", "remaining_time": "6 days, 1:16:16", "throughput": 2718.28, "total_tokens": 228532416} {"current_steps": 1266, "total_steps": 9134, "loss": 0.7894, "learning_rate": 4.766717414500898e-05, "epoch": 0.1385916418073839, "percentage": 13.86, "elapsed_time": "23:22:19", "remaining_time": "6 days, 1:15:14", "throughput": 2718.15, "total_tokens": 228704224} {"current_steps": 1267, "total_steps": 9134, "loss": 0.6682, "learning_rate": 4.766354586970489e-05, "epoch": 0.1387011138783218, "percentage": 13.87, "elapsed_time": "23:23:28", "remaining_time": "6 days, 1:14:24", "throughput": 2718.14, "total_tokens": 228890368} {"current_steps": 1268, "total_steps": 9134, "loss": 0.6803, "learning_rate": 4.7659914913346634e-05, "epoch": 0.13881058594925968, "percentage": 13.88, "elapsed_time": "23:24:36", "remaining_time": "6 days, 1:13:24", "throughput": 2718.07, "total_tokens": 229068224} {"current_steps": 1269, "total_steps": 9134, "loss": 0.666, "learning_rate": 4.7656281276363765e-05, "epoch": 0.1389200580201976, "percentage": 13.89, "elapsed_time": "23:25:44", "remaining_time": "6 days, 1:12:31", "throughput": 2718.21, "total_tokens": 229266688} {"current_steps": 1270, "total_steps": 9134, "loss": 0.6594, "learning_rate": 4.7652644959186146e-05, "epoch": 0.1390295300911355, "percentage": 13.9, "elapsed_time": "23:26:51", "remaining_time": "6 days, 1:11:23", "throughput": 2718.21, "total_tokens": 229446784} {"current_steps": 1271, "total_steps": 9134, "loss": 0.7602, "learning_rate": 4.764900596224392e-05, "epoch": 0.1391390021620734, "percentage": 13.92, "elapsed_time": "23:27:54", "remaining_time": "6 days, 1:10:01", "throughput": 2717.95, "total_tokens": 229598208} {"current_steps": 1272, "total_steps": 9134, "loss": 0.788, "learning_rate": 4.7645364285967584e-05, "epoch": 0.13924847423301132, "percentage": 13.93, "elapsed_time": "23:29:01", "remaining_time": "6 days, 1:08:54", "throughput": 2718.01, "total_tokens": 229783904} {"current_steps": 1273, "total_steps": 9134, "loss": 0.6389, "learning_rate": 4.764171993078795e-05, "epoch": 0.1393579463039492, "percentage": 13.94, "elapsed_time": "23:30:03", "remaining_time": "6 days, 1:07:23", "throughput": 2717.94, "total_tokens": 229948320} {"current_steps": 1274, "total_steps": 9134, "loss": 0.9654, "learning_rate": 4.763807289713613e-05, "epoch": 0.1394674183748871, "percentage": 13.95, "elapsed_time": "23:31:12", "remaining_time": "6 days, 1:06:30", "throughput": 2717.98, "total_tokens": 230137824} {"current_steps": 1275, "total_steps": 9134, "loss": 0.7913, "learning_rate": 4.763442318544356e-05, "epoch": 0.139576890445825, "percentage": 13.96, "elapsed_time": "23:32:19", "remaining_time": "6 days, 1:05:30", "throughput": 2718.02, "total_tokens": 230325088} {"current_steps": 1276, "total_steps": 9134, "loss": 0.7346, "learning_rate": 4.7630770796142e-05, "epoch": 0.13968636251676292, "percentage": 13.97, "elapsed_time": "23:33:26", "remaining_time": "6 days, 1:04:24", "throughput": 2718.17, "total_tokens": 230518624} {"current_steps": 1277, "total_steps": 9134, "loss": 0.5652, "learning_rate": 4.762711572966352e-05, "epoch": 0.1397958345877008, "percentage": 13.98, "elapsed_time": "23:34:33", "remaining_time": "6 days, 1:03:23", "throughput": 2718.17, "total_tokens": 230701408} {"current_steps": 1278, "total_steps": 9134, "loss": 0.7643, "learning_rate": 4.76234579864405e-05, "epoch": 0.1399053066586387, "percentage": 13.99, "elapsed_time": "23:35:42", "remaining_time": "6 days, 1:02:32", "throughput": 2718.12, "total_tokens": 230885312} {"current_steps": 1279, "total_steps": 9134, "loss": 0.7445, "learning_rate": 4.761979756690565e-05, "epoch": 0.14001477872957663, "percentage": 14.0, "elapsed_time": "23:36:48", "remaining_time": "6 days, 1:01:19", "throughput": 2718.17, "total_tokens": 231066752} {"current_steps": 1280, "total_steps": 9134, "loss": 0.7607, "learning_rate": 4.761613447149199e-05, "epoch": 0.14012425080051452, "percentage": 14.01, "elapsed_time": "23:37:57", "remaining_time": "6 days, 1:00:30", "throughput": 2718.42, "total_tokens": 231277088} {"current_steps": 1281, "total_steps": 9134, "loss": 0.7039, "learning_rate": 4.761246870063286e-05, "epoch": 0.14023372287145242, "percentage": 14.02, "elapsed_time": "23:39:04", "remaining_time": "6 days, 0:59:28", "throughput": 2718.71, "total_tokens": 231484064} {"current_steps": 1282, "total_steps": 9134, "loss": 0.658, "learning_rate": 4.760880025476191e-05, "epoch": 0.1403431949423903, "percentage": 14.04, "elapsed_time": "23:40:07", "remaining_time": "6 days, 0:58:01", "throughput": 2718.65, "total_tokens": 231650496} {"current_steps": 1283, "total_steps": 9134, "loss": 0.7526, "learning_rate": 4.76051291343131e-05, "epoch": 0.14045266701332823, "percentage": 14.05, "elapsed_time": "23:41:15", "remaining_time": "6 days, 0:57:00", "throughput": 2718.74, "total_tokens": 231841344} {"current_steps": 1284, "total_steps": 9134, "loss": 0.7538, "learning_rate": 4.7601455339720736e-05, "epoch": 0.14056213908426612, "percentage": 14.06, "elapsed_time": "23:42:20", "remaining_time": "6 days, 0:55:46", "throughput": 2718.5, "total_tokens": 231998144} {"current_steps": 1285, "total_steps": 9134, "loss": 0.5775, "learning_rate": 4.759777887141941e-05, "epoch": 0.14067161115520402, "percentage": 14.07, "elapsed_time": "23:43:25", "remaining_time": "6 days, 0:54:29", "throughput": 2718.51, "total_tokens": 232174880} {"current_steps": 1286, "total_steps": 9134, "loss": 0.6722, "learning_rate": 4.7594099729844045e-05, "epoch": 0.14078108322614194, "percentage": 14.08, "elapsed_time": "23:44:31", "remaining_time": "6 days, 0:53:21", "throughput": 2718.26, "total_tokens": 232333696} {"current_steps": 1287, "total_steps": 9134, "loss": 0.6954, "learning_rate": 4.759041791542987e-05, "epoch": 0.14089055529707983, "percentage": 14.09, "elapsed_time": "23:45:41", "remaining_time": "6 days, 0:52:35", "throughput": 2718.31, "total_tokens": 232527680} {"current_steps": 1288, "total_steps": 9134, "loss": 0.637, "learning_rate": 4.7586733428612454e-05, "epoch": 0.14100002736801773, "percentage": 14.1, "elapsed_time": "23:46:50", "remaining_time": "6 days, 0:51:43", "throughput": 2718.54, "total_tokens": 232734432} {"current_steps": 1289, "total_steps": 9134, "loss": 0.6359, "learning_rate": 4.758304626982764e-05, "epoch": 0.14110949943895565, "percentage": 14.11, "elapsed_time": "23:47:59", "remaining_time": "6 days, 0:50:55", "throughput": 2718.72, "total_tokens": 232939168} {"current_steps": 1290, "total_steps": 9134, "loss": 0.7564, "learning_rate": 4.757935643951163e-05, "epoch": 0.14121897150989354, "percentage": 14.12, "elapsed_time": "23:49:05", "remaining_time": "6 days, 0:49:42", "throughput": 2718.56, "total_tokens": 233103136} {"current_steps": 1291, "total_steps": 9134, "loss": 0.9284, "learning_rate": 4.757566393810091e-05, "epoch": 0.14132844358083144, "percentage": 14.13, "elapsed_time": "23:50:12", "remaining_time": "6 days, 0:48:43", "throughput": 2718.46, "total_tokens": 233278080} {"current_steps": 1292, "total_steps": 9134, "loss": 0.8183, "learning_rate": 4.75719687660323e-05, "epoch": 0.14143791565176933, "percentage": 14.14, "elapsed_time": "23:51:21", "remaining_time": "6 days, 0:47:51", "throughput": 2718.51, "total_tokens": 233470272} {"current_steps": 1293, "total_steps": 9134, "loss": 0.8962, "learning_rate": 4.756827092374295e-05, "epoch": 0.14154738772270725, "percentage": 14.16, "elapsed_time": "23:52:29", "remaining_time": "6 days, 0:46:52", "throughput": 2718.5, "total_tokens": 233653280} {"current_steps": 1294, "total_steps": 9134, "loss": 0.8683, "learning_rate": 4.7564570411670284e-05, "epoch": 0.14165685979364515, "percentage": 14.17, "elapsed_time": "23:53:38", "remaining_time": "6 days, 0:46:02", "throughput": 2718.41, "total_tokens": 233832704} {"current_steps": 1295, "total_steps": 9134, "loss": 0.6789, "learning_rate": 4.756086723025208e-05, "epoch": 0.14176633186458304, "percentage": 14.18, "elapsed_time": "23:54:47", "remaining_time": "6 days, 0:45:10", "throughput": 2718.42, "total_tokens": 234021088} {"current_steps": 1296, "total_steps": 9134, "loss": 0.764, "learning_rate": 4.755716137992641e-05, "epoch": 0.14187580393552096, "percentage": 14.19, "elapsed_time": "23:55:52", "remaining_time": "6 days, 0:43:58", "throughput": 2718.33, "total_tokens": 234191776} {"current_steps": 1297, "total_steps": 9134, "loss": 0.8036, "learning_rate": 4.755345286113166e-05, "epoch": 0.14198527600645885, "percentage": 14.2, "elapsed_time": "23:56:58", "remaining_time": "6 days, 0:42:46", "throughput": 2718.06, "total_tokens": 234346560} {"current_steps": 1298, "total_steps": 9134, "loss": 0.7765, "learning_rate": 4.7549741674306567e-05, "epoch": 0.14209474807739675, "percentage": 14.21, "elapsed_time": "23:58:04", "remaining_time": "6 days, 0:41:39", "throughput": 2718.1, "total_tokens": 234530464} {"current_steps": 1299, "total_steps": 9134, "loss": 0.7371, "learning_rate": 4.754602781989013e-05, "epoch": 0.14220422014833464, "percentage": 14.22, "elapsed_time": "23:59:10", "remaining_time": "6 days, 0:40:26", "throughput": 2718.11, "total_tokens": 234709440} {"current_steps": 1300, "total_steps": 9134, "loss": 0.6459, "learning_rate": 4.754231129832171e-05, "epoch": 0.14231369221927256, "percentage": 14.23, "elapsed_time": "1 day, 0:00:15", "remaining_time": "6 days, 0:39:12", "throughput": 2718.1, "total_tokens": 234885504} {"current_steps": 1301, "total_steps": 9134, "loss": 0.8833, "learning_rate": 4.753859211004096e-05, "epoch": 0.14242316429021046, "percentage": 14.24, "elapsed_time": "1 day, 0:01:24", "remaining_time": "6 days, 0:38:23", "throughput": 2718.19, "total_tokens": 235082624} {"current_steps": 1302, "total_steps": 9134, "loss": 0.722, "learning_rate": 4.753487025548784e-05, "epoch": 0.14253263636114835, "percentage": 14.25, "elapsed_time": "1 day, 0:02:32", "remaining_time": "6 days, 0:37:22", "throughput": 2718.11, "total_tokens": 235257792} {"current_steps": 1303, "total_steps": 9134, "loss": 0.8241, "learning_rate": 4.753114573510265e-05, "epoch": 0.14264210843208627, "percentage": 14.27, "elapsed_time": "1 day, 0:03:37", "remaining_time": "6 days, 0:36:07", "throughput": 2717.83, "total_tokens": 235410560} {"current_steps": 1304, "total_steps": 9134, "loss": 0.5141, "learning_rate": 4.7527418549326e-05, "epoch": 0.14275158050302417, "percentage": 14.28, "elapsed_time": "1 day, 0:04:46", "remaining_time": "6 days, 0:35:15", "throughput": 2717.94, "total_tokens": 235607456} {"current_steps": 1305, "total_steps": 9134, "loss": 0.7885, "learning_rate": 4.752368869859879e-05, "epoch": 0.14286105257396206, "percentage": 14.29, "elapsed_time": "1 day, 0:05:55", "remaining_time": "6 days, 0:34:27", "throughput": 2718.0, "total_tokens": 235801440} {"current_steps": 1306, "total_steps": 9134, "loss": 0.7191, "learning_rate": 4.751995618336227e-05, "epoch": 0.14297052464489998, "percentage": 14.3, "elapsed_time": "1 day, 0:07:04", "remaining_time": "6 days, 0:33:36", "throughput": 2718.34, "total_tokens": 236018944} {"current_steps": 1307, "total_steps": 9134, "loss": 0.6686, "learning_rate": 4.751622100405798e-05, "epoch": 0.14307999671583788, "percentage": 14.31, "elapsed_time": "1 day, 0:08:11", "remaining_time": "6 days, 0:32:29", "throughput": 2718.45, "total_tokens": 236209344} {"current_steps": 1308, "total_steps": 9134, "loss": 0.5666, "learning_rate": 4.7512483161127794e-05, "epoch": 0.14318946878677577, "percentage": 14.32, "elapsed_time": "1 day, 0:09:20", "remaining_time": "6 days, 0:31:42", "throughput": 2718.51, "total_tokens": 236404000} {"current_steps": 1309, "total_steps": 9134, "loss": 0.6433, "learning_rate": 4.750874265501389e-05, "epoch": 0.14329894085771366, "percentage": 14.33, "elapsed_time": "1 day, 0:10:28", "remaining_time": "6 days, 0:30:42", "throughput": 2718.4, "total_tokens": 236577600} {"current_steps": 1310, "total_steps": 9134, "loss": 0.7324, "learning_rate": 4.750499948615875e-05, "epoch": 0.14340841292865159, "percentage": 14.34, "elapsed_time": "1 day, 0:11:34", "remaining_time": "6 days, 0:29:35", "throughput": 2718.2, "total_tokens": 236741568} {"current_steps": 1311, "total_steps": 9134, "loss": 0.6275, "learning_rate": 4.750125365500521e-05, "epoch": 0.14351788499958948, "percentage": 14.35, "elapsed_time": "1 day, 0:12:40", "remaining_time": "6 days, 0:28:24", "throughput": 2718.1, "total_tokens": 236910912} {"current_steps": 1312, "total_steps": 9134, "loss": 0.7143, "learning_rate": 4.7497505161996356e-05, "epoch": 0.14362735707052737, "percentage": 14.36, "elapsed_time": "1 day, 0:13:49", "remaining_time": "6 days, 0:27:34", "throughput": 2718.24, "total_tokens": 237111616} {"current_steps": 1313, "total_steps": 9134, "loss": 0.8587, "learning_rate": 4.749375400757566e-05, "epoch": 0.1437368291414653, "percentage": 14.37, "elapsed_time": "1 day, 0:14:55", "remaining_time": "6 days, 0:26:26", "throughput": 2718.06, "total_tokens": 237275584} {"current_steps": 1314, "total_steps": 9134, "loss": 0.6385, "learning_rate": 4.749000019218687e-05, "epoch": 0.1438463012124032, "percentage": 14.39, "elapsed_time": "1 day, 0:16:01", "remaining_time": "6 days, 0:25:15", "throughput": 2717.96, "total_tokens": 237445824} {"current_steps": 1315, "total_steps": 9134, "loss": 0.788, "learning_rate": 4.7486243716274036e-05, "epoch": 0.14395577328334108, "percentage": 14.4, "elapsed_time": "1 day, 0:17:06", "remaining_time": "6 days, 0:23:56", "throughput": 2717.87, "total_tokens": 237612928} {"current_steps": 1316, "total_steps": 9134, "loss": 0.7473, "learning_rate": 4.748248458028157e-05, "epoch": 0.14406524535427898, "percentage": 14.41, "elapsed_time": "1 day, 0:18:13", "remaining_time": "6 days, 0:22:54", "throughput": 2718.01, "total_tokens": 237807584} {"current_steps": 1317, "total_steps": 9134, "loss": 0.6219, "learning_rate": 4.747872278465416e-05, "epoch": 0.1441747174252169, "percentage": 14.42, "elapsed_time": "1 day, 0:19:14", "remaining_time": "6 days, 0:21:14", "throughput": 2717.73, "total_tokens": 237949152} {"current_steps": 1318, "total_steps": 9134, "loss": 0.6392, "learning_rate": 4.7474958329836805e-05, "epoch": 0.1442841894961548, "percentage": 14.43, "elapsed_time": "1 day, 0:20:21", "remaining_time": "6 days, 0:20:12", "throughput": 2717.75, "total_tokens": 238133280} {"current_steps": 1319, "total_steps": 9134, "loss": 0.656, "learning_rate": 4.747119121627485e-05, "epoch": 0.14439366156709268, "percentage": 14.44, "elapsed_time": "1 day, 0:21:27", "remaining_time": "6 days, 0:19:02", "throughput": 2717.93, "total_tokens": 238327936} {"current_steps": 1320, "total_steps": 9134, "loss": 0.7357, "learning_rate": 4.746742144441393e-05, "epoch": 0.1445031336380306, "percentage": 14.45, "elapsed_time": "1 day, 0:22:30", "remaining_time": "6 days, 0:17:37", "throughput": 2717.79, "total_tokens": 238488096} {"current_steps": 1321, "total_steps": 9134, "loss": 0.6705, "learning_rate": 4.7463649014700004e-05, "epoch": 0.1446126057089685, "percentage": 14.46, "elapsed_time": "1 day, 0:23:34", "remaining_time": "6 days, 0:16:16", "throughput": 2717.77, "total_tokens": 238660352} {"current_steps": 1322, "total_steps": 9134, "loss": 0.6446, "learning_rate": 4.7459873927579345e-05, "epoch": 0.1447220777799064, "percentage": 14.47, "elapsed_time": "1 day, 0:24:43", "remaining_time": "6 days, 0:15:21", "throughput": 2717.79, "total_tokens": 238847616} {"current_steps": 1323, "total_steps": 9134, "loss": 0.6836, "learning_rate": 4.745609618349853e-05, "epoch": 0.14483154985084432, "percentage": 14.48, "elapsed_time": "1 day, 0:25:51", "remaining_time": "6 days, 0:14:28", "throughput": 2717.65, "total_tokens": 239023008} {"current_steps": 1324, "total_steps": 9134, "loss": 0.8015, "learning_rate": 4.7452315782904477e-05, "epoch": 0.1449410219217822, "percentage": 14.5, "elapsed_time": "1 day, 0:26:55", "remaining_time": "6 days, 0:13:06", "throughput": 2717.61, "total_tokens": 239192800} {"current_steps": 1325, "total_steps": 9134, "loss": 0.6096, "learning_rate": 4.744853272624438e-05, "epoch": 0.1450504939927201, "percentage": 14.51, "elapsed_time": "1 day, 0:28:04", "remaining_time": "6 days, 0:12:12", "throughput": 2717.6, "total_tokens": 239378048} {"current_steps": 1326, "total_steps": 9134, "loss": 0.7963, "learning_rate": 4.7444747013965776e-05, "epoch": 0.145159966063658, "percentage": 14.52, "elapsed_time": "1 day, 0:29:13", "remaining_time": "6 days, 0:11:24", "throughput": 2717.85, "total_tokens": 239589280} {"current_steps": 1327, "total_steps": 9134, "loss": 0.7845, "learning_rate": 4.744095864651651e-05, "epoch": 0.14526943813459592, "percentage": 14.53, "elapsed_time": "1 day, 0:30:23", "remaining_time": "6 days, 0:10:37", "throughput": 2717.96, "total_tokens": 239787968} {"current_steps": 1328, "total_steps": 9134, "loss": 0.598, "learning_rate": 4.7437167624344736e-05, "epoch": 0.1453789102055338, "percentage": 14.54, "elapsed_time": "1 day, 0:31:27", "remaining_time": "6 days, 0:09:16", "throughput": 2717.86, "total_tokens": 239953952} {"current_steps": 1329, "total_steps": 9134, "loss": 1.0846, "learning_rate": 4.743337394789892e-05, "epoch": 0.1454883822764717, "percentage": 14.55, "elapsed_time": "1 day, 0:32:37", "remaining_time": "6 days, 0:08:28", "throughput": 2717.97, "total_tokens": 240152640} {"current_steps": 1330, "total_steps": 9134, "loss": 0.5813, "learning_rate": 4.7429577617627864e-05, "epoch": 0.14559785434740963, "percentage": 14.56, "elapsed_time": "1 day, 0:33:46", "remaining_time": "6 days, 0:07:37", "throughput": 2718.19, "total_tokens": 240359616} {"current_steps": 1331, "total_steps": 9134, "loss": 0.7968, "learning_rate": 4.7425778633980636e-05, "epoch": 0.14570732641834752, "percentage": 14.57, "elapsed_time": "1 day, 0:34:52", "remaining_time": "6 days, 0:06:29", "throughput": 2718.16, "total_tokens": 240537696} {"current_steps": 1332, "total_steps": 9134, "loss": 0.8136, "learning_rate": 4.742197699740668e-05, "epoch": 0.14581679848928542, "percentage": 14.58, "elapsed_time": "1 day, 0:36:00", "remaining_time": "6 days, 0:05:31", "throughput": 2718.28, "total_tokens": 240732800} {"current_steps": 1333, "total_steps": 9134, "loss": 0.6057, "learning_rate": 4.74181727083557e-05, "epoch": 0.14592627056022334, "percentage": 14.59, "elapsed_time": "1 day, 0:37:08", "remaining_time": "6 days, 0:04:30", "throughput": 2718.23, "total_tokens": 240911776} {"current_steps": 1334, "total_steps": 9134, "loss": 0.756, "learning_rate": 4.741436576727775e-05, "epoch": 0.14603574263116123, "percentage": 14.6, "elapsed_time": "1 day, 0:38:17", "remaining_time": "6 days, 0:03:42", "throughput": 2718.43, "total_tokens": 241118304} {"current_steps": 1335, "total_steps": 9134, "loss": 0.8881, "learning_rate": 4.741055617462318e-05, "epoch": 0.14614521470209912, "percentage": 14.62, "elapsed_time": "1 day, 0:39:23", "remaining_time": "6 days, 0:02:29", "throughput": 2718.49, "total_tokens": 241301760} {"current_steps": 1336, "total_steps": 9134, "loss": 0.6046, "learning_rate": 4.7406743930842655e-05, "epoch": 0.14625468677303702, "percentage": 14.63, "elapsed_time": "1 day, 0:40:27", "remaining_time": "6 days, 0:01:11", "throughput": 2718.43, "total_tokens": 241471776} {"current_steps": 1337, "total_steps": 9134, "loss": 0.6165, "learning_rate": 4.740292903638716e-05, "epoch": 0.14636415884397494, "percentage": 14.64, "elapsed_time": "1 day, 0:41:30", "remaining_time": "5 days, 23:59:41", "throughput": 2718.3, "total_tokens": 241629920} {"current_steps": 1338, "total_steps": 9134, "loss": 0.772, "learning_rate": 4.739911149170798e-05, "epoch": 0.14647363091491283, "percentage": 14.65, "elapsed_time": "1 day, 0:42:36", "remaining_time": "5 days, 23:58:32", "throughput": 2718.31, "total_tokens": 241810464} {"current_steps": 1339, "total_steps": 9134, "loss": 0.749, "learning_rate": 4.7395291297256725e-05, "epoch": 0.14658310298585073, "percentage": 14.66, "elapsed_time": "1 day, 0:43:40", "remaining_time": "5 days, 23:57:14", "throughput": 2718.26, "total_tokens": 241981600} {"current_steps": 1340, "total_steps": 9134, "loss": 0.6604, "learning_rate": 4.7391468453485334e-05, "epoch": 0.14669257505678865, "percentage": 14.67, "elapsed_time": "1 day, 0:44:42", "remaining_time": "5 days, 23:55:41", "throughput": 2718.15, "total_tokens": 242140192} {"current_steps": 1341, "total_steps": 9134, "loss": 0.8946, "learning_rate": 4.738764296084603e-05, "epoch": 0.14680204712772654, "percentage": 14.68, "elapsed_time": "1 day, 0:45:47", "remaining_time": "5 days, 23:54:27", "throughput": 2718.08, "total_tokens": 242310656} {"current_steps": 1342, "total_steps": 9134, "loss": 0.6092, "learning_rate": 4.738381481979136e-05, "epoch": 0.14691151919866444, "percentage": 14.69, "elapsed_time": "1 day, 0:46:50", "remaining_time": "5 days, 23:52:58", "throughput": 2717.99, "total_tokens": 242472832} {"current_steps": 1343, "total_steps": 9134, "loss": 0.7997, "learning_rate": 4.7379984030774184e-05, "epoch": 0.14702099126960233, "percentage": 14.7, "elapsed_time": "1 day, 0:47:59", "remaining_time": "5 days, 23:52:08", "throughput": 2718.02, "total_tokens": 242664128} {"current_steps": 1344, "total_steps": 9134, "loss": 0.7865, "learning_rate": 4.737615059424768e-05, "epoch": 0.14713046334054025, "percentage": 14.71, "elapsed_time": "1 day, 0:49:08", "remaining_time": "5 days, 23:51:18", "throughput": 2718.02, "total_tokens": 242851840} {"current_steps": 1345, "total_steps": 9134, "loss": 0.7408, "learning_rate": 4.737231451066534e-05, "epoch": 0.14723993541147815, "percentage": 14.73, "elapsed_time": "1 day, 0:50:18", "remaining_time": "5 days, 23:50:26", "throughput": 2718.24, "total_tokens": 243059488} {"current_steps": 1346, "total_steps": 9134, "loss": 0.8787, "learning_rate": 4.7368475780480956e-05, "epoch": 0.14734940748241604, "percentage": 14.74, "elapsed_time": "1 day, 0:51:24", "remaining_time": "5 days, 23:49:21", "throughput": 2718.16, "total_tokens": 243233760} {"current_steps": 1347, "total_steps": 9134, "loss": 0.7509, "learning_rate": 4.7364634404148655e-05, "epoch": 0.14745887955335396, "percentage": 14.75, "elapsed_time": "1 day, 0:52:28", "remaining_time": "5 days, 23:47:58", "throughput": 2717.89, "total_tokens": 243382048} {"current_steps": 1348, "total_steps": 9134, "loss": 0.7923, "learning_rate": 4.736079038212286e-05, "epoch": 0.14756835162429185, "percentage": 14.76, "elapsed_time": "1 day, 0:53:36", "remaining_time": "5 days, 23:47:02", "throughput": 2718.0, "total_tokens": 243578496} {"current_steps": 1349, "total_steps": 9134, "loss": 0.773, "learning_rate": 4.7356943714858306e-05, "epoch": 0.14767782369522975, "percentage": 14.77, "elapsed_time": "1 day, 0:54:45", "remaining_time": "5 days, 23:46:11", "throughput": 2718.05, "total_tokens": 243770240} {"current_steps": 1350, "total_steps": 9134, "loss": 0.7505, "learning_rate": 4.735309440281005e-05, "epoch": 0.14778729576616767, "percentage": 14.78, "elapsed_time": "1 day, 0:55:50", "remaining_time": "5 days, 23:44:56", "throughput": 2717.98, "total_tokens": 243940704} {"current_steps": 1351, "total_steps": 9134, "loss": 0.9581, "learning_rate": 4.7349242446433464e-05, "epoch": 0.14789676783710556, "percentage": 14.79, "elapsed_time": "1 day, 0:57:00", "remaining_time": "5 days, 23:44:08", "throughput": 2717.98, "total_tokens": 244129760} {"current_steps": 1352, "total_steps": 9134, "loss": 0.8142, "learning_rate": 4.734538784618421e-05, "epoch": 0.14800623990804346, "percentage": 14.8, "elapsed_time": "1 day, 0:58:08", "remaining_time": "5 days, 23:43:10", "throughput": 2718.26, "total_tokens": 244339872} {"current_steps": 1353, "total_steps": 9134, "loss": 0.6503, "learning_rate": 4.734153060251829e-05, "epoch": 0.14811571197898135, "percentage": 14.81, "elapsed_time": "1 day, 0:59:17", "remaining_time": "5 days, 23:42:16", "throughput": 2718.41, "total_tokens": 244539904} {"current_steps": 1354, "total_steps": 9134, "loss": 0.7656, "learning_rate": 4.733767071589202e-05, "epoch": 0.14822518404991927, "percentage": 14.82, "elapsed_time": "1 day, 1:00:26", "remaining_time": "5 days, 23:41:25", "throughput": 2718.56, "total_tokens": 244741952} {"current_steps": 1355, "total_steps": 9134, "loss": 0.5994, "learning_rate": 4.7333808186761996e-05, "epoch": 0.14833465612085717, "percentage": 14.83, "elapsed_time": "1 day, 1:01:28", "remaining_time": "5 days, 23:39:56", "throughput": 2718.46, "total_tokens": 244903456} {"current_steps": 1356, "total_steps": 9134, "loss": 0.8564, "learning_rate": 4.732994301558516e-05, "epoch": 0.14844412819179506, "percentage": 14.85, "elapsed_time": "1 day, 1:02:35", "remaining_time": "5 days, 23:38:51", "throughput": 2718.13, "total_tokens": 245054656} {"current_steps": 1357, "total_steps": 9134, "loss": 0.7511, "learning_rate": 4.7326075202818765e-05, "epoch": 0.14855360026273298, "percentage": 14.86, "elapsed_time": "1 day, 1:03:40", "remaining_time": "5 days, 23:37:33", "throughput": 2718.14, "total_tokens": 245230272} {"current_steps": 1358, "total_steps": 9134, "loss": 0.7001, "learning_rate": 4.7322204748920345e-05, "epoch": 0.14866307233367088, "percentage": 14.87, "elapsed_time": "1 day, 1:04:44", "remaining_time": "5 days, 23:36:16", "throughput": 2718.2, "total_tokens": 245412160} {"current_steps": 1359, "total_steps": 9134, "loss": 0.8003, "learning_rate": 4.731833165434778e-05, "epoch": 0.14877254440460877, "percentage": 14.88, "elapsed_time": "1 day, 1:05:51", "remaining_time": "5 days, 23:35:10", "throughput": 2718.18, "total_tokens": 245590688} {"current_steps": 1360, "total_steps": 9134, "loss": 0.8152, "learning_rate": 4.731445591955924e-05, "epoch": 0.14888201647554666, "percentage": 14.89, "elapsed_time": "1 day, 1:06:59", "remaining_time": "5 days, 23:34:11", "throughput": 2718.29, "total_tokens": 245785120} {"current_steps": 1361, "total_steps": 9134, "loss": 0.6393, "learning_rate": 4.7310577545013224e-05, "epoch": 0.14899148854648459, "percentage": 14.9, "elapsed_time": "1 day, 1:08:05", "remaining_time": "5 days, 23:33:04", "throughput": 2718.12, "total_tokens": 245950656} {"current_steps": 1362, "total_steps": 9134, "loss": 0.7065, "learning_rate": 4.7306696531168535e-05, "epoch": 0.14910096061742248, "percentage": 14.91, "elapsed_time": "1 day, 1:09:05", "remaining_time": "5 days, 23:31:19", "throughput": 2717.93, "total_tokens": 246095808} {"current_steps": 1363, "total_steps": 9134, "loss": 0.7815, "learning_rate": 4.7302812878484294e-05, "epoch": 0.14921043268836037, "percentage": 14.92, "elapsed_time": "1 day, 1:10:13", "remaining_time": "5 days, 23:30:21", "throughput": 2718.17, "total_tokens": 246301888} {"current_steps": 1364, "total_steps": 9134, "loss": 0.7585, "learning_rate": 4.7298926587419924e-05, "epoch": 0.1493199047592983, "percentage": 14.93, "elapsed_time": "1 day, 1:11:16", "remaining_time": "5 days, 23:28:56", "throughput": 2718.14, "total_tokens": 246471008} {"current_steps": 1365, "total_steps": 9134, "loss": 0.6733, "learning_rate": 4.729503765843516e-05, "epoch": 0.1494293768302362, "percentage": 14.94, "elapsed_time": "1 day, 1:12:23", "remaining_time": "5 days, 23:27:51", "throughput": 2717.86, "total_tokens": 246626688} {"current_steps": 1366, "total_steps": 9134, "loss": 0.6085, "learning_rate": 4.7291146091990066e-05, "epoch": 0.14953884890117408, "percentage": 14.96, "elapsed_time": "1 day, 1:13:29", "remaining_time": "5 days, 23:26:42", "throughput": 2717.89, "total_tokens": 246809920} {"current_steps": 1367, "total_steps": 9134, "loss": 0.6327, "learning_rate": 4.7287251888545005e-05, "epoch": 0.149648320972112, "percentage": 14.97, "elapsed_time": "1 day, 1:14:34", "remaining_time": "5 days, 23:25:26", "throughput": 2717.93, "total_tokens": 246989120} {"current_steps": 1368, "total_steps": 9134, "loss": 0.6761, "learning_rate": 4.728335504856065e-05, "epoch": 0.1497577930430499, "percentage": 14.98, "elapsed_time": "1 day, 1:15:40", "remaining_time": "5 days, 23:24:19", "throughput": 2718.1, "total_tokens": 247184672} {"current_steps": 1369, "total_steps": 9134, "loss": 0.5573, "learning_rate": 4.727945557249799e-05, "epoch": 0.1498672651139878, "percentage": 14.99, "elapsed_time": "1 day, 1:16:47", "remaining_time": "5 days, 23:23:14", "throughput": 2718.22, "total_tokens": 247376864} {"current_steps": 1370, "total_steps": 9134, "loss": 0.6686, "learning_rate": 4.727555346081833e-05, "epoch": 0.14997673718492568, "percentage": 15.0, "elapsed_time": "1 day, 1:17:54", "remaining_time": "5 days, 23:22:11", "throughput": 2718.28, "total_tokens": 247565024} {"current_steps": 1371, "total_steps": 9134, "loss": 0.8797, "learning_rate": 4.7271648713983276e-05, "epoch": 0.1500862092558636, "percentage": 15.01, "elapsed_time": "1 day, 1:19:01", "remaining_time": "5 days, 23:21:07", "throughput": 2718.44, "total_tokens": 247761696} {"current_steps": 1372, "total_steps": 9134, "loss": 0.6095, "learning_rate": 4.726774133245476e-05, "epoch": 0.1501956813268015, "percentage": 15.02, "elapsed_time": "1 day, 1:20:06", "remaining_time": "5 days, 23:19:54", "throughput": 2718.22, "total_tokens": 247919168} {"current_steps": 1373, "total_steps": 9134, "loss": 0.8636, "learning_rate": 4.7263831316695005e-05, "epoch": 0.1503051533977394, "percentage": 15.03, "elapsed_time": "1 day, 1:21:13", "remaining_time": "5 days, 23:18:49", "throughput": 2718.28, "total_tokens": 248106432} {"current_steps": 1374, "total_steps": 9134, "loss": 0.7765, "learning_rate": 4.725991866716657e-05, "epoch": 0.15041462546867732, "percentage": 15.04, "elapsed_time": "1 day, 1:22:20", "remaining_time": "5 days, 23:17:46", "throughput": 2718.26, "total_tokens": 248286080} {"current_steps": 1375, "total_steps": 9134, "loss": 0.6218, "learning_rate": 4.7256003384332314e-05, "epoch": 0.1505240975396152, "percentage": 15.05, "elapsed_time": "1 day, 1:23:26", "remaining_time": "5 days, 23:16:39", "throughput": 2718.36, "total_tokens": 248476704} {"current_steps": 1376, "total_steps": 9134, "loss": 0.9153, "learning_rate": 4.72520854686554e-05, "epoch": 0.1506335696105531, "percentage": 15.06, "elapsed_time": "1 day, 1:24:33", "remaining_time": "5 days, 23:15:33", "throughput": 2718.35, "total_tokens": 248655680} {"current_steps": 1377, "total_steps": 9134, "loss": 0.6723, "learning_rate": 4.724816492059932e-05, "epoch": 0.150743041681491, "percentage": 15.08, "elapsed_time": "1 day, 1:25:41", "remaining_time": "5 days, 23:14:36", "throughput": 2718.32, "total_tokens": 248838688} {"current_steps": 1378, "total_steps": 9134, "loss": 0.6343, "learning_rate": 4.724424174062786e-05, "epoch": 0.15085251375242892, "percentage": 15.09, "elapsed_time": "1 day, 1:26:48", "remaining_time": "5 days, 23:13:32", "throughput": 2718.15, "total_tokens": 249004672} {"current_steps": 1379, "total_steps": 9134, "loss": 0.6019, "learning_rate": 4.724031592920512e-05, "epoch": 0.1509619858233668, "percentage": 15.1, "elapsed_time": "1 day, 1:27:50", "remaining_time": "5 days, 23:12:03", "throughput": 2718.11, "total_tokens": 249170880} {"current_steps": 1380, "total_steps": 9134, "loss": 0.7691, "learning_rate": 4.7236387486795525e-05, "epoch": 0.1510714578943047, "percentage": 15.11, "elapsed_time": "1 day, 1:28:57", "remaining_time": "5 days, 23:10:58", "throughput": 2718.19, "total_tokens": 249360160} {"current_steps": 1381, "total_steps": 9134, "loss": 0.6459, "learning_rate": 4.72324564138638e-05, "epoch": 0.15118092996524263, "percentage": 15.12, "elapsed_time": "1 day, 1:30:05", "remaining_time": "5 days, 23:09:57", "throughput": 2718.33, "total_tokens": 249556832} {"current_steps": 1382, "total_steps": 9134, "loss": 0.7898, "learning_rate": 4.722852271087498e-05, "epoch": 0.15129040203618052, "percentage": 15.13, "elapsed_time": "1 day, 1:31:10", "remaining_time": "5 days, 23:08:47", "throughput": 2718.19, "total_tokens": 249722592} {"current_steps": 1383, "total_steps": 9134, "loss": 0.8013, "learning_rate": 4.722458637829442e-05, "epoch": 0.15139987410711842, "percentage": 15.14, "elapsed_time": "1 day, 1:32:18", "remaining_time": "5 days, 23:07:47", "throughput": 2718.09, "total_tokens": 249896864} {"current_steps": 1384, "total_steps": 9134, "loss": 0.6231, "learning_rate": 4.722064741658777e-05, "epoch": 0.15150934617805634, "percentage": 15.15, "elapsed_time": "1 day, 1:33:26", "remaining_time": "5 days, 23:06:52", "throughput": 2718.14, "total_tokens": 250087488} {"current_steps": 1385, "total_steps": 9134, "loss": 0.6553, "learning_rate": 4.721670582622102e-05, "epoch": 0.15161881824899423, "percentage": 15.16, "elapsed_time": "1 day, 1:34:31", "remaining_time": "5 days, 23:05:32", "throughput": 2717.99, "total_tokens": 250248544} {"current_steps": 1386, "total_steps": 9134, "loss": 0.618, "learning_rate": 4.721276160766043e-05, "epoch": 0.15172829031993212, "percentage": 15.17, "elapsed_time": "1 day, 1:35:37", "remaining_time": "5 days, 23:04:26", "throughput": 2717.92, "total_tokens": 250422368} {"current_steps": 1387, "total_steps": 9134, "loss": 0.8347, "learning_rate": 4.720881476137261e-05, "epoch": 0.15183776239087002, "percentage": 15.19, "elapsed_time": "1 day, 1:36:47", "remaining_time": "5 days, 23:03:37", "throughput": 2718.15, "total_tokens": 250632928} {"current_steps": 1388, "total_steps": 9134, "loss": 0.6543, "learning_rate": 4.720486528782447e-05, "epoch": 0.15194723446180794, "percentage": 15.2, "elapsed_time": "1 day, 1:37:53", "remaining_time": "5 days, 23:02:32", "throughput": 2718.22, "total_tokens": 250820416} {"current_steps": 1389, "total_steps": 9134, "loss": 0.8169, "learning_rate": 4.720091318748321e-05, "epoch": 0.15205670653274583, "percentage": 15.21, "elapsed_time": "1 day, 1:38:59", "remaining_time": "5 days, 23:01:20", "throughput": 2718.4, "total_tokens": 251015296} {"current_steps": 1390, "total_steps": 9134, "loss": 0.8252, "learning_rate": 4.7196958460816356e-05, "epoch": 0.15216617860368373, "percentage": 15.22, "elapsed_time": "1 day, 1:40:09", "remaining_time": "5 days, 23:00:32", "throughput": 2718.59, "total_tokens": 251222944} {"current_steps": 1391, "total_steps": 9134, "loss": 0.6979, "learning_rate": 4.719300110829174e-05, "epoch": 0.15227565067462165, "percentage": 15.23, "elapsed_time": "1 day, 1:41:18", "remaining_time": "5 days, 22:59:41", "throughput": 2718.81, "total_tokens": 251431264} {"current_steps": 1392, "total_steps": 9134, "loss": 0.6846, "learning_rate": 4.718904113037754e-05, "epoch": 0.15238512274555954, "percentage": 15.24, "elapsed_time": "1 day, 1:42:25", "remaining_time": "5 days, 22:58:37", "throughput": 2718.73, "total_tokens": 251605760} {"current_steps": 1393, "total_steps": 9134, "loss": 0.7524, "learning_rate": 4.718507852754218e-05, "epoch": 0.15249459481649744, "percentage": 15.25, "elapsed_time": "1 day, 1:43:33", "remaining_time": "5 days, 22:57:39", "throughput": 2718.66, "total_tokens": 251784064} {"current_steps": 1394, "total_steps": 9134, "loss": 0.5712, "learning_rate": 4.718111330025444e-05, "epoch": 0.15260406688743533, "percentage": 15.26, "elapsed_time": "1 day, 1:44:41", "remaining_time": "5 days, 22:56:39", "throughput": 2718.33, "total_tokens": 251938176} {"current_steps": 1395, "total_steps": 9134, "loss": 0.6583, "learning_rate": 4.717714544898341e-05, "epoch": 0.15271353895837325, "percentage": 15.27, "elapsed_time": "1 day, 1:45:43", "remaining_time": "5 days, 22:55:10", "throughput": 2718.21, "total_tokens": 252096992} {"current_steps": 1396, "total_steps": 9134, "loss": 0.8149, "learning_rate": 4.717317497419846e-05, "epoch": 0.15282301102931115, "percentage": 15.28, "elapsed_time": "1 day, 1:46:51", "remaining_time": "5 days, 22:54:12", "throughput": 2718.22, "total_tokens": 252281792} {"current_steps": 1397, "total_steps": 9134, "loss": 0.6314, "learning_rate": 4.7169201876369295e-05, "epoch": 0.15293248310024904, "percentage": 15.29, "elapsed_time": "1 day, 1:47:57", "remaining_time": "5 days, 22:53:01", "throughput": 2717.87, "total_tokens": 252428288} {"current_steps": 1398, "total_steps": 9134, "loss": 0.5287, "learning_rate": 4.7165226155965936e-05, "epoch": 0.15304195517118696, "percentage": 15.31, "elapsed_time": "1 day, 1:48:59", "remaining_time": "5 days, 22:51:30", "throughput": 2717.81, "total_tokens": 252591136} {"current_steps": 1399, "total_steps": 9134, "loss": 0.9543, "learning_rate": 4.7161247813458696e-05, "epoch": 0.15315142724212485, "percentage": 15.32, "elapsed_time": "1 day, 1:50:05", "remaining_time": "5 days, 22:50:20", "throughput": 2717.79, "total_tokens": 252768320} {"current_steps": 1400, "total_steps": 9134, "loss": 0.8586, "learning_rate": 4.71572668493182e-05, "epoch": 0.15326089931306275, "percentage": 15.33, "elapsed_time": "1 day, 1:51:14", "remaining_time": "5 days, 22:49:27", "throughput": 2717.93, "total_tokens": 252968800} {"current_steps": 1401, "total_steps": 9134, "loss": 0.9379, "learning_rate": 4.7153283264015394e-05, "epoch": 0.15337037138400067, "percentage": 15.34, "elapsed_time": "1 day, 1:52:23", "remaining_time": "5 days, 22:48:35", "throughput": 2718.23, "total_tokens": 253184288} {"current_steps": 1402, "total_steps": 9134, "loss": 0.8419, "learning_rate": 4.714929705802153e-05, "epoch": 0.15347984345493856, "percentage": 15.35, "elapsed_time": "1 day, 1:53:29", "remaining_time": "5 days, 22:47:29", "throughput": 2718.19, "total_tokens": 253361696} {"current_steps": 1403, "total_steps": 9134, "loss": 0.7545, "learning_rate": 4.714530823180816e-05, "epoch": 0.15358931552587646, "percentage": 15.36, "elapsed_time": "1 day, 1:54:37", "remaining_time": "5 days, 22:46:28", "throughput": 2718.1, "total_tokens": 253536864} {"current_steps": 1404, "total_steps": 9134, "loss": 0.7545, "learning_rate": 4.7141316785847176e-05, "epoch": 0.15369878759681435, "percentage": 15.37, "elapsed_time": "1 day, 1:55:45", "remaining_time": "5 days, 22:45:31", "throughput": 2718.04, "total_tokens": 253716064} {"current_steps": 1405, "total_steps": 9134, "loss": 0.6513, "learning_rate": 4.713732272061073e-05, "epoch": 0.15380825966775227, "percentage": 15.38, "elapsed_time": "1 day, 1:56:50", "remaining_time": "5 days, 22:44:19", "throughput": 2717.84, "total_tokens": 253875776} {"current_steps": 1406, "total_steps": 9134, "loss": 0.6302, "learning_rate": 4.713332603657133e-05, "epoch": 0.15391773173869017, "percentage": 15.39, "elapsed_time": "1 day, 1:57:55", "remaining_time": "5 days, 22:43:00", "throughput": 2717.75, "total_tokens": 254041760} {"current_steps": 1407, "total_steps": 9134, "loss": 0.6368, "learning_rate": 4.712932673420177e-05, "epoch": 0.15402720380962806, "percentage": 15.4, "elapsed_time": "1 day, 1:59:04", "remaining_time": "5 days, 22:42:08", "throughput": 2717.75, "total_tokens": 254229920} {"current_steps": 1408, "total_steps": 9134, "loss": 0.5526, "learning_rate": 4.7125324813975155e-05, "epoch": 0.15413667588056598, "percentage": 15.41, "elapsed_time": "1 day, 2:00:09", "remaining_time": "5 days, 22:40:53", "throughput": 2717.48, "total_tokens": 254380672} {"current_steps": 1409, "total_steps": 9134, "loss": 0.7591, "learning_rate": 4.712132027636492e-05, "epoch": 0.15424614795150388, "percentage": 15.43, "elapsed_time": "1 day, 2:01:16", "remaining_time": "5 days, 22:39:49", "throughput": 2717.5, "total_tokens": 254564352} {"current_steps": 1410, "total_steps": 9134, "loss": 0.7529, "learning_rate": 4.711731312184479e-05, "epoch": 0.15435562002244177, "percentage": 15.44, "elapsed_time": "1 day, 2:02:19", "remaining_time": "5 days, 22:38:26", "throughput": 2717.36, "total_tokens": 254723840} {"current_steps": 1411, "total_steps": 9134, "loss": 0.9235, "learning_rate": 4.711330335088879e-05, "epoch": 0.15446509209337966, "percentage": 15.45, "elapsed_time": "1 day, 2:03:28", "remaining_time": "5 days, 22:37:36", "throughput": 2717.57, "total_tokens": 254932608} {"current_steps": 1412, "total_steps": 9134, "loss": 0.6455, "learning_rate": 4.710929096397127e-05, "epoch": 0.15457456416431758, "percentage": 15.46, "elapsed_time": "1 day, 2:04:33", "remaining_time": "5 days, 22:36:19", "throughput": 2717.56, "total_tokens": 255107552} {"current_steps": 1413, "total_steps": 9134, "loss": 0.5425, "learning_rate": 4.710527596156691e-05, "epoch": 0.15468403623525548, "percentage": 15.47, "elapsed_time": "1 day, 2:05:39", "remaining_time": "5 days, 22:35:12", "throughput": 2717.61, "total_tokens": 255292352} {"current_steps": 1414, "total_steps": 9134, "loss": 0.8238, "learning_rate": 4.710125834415065e-05, "epoch": 0.15479350830619337, "percentage": 15.48, "elapsed_time": "1 day, 2:06:46", "remaining_time": "5 days, 22:34:08", "throughput": 2717.59, "total_tokens": 255472224} {"current_steps": 1415, "total_steps": 9134, "loss": 0.7698, "learning_rate": 4.709723811219779e-05, "epoch": 0.1549029803771313, "percentage": 15.49, "elapsed_time": "1 day, 2:07:53", "remaining_time": "5 days, 22:33:00", "throughput": 2717.32, "total_tokens": 255626336} {"current_steps": 1416, "total_steps": 9134, "loss": 0.8038, "learning_rate": 4.70932152661839e-05, "epoch": 0.1550124524480692, "percentage": 15.5, "elapsed_time": "1 day, 2:09:01", "remaining_time": "5 days, 22:32:03", "throughput": 2717.36, "total_tokens": 255816288} {"current_steps": 1417, "total_steps": 9134, "loss": 0.7319, "learning_rate": 4.7089189806584874e-05, "epoch": 0.15512192451900708, "percentage": 15.51, "elapsed_time": "1 day, 2:10:05", "remaining_time": "5 days, 22:30:42", "throughput": 2717.07, "total_tokens": 255962112} {"current_steps": 1418, "total_steps": 9134, "loss": 0.922, "learning_rate": 4.708516173387692e-05, "epoch": 0.155231396589945, "percentage": 15.52, "elapsed_time": "1 day, 2:11:14", "remaining_time": "5 days, 22:29:52", "throughput": 2717.34, "total_tokens": 256176256} {"current_steps": 1419, "total_steps": 9134, "loss": 0.5817, "learning_rate": 4.7081131048536564e-05, "epoch": 0.1553408686608829, "percentage": 15.54, "elapsed_time": "1 day, 2:12:22", "remaining_time": "5 days, 22:28:50", "throughput": 2717.39, "total_tokens": 256363968} {"current_steps": 1420, "total_steps": 9134, "loss": 0.7691, "learning_rate": 4.70770977510406e-05, "epoch": 0.1554503407318208, "percentage": 15.55, "elapsed_time": "1 day, 2:13:27", "remaining_time": "5 days, 22:27:37", "throughput": 2717.08, "total_tokens": 256512480} {"current_steps": 1421, "total_steps": 9134, "loss": 0.6224, "learning_rate": 4.70730618418662e-05, "epoch": 0.15555981280275868, "percentage": 15.56, "elapsed_time": "1 day, 2:14:29", "remaining_time": "5 days, 22:26:06", "throughput": 2716.92, "total_tokens": 256665696} {"current_steps": 1422, "total_steps": 9134, "loss": 0.5609, "learning_rate": 4.7069023321490754e-05, "epoch": 0.1556692848736966, "percentage": 15.57, "elapsed_time": "1 day, 2:15:34", "remaining_time": "5 days, 22:24:53", "throughput": 2716.86, "total_tokens": 256837504} {"current_steps": 1423, "total_steps": 9134, "loss": 0.7151, "learning_rate": 4.706498219039206e-05, "epoch": 0.1557787569446345, "percentage": 15.58, "elapsed_time": "1 day, 2:16:43", "remaining_time": "5 days, 22:23:59", "throughput": 2716.68, "total_tokens": 257006848} {"current_steps": 1424, "total_steps": 9134, "loss": 0.6813, "learning_rate": 4.706093844904814e-05, "epoch": 0.1558882290155724, "percentage": 15.59, "elapsed_time": "1 day, 2:17:49", "remaining_time": "5 days, 22:22:48", "throughput": 2716.58, "total_tokens": 257175520} {"current_steps": 1425, "total_steps": 9134, "loss": 0.6728, "learning_rate": 4.7056892097937376e-05, "epoch": 0.15599770108651032, "percentage": 15.6, "elapsed_time": "1 day, 2:18:58", "remaining_time": "5 days, 22:21:58", "throughput": 2716.75, "total_tokens": 257380256} {"current_steps": 1426, "total_steps": 9134, "loss": 0.6883, "learning_rate": 4.705284313753845e-05, "epoch": 0.1561071731574482, "percentage": 15.61, "elapsed_time": "1 day, 2:20:07", "remaining_time": "5 days, 22:21:03", "throughput": 2717.01, "total_tokens": 257591712} {"current_steps": 1427, "total_steps": 9134, "loss": 0.7034, "learning_rate": 4.7048791568330333e-05, "epoch": 0.1562166452283861, "percentage": 15.62, "elapsed_time": "1 day, 2:21:16", "remaining_time": "5 days, 22:20:11", "throughput": 2717.08, "total_tokens": 257786144} {"current_steps": 1428, "total_steps": 9134, "loss": 0.7254, "learning_rate": 4.7044737390792326e-05, "epoch": 0.156326117299324, "percentage": 15.63, "elapsed_time": "1 day, 2:22:23", "remaining_time": "5 days, 22:19:08", "throughput": 2717.16, "total_tokens": 257976544} {"current_steps": 1429, "total_steps": 9134, "loss": 0.8161, "learning_rate": 4.704068060540402e-05, "epoch": 0.15643558937026192, "percentage": 15.64, "elapsed_time": "1 day, 2:23:32", "remaining_time": "5 days, 22:18:15", "throughput": 2717.1, "total_tokens": 258157984} {"current_steps": 1430, "total_steps": 9134, "loss": 0.905, "learning_rate": 4.703662121264535e-05, "epoch": 0.1565450614411998, "percentage": 15.66, "elapsed_time": "1 day, 2:24:41", "remaining_time": "5 days, 22:17:23", "throughput": 2717.3, "total_tokens": 258364736} {"current_steps": 1431, "total_steps": 9134, "loss": 0.701, "learning_rate": 4.70325592129965e-05, "epoch": 0.1566545335121377, "percentage": 15.67, "elapsed_time": "1 day, 2:25:51", "remaining_time": "5 days, 22:16:35", "throughput": 2717.58, "total_tokens": 258581344} {"current_steps": 1432, "total_steps": 9134, "loss": 0.9636, "learning_rate": 4.7028494606938025e-05, "epoch": 0.15676400558307563, "percentage": 15.68, "elapsed_time": "1 day, 2:26:57", "remaining_time": "5 days, 22:15:26", "throughput": 2717.55, "total_tokens": 258758080} {"current_steps": 1433, "total_steps": 9134, "loss": 0.7459, "learning_rate": 4.7024427394950745e-05, "epoch": 0.15687347765401352, "percentage": 15.69, "elapsed_time": "1 day, 2:28:04", "remaining_time": "5 days, 22:14:24", "throughput": 2717.47, "total_tokens": 258933696} {"current_steps": 1434, "total_steps": 9134, "loss": 0.7365, "learning_rate": 4.702035757751581e-05, "epoch": 0.15698294972495141, "percentage": 15.7, "elapsed_time": "1 day, 2:29:11", "remaining_time": "5 days, 22:13:18", "throughput": 2717.42, "total_tokens": 259109984} {"current_steps": 1435, "total_steps": 9134, "loss": 0.7074, "learning_rate": 4.701628515511467e-05, "epoch": 0.15709242179588934, "percentage": 15.71, "elapsed_time": "1 day, 2:30:20", "remaining_time": "5 days, 22:12:28", "throughput": 2717.66, "total_tokens": 259321216} {"current_steps": 1436, "total_steps": 9134, "loss": 0.6889, "learning_rate": 4.701221012822908e-05, "epoch": 0.15720189386682723, "percentage": 15.72, "elapsed_time": "1 day, 2:31:28", "remaining_time": "5 days, 22:11:27", "throughput": 2717.65, "total_tokens": 259504672} {"current_steps": 1437, "total_steps": 9134, "loss": 0.9133, "learning_rate": 4.7008132497341116e-05, "epoch": 0.15731136593776512, "percentage": 15.73, "elapsed_time": "1 day, 2:32:35", "remaining_time": "5 days, 22:10:25", "throughput": 2717.56, "total_tokens": 259678496} {"current_steps": 1438, "total_steps": 9134, "loss": 0.7161, "learning_rate": 4.700405226293314e-05, "epoch": 0.15742083800870302, "percentage": 15.74, "elapsed_time": "1 day, 2:33:40", "remaining_time": "5 days, 22:09:10", "throughput": 2717.46, "total_tokens": 259845376} {"current_steps": 1439, "total_steps": 9134, "loss": 0.6339, "learning_rate": 4.6999969425487864e-05, "epoch": 0.15753031007964094, "percentage": 15.75, "elapsed_time": "1 day, 2:34:43", "remaining_time": "5 days, 22:07:46", "throughput": 2717.28, "total_tokens": 259999936} {"current_steps": 1440, "total_steps": 9134, "loss": 0.6262, "learning_rate": 4.699588398548825e-05, "epoch": 0.15763978215057883, "percentage": 15.77, "elapsed_time": "1 day, 2:35:50", "remaining_time": "5 days, 22:06:39", "throughput": 2717.34, "total_tokens": 260186304} {"current_steps": 1441, "total_steps": 9134, "loss": 0.7425, "learning_rate": 4.699179594341761e-05, "epoch": 0.15774925422151673, "percentage": 15.78, "elapsed_time": "1 day, 2:36:59", "remaining_time": "5 days, 22:05:49", "throughput": 2717.51, "total_tokens": 260391488} {"current_steps": 1442, "total_steps": 9134, "loss": 0.6812, "learning_rate": 4.698770529975956e-05, "epoch": 0.15785872629245465, "percentage": 15.79, "elapsed_time": "1 day, 2:38:03", "remaining_time": "5 days, 22:04:27", "throughput": 2717.52, "total_tokens": 260565536} {"current_steps": 1443, "total_steps": 9134, "loss": 0.7717, "learning_rate": 4.698361205499799e-05, "epoch": 0.15796819836339254, "percentage": 15.8, "elapsed_time": "1 day, 2:39:09", "remaining_time": "5 days, 22:03:17", "throughput": 2717.48, "total_tokens": 260740928} {"current_steps": 1444, "total_steps": 9134, "loss": 0.7051, "learning_rate": 4.6979516209617144e-05, "epoch": 0.15807767043433044, "percentage": 15.81, "elapsed_time": "1 day, 2:40:16", "remaining_time": "5 days, 22:02:15", "throughput": 2717.55, "total_tokens": 260930208} {"current_steps": 1445, "total_steps": 9134, "loss": 0.5688, "learning_rate": 4.697541776410156e-05, "epoch": 0.15818714250526833, "percentage": 15.82, "elapsed_time": "1 day, 2:41:25", "remaining_time": "5 days, 22:01:23", "throughput": 2717.53, "total_tokens": 261116800} {"current_steps": 1446, "total_steps": 9134, "loss": 0.5024, "learning_rate": 4.697131671893605e-05, "epoch": 0.15829661457620625, "percentage": 15.83, "elapsed_time": "1 day, 2:42:27", "remaining_time": "5 days, 21:59:52", "throughput": 2717.39, "total_tokens": 261270464} {"current_steps": 1447, "total_steps": 9134, "loss": 0.7838, "learning_rate": 4.696721307460579e-05, "epoch": 0.15840608664714415, "percentage": 15.84, "elapsed_time": "1 day, 2:43:33", "remaining_time": "5 days, 21:58:43", "throughput": 2717.43, "total_tokens": 261453920} {"current_steps": 1448, "total_steps": 9134, "loss": 0.8274, "learning_rate": 4.6963106831596206e-05, "epoch": 0.15851555871808204, "percentage": 15.85, "elapsed_time": "1 day, 2:44:36", "remaining_time": "5 days, 21:57:16", "throughput": 2717.22, "total_tokens": 261604000} {"current_steps": 1449, "total_steps": 9134, "loss": 0.6234, "learning_rate": 4.695899799039307e-05, "epoch": 0.15862503078901996, "percentage": 15.86, "elapsed_time": "1 day, 2:45:43", "remaining_time": "5 days, 21:56:15", "throughput": 2717.2, "total_tokens": 261785888} {"current_steps": 1450, "total_steps": 9134, "loss": 0.8017, "learning_rate": 4.695488655148245e-05, "epoch": 0.15873450285995785, "percentage": 15.87, "elapsed_time": "1 day, 2:46:47", "remaining_time": "5 days, 21:54:51", "throughput": 2717.2, "total_tokens": 261957920} {"current_steps": 1451, "total_steps": 9134, "loss": 0.7015, "learning_rate": 4.695077251535073e-05, "epoch": 0.15884397493089575, "percentage": 15.89, "elapsed_time": "1 day, 2:47:54", "remaining_time": "5 days, 21:53:50", "throughput": 2717.31, "total_tokens": 262151232} {"current_steps": 1452, "total_steps": 9134, "loss": 0.7989, "learning_rate": 4.6946655882484575e-05, "epoch": 0.15895344700183367, "percentage": 15.9, "elapsed_time": "1 day, 2:48:59", "remaining_time": "5 days, 21:52:34", "throughput": 2717.32, "total_tokens": 262328640} {"current_steps": 1453, "total_steps": 9134, "loss": 0.8251, "learning_rate": 4.694253665337099e-05, "epoch": 0.15906291907277156, "percentage": 15.91, "elapsed_time": "1 day, 2:50:08", "remaining_time": "5 days, 21:51:42", "throughput": 2717.54, "total_tokens": 262537184} {"current_steps": 1454, "total_steps": 9134, "loss": 0.8237, "learning_rate": 4.693841482849726e-05, "epoch": 0.15917239114370946, "percentage": 15.92, "elapsed_time": "1 day, 2:51:14", "remaining_time": "5 days, 21:50:31", "throughput": 2717.4, "total_tokens": 262702720} {"current_steps": 1455, "total_steps": 9134, "loss": 0.8038, "learning_rate": 4.6934290408351e-05, "epoch": 0.15928186321464735, "percentage": 15.93, "elapsed_time": "1 day, 2:52:21", "remaining_time": "5 days, 21:49:29", "throughput": 2717.48, "total_tokens": 262893344} {"current_steps": 1456, "total_steps": 9134, "loss": 0.5497, "learning_rate": 4.693016339342011e-05, "epoch": 0.15939133528558527, "percentage": 15.94, "elapsed_time": "1 day, 2:53:27", "remaining_time": "5 days, 21:48:18", "throughput": 2717.34, "total_tokens": 263058208} {"current_steps": 1457, "total_steps": 9134, "loss": 0.5789, "learning_rate": 4.692603378419282e-05, "epoch": 0.15950080735652317, "percentage": 15.95, "elapsed_time": "1 day, 2:54:35", "remaining_time": "5 days, 21:47:19", "throughput": 2717.1, "total_tokens": 263219712} {"current_steps": 1458, "total_steps": 9134, "loss": 0.7238, "learning_rate": 4.692190158115765e-05, "epoch": 0.15961027942746106, "percentage": 15.96, "elapsed_time": "1 day, 2:55:36", "remaining_time": "5 days, 21:45:48", "throughput": 2716.95, "total_tokens": 263372256} {"current_steps": 1459, "total_steps": 9134, "loss": 0.7467, "learning_rate": 4.691776678480343e-05, "epoch": 0.15971975149839898, "percentage": 15.97, "elapsed_time": "1 day, 2:56:46", "remaining_time": "5 days, 21:44:56", "throughput": 2717.05, "total_tokens": 263571168} {"current_steps": 1460, "total_steps": 9134, "loss": 0.7387, "learning_rate": 4.69136293956193e-05, "epoch": 0.15982922356933688, "percentage": 15.98, "elapsed_time": "1 day, 2:57:52", "remaining_time": "5 days, 21:43:48", "throughput": 2716.94, "total_tokens": 263740288} {"current_steps": 1461, "total_steps": 9134, "loss": 0.8547, "learning_rate": 4.6909489414094694e-05, "epoch": 0.15993869564027477, "percentage": 16.0, "elapsed_time": "1 day, 2:58:59", "remaining_time": "5 days, 21:42:45", "throughput": 2716.96, "total_tokens": 263924640} {"current_steps": 1462, "total_steps": 9134, "loss": 0.6846, "learning_rate": 4.6905346840719386e-05, "epoch": 0.16004816771121266, "percentage": 16.01, "elapsed_time": "1 day, 3:00:06", "remaining_time": "5 days, 21:41:42", "throughput": 2716.98, "total_tokens": 264108544} {"current_steps": 1463, "total_steps": 9134, "loss": 0.6742, "learning_rate": 4.690120167598341e-05, "epoch": 0.16015763978215058, "percentage": 16.02, "elapsed_time": "1 day, 3:01:13", "remaining_time": "5 days, 21:40:37", "throughput": 2717.08, "total_tokens": 264300064} {"current_steps": 1464, "total_steps": 9134, "loss": 0.7547, "learning_rate": 4.689705392037716e-05, "epoch": 0.16026711185308848, "percentage": 16.03, "elapsed_time": "1 day, 3:02:19", "remaining_time": "5 days, 21:39:29", "throughput": 2716.97, "total_tokens": 264469408} {"current_steps": 1465, "total_steps": 9134, "loss": 0.5629, "learning_rate": 4.689290357439128e-05, "epoch": 0.16037658392402637, "percentage": 16.04, "elapsed_time": "1 day, 3:03:27", "remaining_time": "5 days, 21:38:29", "throughput": 2717.02, "total_tokens": 264658240} {"current_steps": 1466, "total_steps": 9134, "loss": 0.7411, "learning_rate": 4.688875063851676e-05, "epoch": 0.1604860559949643, "percentage": 16.05, "elapsed_time": "1 day, 3:04:27", "remaining_time": "5 days, 21:36:50", "throughput": 2716.79, "total_tokens": 264799584} {"current_steps": 1467, "total_steps": 9134, "loss": 0.7588, "learning_rate": 4.688459511324489e-05, "epoch": 0.1605955280659022, "percentage": 16.06, "elapsed_time": "1 day, 3:05:28", "remaining_time": "5 days, 21:35:16", "throughput": 2716.57, "total_tokens": 264943616} {"current_steps": 1468, "total_steps": 9134, "loss": 0.6871, "learning_rate": 4.688043699906725e-05, "epoch": 0.16070500013684008, "percentage": 16.07, "elapsed_time": "1 day, 3:06:38", "remaining_time": "5 days, 21:34:25", "throughput": 2716.78, "total_tokens": 265153280} {"current_steps": 1469, "total_steps": 9134, "loss": 0.7719, "learning_rate": 4.687627629647573e-05, "epoch": 0.160814472207778, "percentage": 16.08, "elapsed_time": "1 day, 3:07:41", "remaining_time": "5 days, 21:33:02", "throughput": 2716.65, "total_tokens": 265312320} {"current_steps": 1470, "total_steps": 9134, "loss": 0.9027, "learning_rate": 4.687211300596256e-05, "epoch": 0.1609239442787159, "percentage": 16.09, "elapsed_time": "1 day, 3:08:47", "remaining_time": "5 days, 21:31:54", "throughput": 2716.6, "total_tokens": 265487712} {"current_steps": 1471, "total_steps": 9134, "loss": 0.865, "learning_rate": 4.686794712802023e-05, "epoch": 0.1610334163496538, "percentage": 16.1, "elapsed_time": "1 day, 3:09:53", "remaining_time": "5 days, 21:30:45", "throughput": 2716.29, "total_tokens": 265636672} {"current_steps": 1472, "total_steps": 9134, "loss": 0.6975, "learning_rate": 4.6863778663141556e-05, "epoch": 0.16114288842059168, "percentage": 16.12, "elapsed_time": "1 day, 3:10:56", "remaining_time": "5 days, 21:29:18", "throughput": 2716.16, "total_tokens": 265793696} {"current_steps": 1473, "total_steps": 9134, "loss": 0.6301, "learning_rate": 4.6859607611819664e-05, "epoch": 0.1612523604915296, "percentage": 16.13, "elapsed_time": "1 day, 3:11:58", "remaining_time": "5 days, 21:27:51", "throughput": 2716.09, "total_tokens": 265956320} {"current_steps": 1474, "total_steps": 9134, "loss": 0.6863, "learning_rate": 4.685543397454799e-05, "epoch": 0.1613618325624675, "percentage": 16.14, "elapsed_time": "1 day, 3:13:00", "remaining_time": "5 days, 21:26:21", "throughput": 2715.93, "total_tokens": 266108864} {"current_steps": 1475, "total_steps": 9134, "loss": 0.79, "learning_rate": 4.685125775182024e-05, "epoch": 0.1614713046334054, "percentage": 16.15, "elapsed_time": "1 day, 3:14:03", "remaining_time": "5 days, 21:24:57", "throughput": 2715.91, "total_tokens": 266278880} {"current_steps": 1476, "total_steps": 9134, "loss": 0.7672, "learning_rate": 4.684707894413048e-05, "epoch": 0.16158077670434332, "percentage": 16.16, "elapsed_time": "1 day, 3:15:11", "remaining_time": "5 days, 21:23:58", "throughput": 2716.08, "total_tokens": 266479808} {"current_steps": 1477, "total_steps": 9134, "loss": 0.6446, "learning_rate": 4.684289755197305e-05, "epoch": 0.1616902487752812, "percentage": 16.17, "elapsed_time": "1 day, 3:16:18", "remaining_time": "5 days, 21:22:50", "throughput": 2716.01, "total_tokens": 266652960} {"current_steps": 1478, "total_steps": 9134, "loss": 0.6489, "learning_rate": 4.683871357584259e-05, "epoch": 0.1617997208462191, "percentage": 16.18, "elapsed_time": "1 day, 3:17:23", "remaining_time": "5 days, 21:21:38", "throughput": 2715.76, "total_tokens": 266805728} {"current_steps": 1479, "total_steps": 9134, "loss": 0.644, "learning_rate": 4.6834527016234065e-05, "epoch": 0.161909192917157, "percentage": 16.19, "elapsed_time": "1 day, 3:18:28", "remaining_time": "5 days, 21:20:22", "throughput": 2715.82, "total_tokens": 266987168} {"current_steps": 1480, "total_steps": 9134, "loss": 0.6839, "learning_rate": 4.6830337873642724e-05, "epoch": 0.16201866498809492, "percentage": 16.2, "elapsed_time": "1 day, 3:19:37", "remaining_time": "5 days, 21:19:29", "throughput": 2715.67, "total_tokens": 267159872} {"current_steps": 1481, "total_steps": 9134, "loss": 0.7335, "learning_rate": 4.682614614856416e-05, "epoch": 0.1621281370590328, "percentage": 16.21, "elapsed_time": "1 day, 3:20:43", "remaining_time": "5 days, 21:18:23", "throughput": 2715.45, "total_tokens": 267318912} {"current_steps": 1482, "total_steps": 9134, "loss": 0.7909, "learning_rate": 4.6821951841494225e-05, "epoch": 0.1622376091299707, "percentage": 16.23, "elapsed_time": "1 day, 3:21:52", "remaining_time": "5 days, 21:17:29", "throughput": 2715.53, "total_tokens": 267514464} {"current_steps": 1483, "total_steps": 9134, "loss": 0.6752, "learning_rate": 4.6817754952929106e-05, "epoch": 0.16234708120090863, "percentage": 16.24, "elapsed_time": "1 day, 3:23:00", "remaining_time": "5 days, 21:16:32", "throughput": 2715.54, "total_tokens": 267699936} {"current_steps": 1484, "total_steps": 9134, "loss": 0.8886, "learning_rate": 4.681355548336528e-05, "epoch": 0.16245655327184652, "percentage": 16.25, "elapsed_time": "1 day, 3:24:08", "remaining_time": "5 days, 21:15:29", "throughput": 2715.61, "total_tokens": 267889216} {"current_steps": 1485, "total_steps": 9134, "loss": 0.6516, "learning_rate": 4.680935343329954e-05, "epoch": 0.16256602534278441, "percentage": 16.26, "elapsed_time": "1 day, 3:25:16", "remaining_time": "5 days, 21:14:33", "throughput": 2715.74, "total_tokens": 268088576} {"current_steps": 1486, "total_steps": 9134, "loss": 0.7621, "learning_rate": 4.680514880322898e-05, "epoch": 0.16267549741372234, "percentage": 16.27, "elapsed_time": "1 day, 3:26:24", "remaining_time": "5 days, 21:13:32", "throughput": 2715.81, "total_tokens": 268278752} {"current_steps": 1487, "total_steps": 9134, "loss": 0.6528, "learning_rate": 4.680094159365101e-05, "epoch": 0.16278496948466023, "percentage": 16.28, "elapsed_time": "1 day, 3:27:32", "remaining_time": "5 days, 21:12:36", "throughput": 2715.86, "total_tokens": 268470048} {"current_steps": 1488, "total_steps": 9134, "loss": 0.7321, "learning_rate": 4.679673180506332e-05, "epoch": 0.16289444155559812, "percentage": 16.29, "elapsed_time": "1 day, 3:28:39", "remaining_time": "5 days, 21:11:33", "throughput": 2715.77, "total_tokens": 268643872} {"current_steps": 1489, "total_steps": 9134, "loss": 0.8103, "learning_rate": 4.679251943796393e-05, "epoch": 0.16300391362653602, "percentage": 16.3, "elapsed_time": "1 day, 3:29:45", "remaining_time": "5 days, 21:10:25", "throughput": 2715.73, "total_tokens": 268818816} {"current_steps": 1490, "total_steps": 9134, "loss": 0.6323, "learning_rate": 4.678830449285114e-05, "epoch": 0.16311338569747394, "percentage": 16.31, "elapsed_time": "1 day, 3:30:54", "remaining_time": "5 days, 21:09:29", "throughput": 2715.61, "total_tokens": 268993536} {"current_steps": 1491, "total_steps": 9134, "loss": 0.6342, "learning_rate": 4.6784086970223596e-05, "epoch": 0.16322285776841183, "percentage": 16.32, "elapsed_time": "1 day, 3:31:59", "remaining_time": "5 days, 21:08:16", "throughput": 2715.65, "total_tokens": 269173856} {"current_steps": 1492, "total_steps": 9134, "loss": 0.921, "learning_rate": 4.677986687058019e-05, "epoch": 0.16333232983934973, "percentage": 16.33, "elapsed_time": "1 day, 3:33:06", "remaining_time": "5 days, 21:07:10", "throughput": 2715.7, "total_tokens": 269360672} {"current_steps": 1493, "total_steps": 9134, "loss": 0.6604, "learning_rate": 4.6775644194420184e-05, "epoch": 0.16344180191028765, "percentage": 16.35, "elapsed_time": "1 day, 3:34:13", "remaining_time": "5 days, 21:06:06", "throughput": 2715.81, "total_tokens": 269553312} {"current_steps": 1494, "total_steps": 9134, "loss": 0.6726, "learning_rate": 4.6771418942243096e-05, "epoch": 0.16355127398122554, "percentage": 16.36, "elapsed_time": "1 day, 3:35:22", "remaining_time": "5 days, 21:05:15", "throughput": 2716.0, "total_tokens": 269760288} {"current_steps": 1495, "total_steps": 9134, "loss": 0.9044, "learning_rate": 4.6767191114548755e-05, "epoch": 0.16366074605216344, "percentage": 16.37, "elapsed_time": "1 day, 3:36:31", "remaining_time": "5 days, 21:04:22", "throughput": 2716.05, "total_tokens": 269953152} {"current_steps": 1496, "total_steps": 9134, "loss": 0.5553, "learning_rate": 4.676296071183733e-05, "epoch": 0.16377021812310136, "percentage": 16.38, "elapsed_time": "1 day, 3:37:39", "remaining_time": "5 days, 21:03:20", "throughput": 2716.02, "total_tokens": 270132576} {"current_steps": 1497, "total_steps": 9134, "loss": 0.5936, "learning_rate": 4.6758727734609256e-05, "epoch": 0.16387969019403925, "percentage": 16.39, "elapsed_time": "1 day, 3:38:45", "remaining_time": "5 days, 21:02:11", "throughput": 2715.98, "total_tokens": 270307968} {"current_steps": 1498, "total_steps": 9134, "loss": 0.5061, "learning_rate": 4.675449218336528e-05, "epoch": 0.16398916226497715, "percentage": 16.4, "elapsed_time": "1 day, 3:39:51", "remaining_time": "5 days, 21:01:05", "throughput": 2716.13, "total_tokens": 270504192} {"current_steps": 1499, "total_steps": 9134, "loss": 0.507, "learning_rate": 4.6750254058606467e-05, "epoch": 0.16409863433591504, "percentage": 16.41, "elapsed_time": "1 day, 3:40:54", "remaining_time": "5 days, 20:59:41", "throughput": 2716.14, "total_tokens": 270676224} {"current_steps": 1500, "total_steps": 9134, "loss": 0.7169, "learning_rate": 4.6746013360834184e-05, "epoch": 0.16420810640685296, "percentage": 16.42, "elapsed_time": "1 day, 3:42:00", "remaining_time": "5 days, 20:58:28", "throughput": 2715.83, "total_tokens": 270822720} {"current_steps": 1501, "total_steps": 9134, "loss": 0.7463, "learning_rate": 4.6741770090550084e-05, "epoch": 0.16431757847779085, "percentage": 16.43, "elapsed_time": "1 day, 3:43:08", "remaining_time": "5 days, 20:57:33", "throughput": 2715.75, "total_tokens": 271001248} {"current_steps": 1502, "total_steps": 9134, "loss": 0.7822, "learning_rate": 4.673752424825615e-05, "epoch": 0.16442705054872875, "percentage": 16.44, "elapsed_time": "1 day, 3:44:12", "remaining_time": "5 days, 20:56:11", "throughput": 2715.86, "total_tokens": 271184032} {"current_steps": 1503, "total_steps": 9134, "loss": 0.8156, "learning_rate": 4.673327583445465e-05, "epoch": 0.16453652261966667, "percentage": 16.46, "elapsed_time": "1 day, 3:45:20", "remaining_time": "5 days, 20:55:11", "throughput": 2715.93, "total_tokens": 271376000} {"current_steps": 1504, "total_steps": 9134, "loss": 0.6269, "learning_rate": 4.672902484964817e-05, "epoch": 0.16464599469060456, "percentage": 16.47, "elapsed_time": "1 day, 3:46:28", "remaining_time": "5 days, 20:54:15", "throughput": 2715.93, "total_tokens": 271561696} {"current_steps": 1505, "total_steps": 9134, "loss": 0.8395, "learning_rate": 4.672477129433959e-05, "epoch": 0.16475546676154246, "percentage": 16.48, "elapsed_time": "1 day, 3:47:34", "remaining_time": "5 days, 20:53:06", "throughput": 2715.98, "total_tokens": 271745600} {"current_steps": 1506, "total_steps": 9134, "loss": 0.7432, "learning_rate": 4.672051516903209e-05, "epoch": 0.16486493883248035, "percentage": 16.49, "elapsed_time": "1 day, 3:48:40", "remaining_time": "5 days, 20:51:58", "throughput": 2715.85, "total_tokens": 271912704} {"current_steps": 1507, "total_steps": 9134, "loss": 0.7383, "learning_rate": 4.671625647422917e-05, "epoch": 0.16497441090341827, "percentage": 16.5, "elapsed_time": "1 day, 3:49:48", "remaining_time": "5 days, 20:51:00", "throughput": 2715.88, "total_tokens": 272101088} {"current_steps": 1508, "total_steps": 9134, "loss": 0.7614, "learning_rate": 4.6711995210434625e-05, "epoch": 0.16508388297435617, "percentage": 16.51, "elapsed_time": "1 day, 3:50:57", "remaining_time": "5 days, 20:50:06", "throughput": 2715.98, "total_tokens": 272298432} {"current_steps": 1509, "total_steps": 9134, "loss": 0.9494, "learning_rate": 4.670773137815255e-05, "epoch": 0.16519335504529406, "percentage": 16.52, "elapsed_time": "1 day, 3:52:03", "remaining_time": "5 days, 20:48:57", "throughput": 2716.05, "total_tokens": 272484352} {"current_steps": 1510, "total_steps": 9134, "loss": 0.7336, "learning_rate": 4.670346497788736e-05, "epoch": 0.16530282711623198, "percentage": 16.53, "elapsed_time": "1 day, 3:53:10", "remaining_time": "5 days, 20:47:54", "throughput": 2715.97, "total_tokens": 272658400} {"current_steps": 1511, "total_steps": 9134, "loss": 0.8216, "learning_rate": 4.669919601014374e-05, "epoch": 0.16541229918716988, "percentage": 16.54, "elapsed_time": "1 day, 3:54:18", "remaining_time": "5 days, 20:46:52", "throughput": 2716.05, "total_tokens": 272849920} {"current_steps": 1512, "total_steps": 9134, "loss": 0.6921, "learning_rate": 4.669492447542673e-05, "epoch": 0.16552177125810777, "percentage": 16.55, "elapsed_time": "1 day, 3:55:25", "remaining_time": "5 days, 20:45:48", "throughput": 2716.06, "total_tokens": 273032704} {"current_steps": 1513, "total_steps": 9134, "loss": 0.5839, "learning_rate": 4.669065037424161e-05, "epoch": 0.1656312433290457, "percentage": 16.56, "elapsed_time": "1 day, 3:56:34", "remaining_time": "5 days, 20:44:56", "throughput": 2716.27, "total_tokens": 273241920} {"current_steps": 1514, "total_steps": 9134, "loss": 0.7662, "learning_rate": 4.668637370709403e-05, "epoch": 0.16574071539998358, "percentage": 16.58, "elapsed_time": "1 day, 3:57:40", "remaining_time": "5 days, 20:43:47", "throughput": 2716.38, "total_tokens": 273432320} {"current_steps": 1515, "total_steps": 9134, "loss": 0.6626, "learning_rate": 4.668209447448989e-05, "epoch": 0.16585018747092148, "percentage": 16.59, "elapsed_time": "1 day, 3:58:47", "remaining_time": "5 days, 20:42:44", "throughput": 2716.4, "total_tokens": 273617344} {"current_steps": 1516, "total_steps": 9134, "loss": 0.8782, "learning_rate": 4.667781267693543e-05, "epoch": 0.16595965954185937, "percentage": 16.6, "elapsed_time": "1 day, 3:59:52", "remaining_time": "5 days, 20:41:29", "throughput": 2716.33, "total_tokens": 273786464} {"current_steps": 1517, "total_steps": 9134, "loss": 0.6219, "learning_rate": 4.6673528314937166e-05, "epoch": 0.1660691316127973, "percentage": 16.61, "elapsed_time": "1 day, 4:00:58", "remaining_time": "5 days, 20:40:21", "throughput": 2716.35, "total_tokens": 273967456} {"current_steps": 1518, "total_steps": 9134, "loss": 0.7154, "learning_rate": 4.666924138900194e-05, "epoch": 0.1661786036837352, "percentage": 16.62, "elapsed_time": "1 day, 4:02:01", "remaining_time": "5 days, 20:38:58", "throughput": 2716.16, "total_tokens": 274119776} {"current_steps": 1519, "total_steps": 9134, "loss": 0.7352, "learning_rate": 4.666495189963688e-05, "epoch": 0.16628807575467308, "percentage": 16.63, "elapsed_time": "1 day, 4:03:09", "remaining_time": "5 days, 20:37:57", "throughput": 2716.08, "total_tokens": 274295840} {"current_steps": 1520, "total_steps": 9134, "loss": 0.7133, "learning_rate": 4.666065984734942e-05, "epoch": 0.166397547825611, "percentage": 16.64, "elapsed_time": "1 day, 4:04:16", "remaining_time": "5 days, 20:36:52", "throughput": 2716.23, "total_tokens": 274492288} {"current_steps": 1521, "total_steps": 9134, "loss": 0.6485, "learning_rate": 4.6656365232647316e-05, "epoch": 0.1665070198965489, "percentage": 16.65, "elapsed_time": "1 day, 4:05:25", "remaining_time": "5 days, 20:35:59", "throughput": 2716.14, "total_tokens": 274670592} {"current_steps": 1522, "total_steps": 9134, "loss": 0.6739, "learning_rate": 4.66520680560386e-05, "epoch": 0.1666164919674868, "percentage": 16.66, "elapsed_time": "1 day, 4:06:34", "remaining_time": "5 days, 20:35:04", "throughput": 2716.23, "total_tokens": 274866592} {"current_steps": 1523, "total_steps": 9134, "loss": 0.6798, "learning_rate": 4.664776831803163e-05, "epoch": 0.16672596403842468, "percentage": 16.67, "elapsed_time": "1 day, 4:07:40", "remaining_time": "5 days, 20:33:54", "throughput": 2716.07, "total_tokens": 275029440} {"current_steps": 1524, "total_steps": 9134, "loss": 0.6982, "learning_rate": 4.664346601913504e-05, "epoch": 0.1668354361093626, "percentage": 16.68, "elapsed_time": "1 day, 4:08:45", "remaining_time": "5 days, 20:32:40", "throughput": 2716.16, "total_tokens": 275215136} {"current_steps": 1525, "total_steps": 9134, "loss": 0.7057, "learning_rate": 4.663916115985781e-05, "epoch": 0.1669449081803005, "percentage": 16.7, "elapsed_time": "1 day, 4:09:51", "remaining_time": "5 days, 20:31:34", "throughput": 2716.19, "total_tokens": 275398816} {"current_steps": 1526, "total_steps": 9134, "loss": 0.7479, "learning_rate": 4.663485374070917e-05, "epoch": 0.1670543802512384, "percentage": 16.71, "elapsed_time": "1 day, 4:11:00", "remaining_time": "5 days, 20:30:38", "throughput": 2716.36, "total_tokens": 275601984} {"current_steps": 1527, "total_steps": 9134, "loss": 0.6276, "learning_rate": 4.66305437621987e-05, "epoch": 0.16716385232217632, "percentage": 16.72, "elapsed_time": "1 day, 4:12:06", "remaining_time": "5 days, 20:29:29", "throughput": 2716.37, "total_tokens": 275782976} {"current_steps": 1528, "total_steps": 9134, "loss": 0.8127, "learning_rate": 4.6626231224836245e-05, "epoch": 0.1672733243931142, "percentage": 16.73, "elapsed_time": "1 day, 4:13:13", "remaining_time": "5 days, 20:28:29", "throughput": 2716.46, "total_tokens": 275975616} {"current_steps": 1529, "total_steps": 9134, "loss": 0.827, "learning_rate": 4.662191612913199e-05, "epoch": 0.1673827964640521, "percentage": 16.74, "elapsed_time": "1 day, 4:14:22", "remaining_time": "5 days, 20:27:33", "throughput": 2716.49, "total_tokens": 276165344} {"current_steps": 1530, "total_steps": 9134, "loss": 0.5903, "learning_rate": 4.661759847559638e-05, "epoch": 0.16749226853499002, "percentage": 16.75, "elapsed_time": "1 day, 4:15:31", "remaining_time": "5 days, 20:26:39", "throughput": 2716.62, "total_tokens": 276365824} {"current_steps": 1531, "total_steps": 9134, "loss": 0.8826, "learning_rate": 4.66132782647402e-05, "epoch": 0.16760174060592792, "percentage": 16.76, "elapsed_time": "1 day, 4:16:40", "remaining_time": "5 days, 20:25:45", "throughput": 2716.81, "total_tokens": 276572800} {"current_steps": 1532, "total_steps": 9134, "loss": 0.6796, "learning_rate": 4.6608955497074526e-05, "epoch": 0.1677112126768658, "percentage": 16.77, "elapsed_time": "1 day, 4:17:44", "remaining_time": "5 days, 20:24:24", "throughput": 2716.62, "total_tokens": 276726688} {"current_steps": 1533, "total_steps": 9134, "loss": 0.8858, "learning_rate": 4.660463017311072e-05, "epoch": 0.1678206847478037, "percentage": 16.78, "elapsed_time": "1 day, 4:18:51", "remaining_time": "5 days, 20:23:23", "throughput": 2716.76, "total_tokens": 276923584} {"current_steps": 1534, "total_steps": 9134, "loss": 0.5721, "learning_rate": 4.660030229336046e-05, "epoch": 0.16793015681874163, "percentage": 16.79, "elapsed_time": "1 day, 4:19:57", "remaining_time": "5 days, 20:22:12", "throughput": 2716.66, "total_tokens": 277092480} {"current_steps": 1535, "total_steps": 9134, "loss": 0.6596, "learning_rate": 4.659597185833574e-05, "epoch": 0.16803962888967952, "percentage": 16.81, "elapsed_time": "1 day, 4:21:04", "remaining_time": "5 days, 20:21:10", "throughput": 2716.78, "total_tokens": 277287136} {"current_steps": 1536, "total_steps": 9134, "loss": 0.6495, "learning_rate": 4.6591638868548824e-05, "epoch": 0.16814910096061741, "percentage": 16.82, "elapsed_time": "1 day, 4:22:12", "remaining_time": "5 days, 20:20:10", "throughput": 2716.93, "total_tokens": 277486720} {"current_steps": 1537, "total_steps": 9134, "loss": 0.9191, "learning_rate": 4.6587303324512324e-05, "epoch": 0.16825857303155534, "percentage": 16.83, "elapsed_time": "1 day, 4:23:21", "remaining_time": "5 days, 20:19:17", "throughput": 2717.07, "total_tokens": 277689664} {"current_steps": 1538, "total_steps": 9134, "loss": 0.6179, "learning_rate": 4.6582965226739094e-05, "epoch": 0.16836804510249323, "percentage": 16.84, "elapsed_time": "1 day, 4:24:28", "remaining_time": "5 days, 20:18:10", "throughput": 2717.1, "total_tokens": 277872896} {"current_steps": 1539, "total_steps": 9134, "loss": 0.5461, "learning_rate": 4.6578624575742335e-05, "epoch": 0.16847751717343112, "percentage": 16.85, "elapsed_time": "1 day, 4:25:34", "remaining_time": "5 days, 20:17:03", "throughput": 2717.06, "total_tokens": 278048960} {"current_steps": 1540, "total_steps": 9134, "loss": 0.542, "learning_rate": 4.6574281372035546e-05, "epoch": 0.16858698924436902, "percentage": 16.86, "elapsed_time": "1 day, 4:26:43", "remaining_time": "5 days, 20:16:08", "throughput": 2717.18, "total_tokens": 278248320} {"current_steps": 1541, "total_steps": 9134, "loss": 0.6508, "learning_rate": 4.6569935616132516e-05, "epoch": 0.16869646131530694, "percentage": 16.87, "elapsed_time": "1 day, 4:27:49", "remaining_time": "5 days, 20:14:58", "throughput": 2716.98, "total_tokens": 278406912} {"current_steps": 1542, "total_steps": 9134, "loss": 0.9863, "learning_rate": 4.6565587308547334e-05, "epoch": 0.16880593338624483, "percentage": 16.88, "elapsed_time": "1 day, 4:28:56", "remaining_time": "5 days, 20:13:53", "throughput": 2717.09, "total_tokens": 278599776} {"current_steps": 1543, "total_steps": 9134, "loss": 0.739, "learning_rate": 4.65612364497944e-05, "epoch": 0.16891540545718273, "percentage": 16.89, "elapsed_time": "1 day, 4:30:01", "remaining_time": "5 days, 20:12:41", "throughput": 2717.07, "total_tokens": 278774944} {"current_steps": 1544, "total_steps": 9134, "loss": 0.7061, "learning_rate": 4.655688304038841e-05, "epoch": 0.16902487752812065, "percentage": 16.9, "elapsed_time": "1 day, 4:31:05", "remaining_time": "5 days, 20:11:23", "throughput": 2717.01, "total_tokens": 278942496} {"current_steps": 1545, "total_steps": 9134, "loss": 0.9761, "learning_rate": 4.6552527080844374e-05, "epoch": 0.16913434959905854, "percentage": 16.91, "elapsed_time": "1 day, 4:32:12", "remaining_time": "5 days, 20:10:20", "throughput": 2717.08, "total_tokens": 279133344} {"current_steps": 1546, "total_steps": 9134, "loss": 0.584, "learning_rate": 4.6548168571677574e-05, "epoch": 0.16924382166999644, "percentage": 16.93, "elapsed_time": "1 day, 4:33:20", "remaining_time": "5 days, 20:09:18", "throughput": 2717.22, "total_tokens": 279330464} {"current_steps": 1547, "total_steps": 9134, "loss": 0.6647, "learning_rate": 4.6543807513403636e-05, "epoch": 0.16935329374093436, "percentage": 16.94, "elapsed_time": "1 day, 4:34:27", "remaining_time": "5 days, 20:08:15", "throughput": 2717.27, "total_tokens": 279518400} {"current_steps": 1548, "total_steps": 9134, "loss": 0.6937, "learning_rate": 4.653944390653845e-05, "epoch": 0.16946276581187225, "percentage": 16.95, "elapsed_time": "1 day, 4:35:32", "remaining_time": "5 days, 20:07:04", "throughput": 2717.08, "total_tokens": 279676992} {"current_steps": 1549, "total_steps": 9134, "loss": 0.6195, "learning_rate": 4.6535077751598224e-05, "epoch": 0.16957223788281015, "percentage": 16.96, "elapsed_time": "1 day, 4:36:39", "remaining_time": "5 days, 20:05:57", "throughput": 2717.09, "total_tokens": 279858432} {"current_steps": 1550, "total_steps": 9134, "loss": 0.6947, "learning_rate": 4.653070904909947e-05, "epoch": 0.16968170995374804, "percentage": 16.97, "elapsed_time": "1 day, 4:37:45", "remaining_time": "5 days, 20:04:51", "throughput": 2717.1, "total_tokens": 280040096} {"current_steps": 1551, "total_steps": 9134, "loss": 0.6698, "learning_rate": 4.6526337799559e-05, "epoch": 0.16979118202468596, "percentage": 16.98, "elapsed_time": "1 day, 4:38:54", "remaining_time": "5 days, 20:03:54", "throughput": 2717.04, "total_tokens": 280220416} {"current_steps": 1552, "total_steps": 9134, "loss": 0.5624, "learning_rate": 4.652196400349391e-05, "epoch": 0.16990065409562385, "percentage": 16.99, "elapsed_time": "1 day, 4:39:55", "remaining_time": "5 days, 20:02:22", "throughput": 2716.87, "total_tokens": 280369376} {"current_steps": 1553, "total_steps": 9134, "loss": 0.7419, "learning_rate": 4.651758766142162e-05, "epoch": 0.17001012616656175, "percentage": 17.0, "elapsed_time": "1 day, 4:41:04", "remaining_time": "5 days, 20:01:28", "throughput": 2716.93, "total_tokens": 280562240} {"current_steps": 1554, "total_steps": 9134, "loss": 0.7965, "learning_rate": 4.6513208773859854e-05, "epoch": 0.17011959823749967, "percentage": 17.01, "elapsed_time": "1 day, 4:42:10", "remaining_time": "5 days, 20:00:19", "throughput": 2717.04, "total_tokens": 280753984} {"current_steps": 1555, "total_steps": 9134, "loss": 0.8029, "learning_rate": 4.650882734132661e-05, "epoch": 0.17022907030843756, "percentage": 17.02, "elapsed_time": "1 day, 4:43:20", "remaining_time": "5 days, 19:59:28", "throughput": 2717.25, "total_tokens": 280964320} {"current_steps": 1556, "total_steps": 9134, "loss": 0.5798, "learning_rate": 4.650444336434021e-05, "epoch": 0.17033854237937546, "percentage": 17.04, "elapsed_time": "1 day, 4:44:22", "remaining_time": "5 days, 19:58:02", "throughput": 2717.15, "total_tokens": 281123808} {"current_steps": 1557, "total_steps": 9134, "loss": 0.7068, "learning_rate": 4.650005684341928e-05, "epoch": 0.17044801445031335, "percentage": 17.05, "elapsed_time": "1 day, 4:45:28", "remaining_time": "5 days, 19:56:54", "throughput": 2717.2, "total_tokens": 281309056} {"current_steps": 1558, "total_steps": 9134, "loss": 0.711, "learning_rate": 4.6495667779082716e-05, "epoch": 0.17055748652125127, "percentage": 17.06, "elapsed_time": "1 day, 4:46:38", "remaining_time": "5 days, 19:56:00", "throughput": 2717.07, "total_tokens": 281483328} {"current_steps": 1559, "total_steps": 9134, "loss": 0.7761, "learning_rate": 4.649127617184975e-05, "epoch": 0.17066695859218917, "percentage": 17.07, "elapsed_time": "1 day, 4:47:43", "remaining_time": "5 days, 19:54:49", "throughput": 2716.98, "total_tokens": 281652000} {"current_steps": 1560, "total_steps": 9134, "loss": 0.733, "learning_rate": 4.6486882022239895e-05, "epoch": 0.17077643066312706, "percentage": 17.08, "elapsed_time": "1 day, 4:48:51", "remaining_time": "5 days, 19:53:49", "throughput": 2717.23, "total_tokens": 281862560} {"current_steps": 1561, "total_steps": 9134, "loss": 0.559, "learning_rate": 4.648248533077297e-05, "epoch": 0.17088590273406498, "percentage": 17.09, "elapsed_time": "1 day, 4:49:56", "remaining_time": "5 days, 19:52:34", "throughput": 2717.05, "total_tokens": 282020032} {"current_steps": 1562, "total_steps": 9134, "loss": 0.9127, "learning_rate": 4.6478086097969104e-05, "epoch": 0.17099537480500288, "percentage": 17.1, "elapsed_time": "1 day, 4:51:03", "remaining_time": "5 days, 19:51:32", "throughput": 2717.08, "total_tokens": 282205280} {"current_steps": 1563, "total_steps": 9134, "loss": 0.7845, "learning_rate": 4.647368432434871e-05, "epoch": 0.17110484687594077, "percentage": 17.11, "elapsed_time": "1 day, 4:52:11", "remaining_time": "5 days, 19:50:31", "throughput": 2717.25, "total_tokens": 282407328} {"current_steps": 1564, "total_steps": 9134, "loss": 0.6889, "learning_rate": 4.646928001043251e-05, "epoch": 0.1712143189468787, "percentage": 17.12, "elapsed_time": "1 day, 4:53:12", "remaining_time": "5 days, 19:48:57", "throughput": 2717.04, "total_tokens": 282550464} {"current_steps": 1565, "total_steps": 9134, "loss": 0.7499, "learning_rate": 4.646487315674153e-05, "epoch": 0.17132379101781658, "percentage": 17.13, "elapsed_time": "1 day, 4:54:19", "remaining_time": "5 days, 19:47:53", "throughput": 2716.99, "total_tokens": 282727648} {"current_steps": 1566, "total_steps": 9134, "loss": 0.7225, "learning_rate": 4.646046376379708e-05, "epoch": 0.17143326308875448, "percentage": 17.14, "elapsed_time": "1 day, 4:55:25", "remaining_time": "5 days, 19:46:47", "throughput": 2717.12, "total_tokens": 282921856} {"current_steps": 1567, "total_steps": 9134, "loss": 0.8488, "learning_rate": 4.64560518321208e-05, "epoch": 0.17154273515969237, "percentage": 17.16, "elapsed_time": "1 day, 4:56:34", "remaining_time": "5 days, 19:45:54", "throughput": 2717.12, "total_tokens": 283110464} {"current_steps": 1568, "total_steps": 9134, "loss": 0.8527, "learning_rate": 4.6451637362234604e-05, "epoch": 0.1716522072306303, "percentage": 17.17, "elapsed_time": "1 day, 4:57:44", "remaining_time": "5 days, 19:45:01", "throughput": 2717.21, "total_tokens": 283308256} {"current_steps": 1569, "total_steps": 9134, "loss": 0.5577, "learning_rate": 4.644722035466072e-05, "epoch": 0.1717616793015682, "percentage": 17.18, "elapsed_time": "1 day, 4:58:50", "remaining_time": "5 days, 19:43:52", "throughput": 2717.16, "total_tokens": 283481408} {"current_steps": 1570, "total_steps": 9134, "loss": 0.8266, "learning_rate": 4.644280080992166e-05, "epoch": 0.17187115137250608, "percentage": 17.19, "elapsed_time": "1 day, 4:59:56", "remaining_time": "5 days, 19:42:44", "throughput": 2717.33, "total_tokens": 283679872} {"current_steps": 1571, "total_steps": 9134, "loss": 0.6238, "learning_rate": 4.643837872854027e-05, "epoch": 0.171980623443444, "percentage": 17.2, "elapsed_time": "1 day, 5:01:01", "remaining_time": "5 days, 19:41:30", "throughput": 2717.34, "total_tokens": 283857056} {"current_steps": 1572, "total_steps": 9134, "loss": 0.8533, "learning_rate": 4.643395411103965e-05, "epoch": 0.1720900955143819, "percentage": 17.21, "elapsed_time": "1 day, 5:02:07", "remaining_time": "5 days, 19:40:24", "throughput": 2717.42, "total_tokens": 284046784} {"current_steps": 1573, "total_steps": 9134, "loss": 0.6206, "learning_rate": 4.642952695794323e-05, "epoch": 0.1721995675853198, "percentage": 17.22, "elapsed_time": "1 day, 5:03:13", "remaining_time": "5 days, 19:39:12", "throughput": 2717.37, "total_tokens": 284218592} {"current_steps": 1574, "total_steps": 9134, "loss": 0.7451, "learning_rate": 4.6425097269774744e-05, "epoch": 0.17230903965625768, "percentage": 17.23, "elapsed_time": "1 day, 5:04:20", "remaining_time": "5 days, 19:38:11", "throughput": 2717.45, "total_tokens": 284411232} {"current_steps": 1575, "total_steps": 9134, "loss": 0.7152, "learning_rate": 4.64206650470582e-05, "epoch": 0.1724185117271956, "percentage": 17.24, "elapsed_time": "1 day, 5:05:24", "remaining_time": "5 days, 19:36:51", "throughput": 2717.45, "total_tokens": 284583712} {"current_steps": 1576, "total_steps": 9134, "loss": 0.8709, "learning_rate": 4.6416230290317934e-05, "epoch": 0.1725279837981335, "percentage": 17.25, "elapsed_time": "1 day, 5:06:31", "remaining_time": "5 days, 19:35:46", "throughput": 2717.34, "total_tokens": 284754176} {"current_steps": 1577, "total_steps": 9134, "loss": 0.6065, "learning_rate": 4.641179300007857e-05, "epoch": 0.1726374558690714, "percentage": 17.27, "elapsed_time": "1 day, 5:07:35", "remaining_time": "5 days, 19:34:29", "throughput": 2717.05, "total_tokens": 284897984} {"current_steps": 1578, "total_steps": 9134, "loss": 0.713, "learning_rate": 4.640735317686502e-05, "epoch": 0.17274692794000931, "percentage": 17.28, "elapsed_time": "1 day, 5:08:44", "remaining_time": "5 days, 19:33:34", "throughput": 2716.86, "total_tokens": 285065536} {"current_steps": 1579, "total_steps": 9134, "loss": 0.7582, "learning_rate": 4.6402910821202525e-05, "epoch": 0.1728564000109472, "percentage": 17.29, "elapsed_time": "1 day, 5:09:49", "remaining_time": "5 days, 19:32:22", "throughput": 2716.81, "total_tokens": 285237568} {"current_steps": 1580, "total_steps": 9134, "loss": 0.8263, "learning_rate": 4.6398465933616585e-05, "epoch": 0.1729658720818851, "percentage": 17.3, "elapsed_time": "1 day, 5:10:59", "remaining_time": "5 days, 19:31:30", "throughput": 2716.9, "total_tokens": 285436032} {"current_steps": 1581, "total_steps": 9134, "loss": 0.6285, "learning_rate": 4.6394018514633033e-05, "epoch": 0.17307534415282302, "percentage": 17.31, "elapsed_time": "1 day, 5:12:08", "remaining_time": "5 days, 19:30:37", "throughput": 2716.95, "total_tokens": 285630016} {"current_steps": 1582, "total_steps": 9134, "loss": 0.7992, "learning_rate": 4.6389568564777994e-05, "epoch": 0.17318481622376092, "percentage": 17.32, "elapsed_time": "1 day, 5:13:18", "remaining_time": "5 days, 19:29:44", "throughput": 2716.67, "total_tokens": 285788608} {"current_steps": 1583, "total_steps": 9134, "loss": 0.8261, "learning_rate": 4.6385116084577874e-05, "epoch": 0.1732942882946988, "percentage": 17.33, "elapsed_time": "1 day, 5:14:24", "remaining_time": "5 days, 19:28:35", "throughput": 2716.63, "total_tokens": 285963104} {"current_steps": 1584, "total_steps": 9134, "loss": 0.7439, "learning_rate": 4.638066107455941e-05, "epoch": 0.1734037603656367, "percentage": 17.34, "elapsed_time": "1 day, 5:15:28", "remaining_time": "5 days, 19:27:17", "throughput": 2716.54, "total_tokens": 286128416} {"current_steps": 1585, "total_steps": 9134, "loss": 0.8627, "learning_rate": 4.637620353524962e-05, "epoch": 0.17351323243657463, "percentage": 17.35, "elapsed_time": "1 day, 5:16:35", "remaining_time": "5 days, 19:26:15", "throughput": 2716.51, "total_tokens": 286308288} {"current_steps": 1586, "total_steps": 9134, "loss": 0.7389, "learning_rate": 4.637174346717581e-05, "epoch": 0.17362270450751252, "percentage": 17.36, "elapsed_time": "1 day, 5:17:40", "remaining_time": "5 days, 19:25:03", "throughput": 2716.37, "total_tokens": 286471136} {"current_steps": 1587, "total_steps": 9134, "loss": 0.7723, "learning_rate": 4.63672808708656e-05, "epoch": 0.17373217657845041, "percentage": 17.37, "elapsed_time": "1 day, 5:18:46", "remaining_time": "5 days, 19:23:52", "throughput": 2716.38, "total_tokens": 286649664} {"current_steps": 1588, "total_steps": 9134, "loss": 0.5475, "learning_rate": 4.636281574684691e-05, "epoch": 0.17384164864938834, "percentage": 17.39, "elapsed_time": "1 day, 5:19:56", "remaining_time": "5 days, 19:23:01", "throughput": 2716.54, "total_tokens": 286856416} {"current_steps": 1589, "total_steps": 9134, "loss": 0.7104, "learning_rate": 4.635834809564796e-05, "epoch": 0.17395112072032623, "percentage": 17.4, "elapsed_time": "1 day, 5:21:02", "remaining_time": "5 days, 19:21:54", "throughput": 2716.51, "total_tokens": 287033152} {"current_steps": 1590, "total_steps": 9134, "loss": 0.5432, "learning_rate": 4.635387791779726e-05, "epoch": 0.17406059279126412, "percentage": 17.41, "elapsed_time": "1 day, 5:22:06", "remaining_time": "5 days, 19:20:34", "throughput": 2716.45, "total_tokens": 287200032} {"current_steps": 1591, "total_steps": 9134, "loss": 0.7116, "learning_rate": 4.634940521382362e-05, "epoch": 0.17417006486220202, "percentage": 17.42, "elapsed_time": "1 day, 5:23:15", "remaining_time": "5 days, 19:19:39", "throughput": 2716.48, "total_tokens": 287390880} {"current_steps": 1592, "total_steps": 9134, "loss": 0.7421, "learning_rate": 4.634492998425616e-05, "epoch": 0.17427953693313994, "percentage": 17.43, "elapsed_time": "1 day, 5:24:24", "remaining_time": "5 days, 19:18:46", "throughput": 2716.66, "total_tokens": 287597856} {"current_steps": 1593, "total_steps": 9134, "loss": 0.6394, "learning_rate": 4.6340452229624286e-05, "epoch": 0.17438900900407783, "percentage": 17.44, "elapsed_time": "1 day, 5:25:31", "remaining_time": "5 days, 19:17:43", "throughput": 2716.63, "total_tokens": 287777056} {"current_steps": 1594, "total_steps": 9134, "loss": 0.5943, "learning_rate": 4.6335971950457715e-05, "epoch": 0.17449848107501573, "percentage": 17.45, "elapsed_time": "1 day, 5:26:38", "remaining_time": "5 days, 19:16:37", "throughput": 2716.49, "total_tokens": 287943264} {"current_steps": 1595, "total_steps": 9134, "loss": 0.7475, "learning_rate": 4.6331489147286444e-05, "epoch": 0.17460795314595365, "percentage": 17.46, "elapsed_time": "1 day, 5:27:44", "remaining_time": "5 days, 19:15:29", "throughput": 2716.56, "total_tokens": 288130752} {"current_steps": 1596, "total_steps": 9134, "loss": 0.9054, "learning_rate": 4.632700382064079e-05, "epoch": 0.17471742521689154, "percentage": 17.47, "elapsed_time": "1 day, 5:28:48", "remaining_time": "5 days, 19:14:10", "throughput": 2716.39, "total_tokens": 288286208} {"current_steps": 1597, "total_steps": 9134, "loss": 0.7435, "learning_rate": 4.632251597105135e-05, "epoch": 0.17482689728782944, "percentage": 17.48, "elapsed_time": "1 day, 5:29:55", "remaining_time": "5 days, 19:13:04", "throughput": 2716.34, "total_tokens": 288461376} {"current_steps": 1598, "total_steps": 9134, "loss": 0.7022, "learning_rate": 4.631802559904903e-05, "epoch": 0.17493636935876736, "percentage": 17.5, "elapsed_time": "1 day, 5:31:01", "remaining_time": "5 days, 19:11:58", "throughput": 2716.36, "total_tokens": 288645056} {"current_steps": 1599, "total_steps": 9134, "loss": 0.6644, "learning_rate": 4.631353270516504e-05, "epoch": 0.17504584142970525, "percentage": 17.51, "elapsed_time": "1 day, 5:32:06", "remaining_time": "5 days, 19:10:44", "throughput": 2716.35, "total_tokens": 288820000} {"current_steps": 1600, "total_steps": 9134, "loss": 0.7047, "learning_rate": 4.6309037289930875e-05, "epoch": 0.17515531350064314, "percentage": 17.52, "elapsed_time": "1 day, 5:33:13", "remaining_time": "5 days, 19:09:41", "throughput": 2716.27, "total_tokens": 288994272} {"current_steps": 1601, "total_steps": 9134, "loss": 0.7493, "learning_rate": 4.630453935387833e-05, "epoch": 0.17526478557158104, "percentage": 17.53, "elapsed_time": "1 day, 5:34:22", "remaining_time": "5 days, 19:08:45", "throughput": 2716.48, "total_tokens": 289202816} {"current_steps": 1602, "total_steps": 9134, "loss": 0.6486, "learning_rate": 4.630003889753951e-05, "epoch": 0.17537425764251896, "percentage": 17.54, "elapsed_time": "1 day, 5:35:30", "remaining_time": "5 days, 19:07:45", "throughput": 2716.47, "total_tokens": 289386496} {"current_steps": 1603, "total_steps": 9134, "loss": 0.6121, "learning_rate": 4.629553592144681e-05, "epoch": 0.17548372971345685, "percentage": 17.55, "elapsed_time": "1 day, 5:36:36", "remaining_time": "5 days, 19:06:39", "throughput": 2716.6, "total_tokens": 289581824} {"current_steps": 1604, "total_steps": 9134, "loss": 0.6971, "learning_rate": 4.629103042613292e-05, "epoch": 0.17559320178439475, "percentage": 17.56, "elapsed_time": "1 day, 5:37:46", "remaining_time": "5 days, 19:05:47", "throughput": 2716.66, "total_tokens": 289776480} {"current_steps": 1605, "total_steps": 9134, "loss": 0.7046, "learning_rate": 4.628652241213083e-05, "epoch": 0.17570267385533267, "percentage": 17.57, "elapsed_time": "1 day, 5:38:47", "remaining_time": "5 days, 19:04:13", "throughput": 2716.54, "total_tokens": 289928352} {"current_steps": 1606, "total_steps": 9134, "loss": 0.8522, "learning_rate": 4.6282011879973833e-05, "epoch": 0.17581214592627056, "percentage": 17.58, "elapsed_time": "1 day, 5:39:54", "remaining_time": "5 days, 19:03:08", "throughput": 2716.55, "total_tokens": 290111136} {"current_steps": 1607, "total_steps": 9134, "loss": 0.9065, "learning_rate": 4.627749883019551e-05, "epoch": 0.17592161799720846, "percentage": 17.59, "elapsed_time": "1 day, 5:41:00", "remaining_time": "5 days, 19:02:03", "throughput": 2716.54, "total_tokens": 290292128} {"current_steps": 1608, "total_steps": 9134, "loss": 0.9542, "learning_rate": 4.627298326332975e-05, "epoch": 0.17603109006814635, "percentage": 17.6, "elapsed_time": "1 day, 5:42:09", "remaining_time": "5 days, 19:01:05", "throughput": 2716.73, "total_tokens": 290497760} {"current_steps": 1609, "total_steps": 9134, "loss": 0.5236, "learning_rate": 4.626846517991075e-05, "epoch": 0.17614056213908427, "percentage": 17.62, "elapsed_time": "1 day, 5:43:15", "remaining_time": "5 days, 19:00:00", "throughput": 2716.91, "total_tokens": 290698688} {"current_steps": 1610, "total_steps": 9134, "loss": 0.5208, "learning_rate": 4.626394458047296e-05, "epoch": 0.17625003421002217, "percentage": 17.63, "elapsed_time": "1 day, 5:44:20", "remaining_time": "5 days, 18:58:43", "throughput": 2716.83, "total_tokens": 290864448} {"current_steps": 1611, "total_steps": 9134, "loss": 0.6694, "learning_rate": 4.625942146555119e-05, "epoch": 0.17635950628096006, "percentage": 17.64, "elapsed_time": "1 day, 5:45:28", "remaining_time": "5 days, 18:57:47", "throughput": 2716.88, "total_tokens": 291056416} {"current_steps": 1612, "total_steps": 9134, "loss": 0.7317, "learning_rate": 4.62548958356805e-05, "epoch": 0.17646897835189798, "percentage": 17.65, "elapsed_time": "1 day, 5:46:36", "remaining_time": "5 days, 18:56:44", "throughput": 2716.97, "total_tokens": 291248832} {"current_steps": 1613, "total_steps": 9134, "loss": 0.6754, "learning_rate": 4.625036769139626e-05, "epoch": 0.17657845042283588, "percentage": 17.66, "elapsed_time": "1 day, 5:47:43", "remaining_time": "5 days, 18:55:42", "throughput": 2717.04, "total_tokens": 291439232} {"current_steps": 1614, "total_steps": 9134, "loss": 0.8223, "learning_rate": 4.624583703323415e-05, "epoch": 0.17668792249377377, "percentage": 17.67, "elapsed_time": "1 day, 5:48:49", "remaining_time": "5 days, 18:54:33", "throughput": 2716.87, "total_tokens": 291600960} {"current_steps": 1615, "total_steps": 9134, "loss": 0.7705, "learning_rate": 4.624130386173013e-05, "epoch": 0.1767973945647117, "percentage": 17.68, "elapsed_time": "1 day, 5:49:58", "remaining_time": "5 days, 18:53:37", "throughput": 2716.93, "total_tokens": 291793824} {"current_steps": 1616, "total_steps": 9134, "loss": 0.6863, "learning_rate": 4.623676817742047e-05, "epoch": 0.17690686663564958, "percentage": 17.69, "elapsed_time": "1 day, 5:51:01", "remaining_time": "5 days, 18:52:15", "throughput": 2716.7, "total_tokens": 291940768} {"current_steps": 1617, "total_steps": 9134, "loss": 0.5966, "learning_rate": 4.623222998084174e-05, "epoch": 0.17701633870658748, "percentage": 17.7, "elapsed_time": "1 day, 5:52:08", "remaining_time": "5 days, 18:51:10", "throughput": 2716.86, "total_tokens": 292139456} {"current_steps": 1618, "total_steps": 9134, "loss": 0.7892, "learning_rate": 4.6227689272530785e-05, "epoch": 0.17712581077752537, "percentage": 17.71, "elapsed_time": "1 day, 5:53:17", "remaining_time": "5 days, 18:50:17", "throughput": 2717.05, "total_tokens": 292348448} {"current_steps": 1619, "total_steps": 9134, "loss": 0.6496, "learning_rate": 4.622314605302477e-05, "epoch": 0.1772352828484633, "percentage": 17.72, "elapsed_time": "1 day, 5:54:23", "remaining_time": "5 days, 18:49:09", "throughput": 2717.19, "total_tokens": 292542880} {"current_steps": 1620, "total_steps": 9134, "loss": 0.7724, "learning_rate": 4.621860032286115e-05, "epoch": 0.1773447549194012, "percentage": 17.74, "elapsed_time": "1 day, 5:55:32", "remaining_time": "5 days, 18:48:11", "throughput": 2717.22, "total_tokens": 292732384} {"current_steps": 1621, "total_steps": 9134, "loss": 0.667, "learning_rate": 4.621405208257767e-05, "epoch": 0.17745422699033908, "percentage": 17.75, "elapsed_time": "1 day, 5:56:37", "remaining_time": "5 days, 18:47:01", "throughput": 2717.15, "total_tokens": 292902848} {"current_steps": 1622, "total_steps": 9134, "loss": 0.6736, "learning_rate": 4.620950133271239e-05, "epoch": 0.177563699061277, "percentage": 17.76, "elapsed_time": "1 day, 5:57:46", "remaining_time": "5 days, 18:46:05", "throughput": 2717.23, "total_tokens": 293098624} {"current_steps": 1623, "total_steps": 9134, "loss": 0.7815, "learning_rate": 4.620494807380365e-05, "epoch": 0.1776731711322149, "percentage": 17.77, "elapsed_time": "1 day, 5:58:53", "remaining_time": "5 days, 18:44:59", "throughput": 2717.46, "total_tokens": 293305152} {"current_steps": 1624, "total_steps": 9134, "loss": 0.6715, "learning_rate": 4.620039230639008e-05, "epoch": 0.1777826432031528, "percentage": 17.78, "elapsed_time": "1 day, 5:59:58", "remaining_time": "5 days, 18:43:44", "throughput": 2717.32, "total_tokens": 293465760} {"current_steps": 1625, "total_steps": 9134, "loss": 0.8146, "learning_rate": 4.619583403101063e-05, "epoch": 0.17789211527409068, "percentage": 17.79, "elapsed_time": "1 day, 6:01:03", "remaining_time": "5 days, 18:42:35", "throughput": 2717.17, "total_tokens": 293627712} {"current_steps": 1626, "total_steps": 9134, "loss": 0.9117, "learning_rate": 4.619127324820454e-05, "epoch": 0.1780015873450286, "percentage": 17.8, "elapsed_time": "1 day, 6:02:08", "remaining_time": "5 days, 18:41:21", "throughput": 2717.12, "total_tokens": 293799744} {"current_steps": 1627, "total_steps": 9134, "loss": 0.6862, "learning_rate": 4.6186709958511334e-05, "epoch": 0.1781110594159665, "percentage": 17.81, "elapsed_time": "1 day, 6:03:15", "remaining_time": "5 days, 18:40:15", "throughput": 2717.01, "total_tokens": 293968640} {"current_steps": 1628, "total_steps": 9134, "loss": 0.7929, "learning_rate": 4.618214416247084e-05, "epoch": 0.1782205314869044, "percentage": 17.82, "elapsed_time": "1 day, 6:04:24", "remaining_time": "5 days, 18:39:18", "throughput": 2716.98, "total_tokens": 294150752} {"current_steps": 1629, "total_steps": 9134, "loss": 0.8336, "learning_rate": 4.617757586062319e-05, "epoch": 0.17833000355784231, "percentage": 17.83, "elapsed_time": "1 day, 6:05:31", "remaining_time": "5 days, 18:38:16", "throughput": 2716.86, "total_tokens": 294321664} {"current_steps": 1630, "total_steps": 9134, "loss": 0.584, "learning_rate": 4.61730050535088e-05, "epoch": 0.1784394756287802, "percentage": 17.85, "elapsed_time": "1 day, 6:06:40", "remaining_time": "5 days, 18:37:19", "throughput": 2716.77, "total_tokens": 294498400} {"current_steps": 1631, "total_steps": 9134, "loss": 0.6597, "learning_rate": 4.6168431741668386e-05, "epoch": 0.1785489476997181, "percentage": 17.86, "elapsed_time": "1 day, 6:07:43", "remaining_time": "5 days, 18:35:58", "throughput": 2716.66, "total_tokens": 294658112} {"current_steps": 1632, "total_steps": 9134, "loss": 0.6758, "learning_rate": 4.6163855925642955e-05, "epoch": 0.17865841977065602, "percentage": 17.87, "elapsed_time": "1 day, 6:08:52", "remaining_time": "5 days, 18:35:04", "throughput": 2716.83, "total_tokens": 294864864} {"current_steps": 1633, "total_steps": 9134, "loss": 0.8215, "learning_rate": 4.6159277605973836e-05, "epoch": 0.17876789184159392, "percentage": 17.88, "elapsed_time": "1 day, 6:09:58", "remaining_time": "5 days, 18:33:56", "throughput": 2716.92, "total_tokens": 295054592} {"current_steps": 1634, "total_steps": 9134, "loss": 0.5943, "learning_rate": 4.615469678320262e-05, "epoch": 0.1788773639125318, "percentage": 17.89, "elapsed_time": "1 day, 6:11:03", "remaining_time": "5 days, 18:32:43", "throughput": 2717.04, "total_tokens": 295243872} {"current_steps": 1635, "total_steps": 9134, "loss": 0.9439, "learning_rate": 4.615011345787122e-05, "epoch": 0.1789868359834697, "percentage": 17.9, "elapsed_time": "1 day, 6:12:11", "remaining_time": "5 days, 18:31:40", "throughput": 2717.11, "total_tokens": 295434944} {"current_steps": 1636, "total_steps": 9134, "loss": 0.7777, "learning_rate": 4.6145527630521834e-05, "epoch": 0.17909630805440763, "percentage": 17.91, "elapsed_time": "1 day, 6:13:18", "remaining_time": "5 days, 18:30:37", "throughput": 2717.04, "total_tokens": 295609888} {"current_steps": 1637, "total_steps": 9134, "loss": 0.7905, "learning_rate": 4.614093930169695e-05, "epoch": 0.17920578012534552, "percentage": 17.92, "elapsed_time": "1 day, 6:14:25", "remaining_time": "5 days, 18:29:33", "throughput": 2716.89, "total_tokens": 295775424} {"current_steps": 1638, "total_steps": 9134, "loss": 0.6148, "learning_rate": 4.613634847193936e-05, "epoch": 0.17931525219628341, "percentage": 17.93, "elapsed_time": "1 day, 6:15:33", "remaining_time": "5 days, 18:28:32", "throughput": 2717.02, "total_tokens": 295973888} {"current_steps": 1639, "total_steps": 9134, "loss": 0.7418, "learning_rate": 4.613175514179215e-05, "epoch": 0.17942472426722134, "percentage": 17.94, "elapsed_time": "1 day, 6:16:37", "remaining_time": "5 days, 18:27:14", "throughput": 2717.08, "total_tokens": 296153760} {"current_steps": 1640, "total_steps": 9134, "loss": 0.7874, "learning_rate": 4.6127159311798705e-05, "epoch": 0.17953419633815923, "percentage": 17.95, "elapsed_time": "1 day, 6:17:45", "remaining_time": "5 days, 18:26:16", "throughput": 2717.21, "total_tokens": 296353568} {"current_steps": 1641, "total_steps": 9134, "loss": 0.6322, "learning_rate": 4.61225609825027e-05, "epoch": 0.17964366840909712, "percentage": 17.97, "elapsed_time": "1 day, 6:18:52", "remaining_time": "5 days, 18:25:13", "throughput": 2717.21, "total_tokens": 296537248} {"current_steps": 1642, "total_steps": 9134, "loss": 0.7468, "learning_rate": 4.6117960154448115e-05, "epoch": 0.17975314048003502, "percentage": 17.98, "elapsed_time": "1 day, 6:20:02", "remaining_time": "5 days, 18:24:20", "throughput": 2717.26, "total_tokens": 296731008} {"current_steps": 1643, "total_steps": 9134, "loss": 0.7362, "learning_rate": 4.611335682817921e-05, "epoch": 0.17986261255097294, "percentage": 17.99, "elapsed_time": "1 day, 6:21:11", "remaining_time": "5 days, 18:23:27", "throughput": 2717.32, "total_tokens": 296926336} {"current_steps": 1644, "total_steps": 9134, "loss": 0.7212, "learning_rate": 4.610875100424056e-05, "epoch": 0.17997208462191083, "percentage": 18.0, "elapsed_time": "1 day, 6:22:12", "remaining_time": "5 days, 18:21:55", "throughput": 2717.07, "total_tokens": 297065216} {"current_steps": 1645, "total_steps": 9134, "loss": 0.5876, "learning_rate": 4.610414268317701e-05, "epoch": 0.18008155669284873, "percentage": 18.01, "elapsed_time": "1 day, 6:23:21", "remaining_time": "5 days, 18:20:58", "throughput": 2716.93, "total_tokens": 297235680} {"current_steps": 1646, "total_steps": 9134, "loss": 0.6713, "learning_rate": 4.609953186553373e-05, "epoch": 0.18019102876378665, "percentage": 18.02, "elapsed_time": "1 day, 6:24:29", "remaining_time": "5 days, 18:20:01", "throughput": 2717.05, "total_tokens": 297435040} {"current_steps": 1647, "total_steps": 9134, "loss": 0.587, "learning_rate": 4.609491855185616e-05, "epoch": 0.18030050083472454, "percentage": 18.03, "elapsed_time": "1 day, 6:25:34", "remaining_time": "5 days, 18:18:45", "throughput": 2716.87, "total_tokens": 297590496} {"current_steps": 1648, "total_steps": 9134, "loss": 0.6131, "learning_rate": 4.609030274269006e-05, "epoch": 0.18040997290566244, "percentage": 18.04, "elapsed_time": "1 day, 6:26:41", "remaining_time": "5 days, 18:17:40", "throughput": 2716.64, "total_tokens": 297746624} {"current_steps": 1649, "total_steps": 9134, "loss": 0.6679, "learning_rate": 4.6085684438581464e-05, "epoch": 0.18051944497660036, "percentage": 18.05, "elapsed_time": "1 day, 6:27:49", "remaining_time": "5 days, 18:16:41", "throughput": 2716.54, "total_tokens": 297921120} {"current_steps": 1650, "total_steps": 9134, "loss": 0.6286, "learning_rate": 4.60810636400767e-05, "epoch": 0.18062891704753825, "percentage": 18.06, "elapsed_time": "1 day, 6:28:55", "remaining_time": "5 days, 18:15:35", "throughput": 2716.58, "total_tokens": 298105696} {"current_steps": 1651, "total_steps": 9134, "loss": 0.7899, "learning_rate": 4.6076440347722415e-05, "epoch": 0.18073838911847614, "percentage": 18.08, "elapsed_time": "1 day, 6:30:03", "remaining_time": "5 days, 18:14:32", "throughput": 2716.55, "total_tokens": 298285792} {"current_steps": 1652, "total_steps": 9134, "loss": 0.7693, "learning_rate": 4.6071814562065524e-05, "epoch": 0.18084786118941404, "percentage": 18.09, "elapsed_time": "1 day, 6:31:12", "remaining_time": "5 days, 18:13:39", "throughput": 2716.61, "total_tokens": 298481568} {"current_steps": 1653, "total_steps": 9134, "loss": 0.707, "learning_rate": 4.6067186283653255e-05, "epoch": 0.18095733326035196, "percentage": 18.1, "elapsed_time": "1 day, 6:32:18", "remaining_time": "5 days, 18:12:28", "throughput": 2716.47, "total_tokens": 298643296} {"current_steps": 1654, "total_steps": 9134, "loss": 0.7795, "learning_rate": 4.606255551303312e-05, "epoch": 0.18106680533128985, "percentage": 18.11, "elapsed_time": "1 day, 6:33:24", "remaining_time": "5 days, 18:11:21", "throughput": 2716.61, "total_tokens": 298839744} {"current_steps": 1655, "total_steps": 9134, "loss": 0.7214, "learning_rate": 4.6057922250752935e-05, "epoch": 0.18117627740222775, "percentage": 18.12, "elapsed_time": "1 day, 6:34:32", "remaining_time": "5 days, 18:10:19", "throughput": 2716.57, "total_tokens": 299018496} {"current_steps": 1656, "total_steps": 9134, "loss": 0.7098, "learning_rate": 4.60532864973608e-05, "epoch": 0.18128574947316567, "percentage": 18.13, "elapsed_time": "1 day, 6:35:41", "remaining_time": "5 days, 18:09:27", "throughput": 2716.82, "total_tokens": 299235776} {"current_steps": 1657, "total_steps": 9134, "loss": 0.7857, "learning_rate": 4.604864825340512e-05, "epoch": 0.18139522154410356, "percentage": 18.14, "elapsed_time": "1 day, 6:36:50", "remaining_time": "5 days, 18:08:31", "throughput": 2716.83, "total_tokens": 299423936} {"current_steps": 1658, "total_steps": 9134, "loss": 0.6768, "learning_rate": 4.6044007519434594e-05, "epoch": 0.18150469361504146, "percentage": 18.15, "elapsed_time": "1 day, 6:37:56", "remaining_time": "5 days, 18:07:21", "throughput": 2716.62, "total_tokens": 299578720} {"current_steps": 1659, "total_steps": 9134, "loss": 0.6078, "learning_rate": 4.603936429599821e-05, "epoch": 0.18161416568597935, "percentage": 18.16, "elapsed_time": "1 day, 6:39:02", "remaining_time": "5 days, 18:06:10", "throughput": 2716.34, "total_tokens": 299726112} {"current_steps": 1660, "total_steps": 9134, "loss": 0.818, "learning_rate": 4.6034718583645244e-05, "epoch": 0.18172363775691727, "percentage": 18.17, "elapsed_time": "1 day, 6:40:11", "remaining_time": "5 days, 18:05:16", "throughput": 2716.36, "total_tokens": 299916960} {"current_steps": 1661, "total_steps": 9134, "loss": 0.6143, "learning_rate": 4.603007038292528e-05, "epoch": 0.18183310982785517, "percentage": 18.18, "elapsed_time": "1 day, 6:41:20", "remaining_time": "5 days, 18:04:22", "throughput": 2716.46, "total_tokens": 300115648} {"current_steps": 1662, "total_steps": 9134, "loss": 0.7028, "learning_rate": 4.602541969438819e-05, "epoch": 0.18194258189879306, "percentage": 18.2, "elapsed_time": "1 day, 6:42:26", "remaining_time": "5 days, 18:03:14", "throughput": 2716.32, "total_tokens": 300279840} {"current_steps": 1663, "total_steps": 9134, "loss": 0.7645, "learning_rate": 4.602076651858416e-05, "epoch": 0.18205205396973098, "percentage": 18.21, "elapsed_time": "1 day, 6:43:36", "remaining_time": "5 days, 18:02:22", "throughput": 2716.63, "total_tokens": 300503392} {"current_steps": 1664, "total_steps": 9134, "loss": 0.7749, "learning_rate": 4.601611085606362e-05, "epoch": 0.18216152604066888, "percentage": 18.22, "elapsed_time": "1 day, 6:44:42", "remaining_time": "5 days, 18:01:14", "throughput": 2716.76, "total_tokens": 300698496} {"current_steps": 1665, "total_steps": 9134, "loss": 0.6195, "learning_rate": 4.601145270737735e-05, "epoch": 0.18227099811160677, "percentage": 18.23, "elapsed_time": "1 day, 6:45:47", "remaining_time": "5 days, 18:00:01", "throughput": 2716.65, "total_tokens": 300862016} {"current_steps": 1666, "total_steps": 9134, "loss": 0.7233, "learning_rate": 4.6006792073076385e-05, "epoch": 0.1823804701825447, "percentage": 18.24, "elapsed_time": "1 day, 6:46:54", "remaining_time": "5 days, 17:58:54", "throughput": 2716.79, "total_tokens": 301058688} {"current_steps": 1667, "total_steps": 9134, "loss": 0.8297, "learning_rate": 4.600212895371208e-05, "epoch": 0.18248994225348258, "percentage": 18.25, "elapsed_time": "1 day, 6:48:01", "remaining_time": "5 days, 17:57:51", "throughput": 2716.73, "total_tokens": 301235200} {"current_steps": 1668, "total_steps": 9134, "loss": 0.873, "learning_rate": 4.5997463349836066e-05, "epoch": 0.18259941432442048, "percentage": 18.26, "elapsed_time": "1 day, 6:49:08", "remaining_time": "5 days, 17:56:47", "throughput": 2716.95, "total_tokens": 301441504} {"current_steps": 1669, "total_steps": 9134, "loss": 0.6468, "learning_rate": 4.5992795262000285e-05, "epoch": 0.18270888639535837, "percentage": 18.27, "elapsed_time": "1 day, 6:50:13", "remaining_time": "5 days, 17:55:36", "throughput": 2716.7, "total_tokens": 301591808} {"current_steps": 1670, "total_steps": 9134, "loss": 0.8206, "learning_rate": 4.598812469075695e-05, "epoch": 0.1828183584662963, "percentage": 18.28, "elapsed_time": "1 day, 6:51:22", "remaining_time": "5 days, 17:54:40", "throughput": 2716.78, "total_tokens": 301788032} {"current_steps": 1671, "total_steps": 9134, "loss": 0.695, "learning_rate": 4.598345163665859e-05, "epoch": 0.1829278305372342, "percentage": 18.29, "elapsed_time": "1 day, 6:52:32", "remaining_time": "5 days, 17:53:49", "throughput": 2716.93, "total_tokens": 301994784} {"current_steps": 1672, "total_steps": 9134, "loss": 0.6364, "learning_rate": 4.5978776100258006e-05, "epoch": 0.18303730260817208, "percentage": 18.31, "elapsed_time": "1 day, 6:53:36", "remaining_time": "5 days, 17:52:31", "throughput": 2716.83, "total_tokens": 302156960} {"current_steps": 1673, "total_steps": 9134, "loss": 0.8763, "learning_rate": 4.597409808210832e-05, "epoch": 0.18314677467911, "percentage": 18.32, "elapsed_time": "1 day, 6:54:46", "remaining_time": "5 days, 17:51:37", "throughput": 2716.89, "total_tokens": 302351840} {"current_steps": 1674, "total_steps": 9134, "loss": 0.7779, "learning_rate": 4.596941758276293e-05, "epoch": 0.1832562467500479, "percentage": 18.33, "elapsed_time": "1 day, 6:55:54", "remaining_time": "5 days, 17:50:37", "throughput": 2717.04, "total_tokens": 302553664} {"current_steps": 1675, "total_steps": 9134, "loss": 0.7778, "learning_rate": 4.596473460277553e-05, "epoch": 0.1833657188209858, "percentage": 18.34, "elapsed_time": "1 day, 6:57:01", "remaining_time": "5 days, 17:49:36", "throughput": 2717.19, "total_tokens": 302754144} {"current_steps": 1676, "total_steps": 9134, "loss": 0.5931, "learning_rate": 4.5960049142700096e-05, "epoch": 0.1834751908919237, "percentage": 18.35, "elapsed_time": "1 day, 6:58:07", "remaining_time": "5 days, 17:48:28", "throughput": 2717.17, "total_tokens": 302931776} {"current_steps": 1677, "total_steps": 9134, "loss": 0.6655, "learning_rate": 4.595536120309092e-05, "epoch": 0.1835846629628616, "percentage": 18.36, "elapsed_time": "1 day, 6:59:14", "remaining_time": "5 days, 17:47:23", "throughput": 2717.19, "total_tokens": 303115232} {"current_steps": 1678, "total_steps": 9134, "loss": 0.8402, "learning_rate": 4.595067078450257e-05, "epoch": 0.1836941350337995, "percentage": 18.37, "elapsed_time": "1 day, 7:00:19", "remaining_time": "5 days, 17:46:07", "throughput": 2717.27, "total_tokens": 303300032} {"current_steps": 1679, "total_steps": 9134, "loss": 0.8069, "learning_rate": 4.5945977887489925e-05, "epoch": 0.1838036071047374, "percentage": 18.38, "elapsed_time": "1 day, 7:01:28", "remaining_time": "5 days, 17:45:12", "throughput": 2717.5, "total_tokens": 303513504} {"current_steps": 1680, "total_steps": 9134, "loss": 0.4643, "learning_rate": 4.594128251260813e-05, "epoch": 0.18391307917567531, "percentage": 18.39, "elapsed_time": "1 day, 7:02:36", "remaining_time": "5 days, 17:44:13", "throughput": 2717.5, "total_tokens": 303698976} {"current_steps": 1681, "total_steps": 9134, "loss": 0.7694, "learning_rate": 4.593658466041265e-05, "epoch": 0.1840225512466132, "percentage": 18.4, "elapsed_time": "1 day, 7:03:38", "remaining_time": "5 days, 17:42:45", "throughput": 2717.39, "total_tokens": 303853536} {"current_steps": 1682, "total_steps": 9134, "loss": 0.6043, "learning_rate": 4.593188433145923e-05, "epoch": 0.1841320233175511, "percentage": 18.41, "elapsed_time": "1 day, 7:04:46", "remaining_time": "5 days, 17:41:46", "throughput": 2717.4, "total_tokens": 304040128} {"current_steps": 1683, "total_steps": 9134, "loss": 0.5601, "learning_rate": 4.5927181526303906e-05, "epoch": 0.18424149538848902, "percentage": 18.43, "elapsed_time": "1 day, 7:05:50", "remaining_time": "5 days, 17:40:29", "throughput": 2717.38, "total_tokens": 304212608} {"current_steps": 1684, "total_steps": 9134, "loss": 1.0625, "learning_rate": 4.592247624550301e-05, "epoch": 0.18435096745942692, "percentage": 18.44, "elapsed_time": "1 day, 7:06:58", "remaining_time": "5 days, 17:39:29", "throughput": 2717.63, "total_tokens": 304425184} {"current_steps": 1685, "total_steps": 9134, "loss": 0.7646, "learning_rate": 4.591776848961318e-05, "epoch": 0.1844604395303648, "percentage": 18.45, "elapsed_time": "1 day, 7:08:08", "remaining_time": "5 days, 17:38:39", "throughput": 2717.84, "total_tokens": 304639328} {"current_steps": 1686, "total_steps": 9134, "loss": 0.6684, "learning_rate": 4.591305825919132e-05, "epoch": 0.1845699116013027, "percentage": 18.46, "elapsed_time": "1 day, 7:09:17", "remaining_time": "5 days, 17:37:40", "throughput": 2717.77, "total_tokens": 304817408} {"current_steps": 1687, "total_steps": 9134, "loss": 0.702, "learning_rate": 4.590834555479465e-05, "epoch": 0.18467938367224063, "percentage": 18.47, "elapsed_time": "1 day, 7:10:26", "remaining_time": "5 days, 17:36:46", "throughput": 2717.8, "total_tokens": 305009824} {"current_steps": 1688, "total_steps": 9134, "loss": 0.604, "learning_rate": 4.590363037698067e-05, "epoch": 0.18478885574317852, "percentage": 18.48, "elapsed_time": "1 day, 7:11:31", "remaining_time": "5 days, 17:35:32", "throughput": 2717.78, "total_tokens": 305182976} {"current_steps": 1689, "total_steps": 9134, "loss": 0.8205, "learning_rate": 4.589891272630717e-05, "epoch": 0.18489832781411641, "percentage": 18.49, "elapsed_time": "1 day, 7:12:36", "remaining_time": "5 days, 17:34:22", "throughput": 2717.72, "total_tokens": 305355008} {"current_steps": 1690, "total_steps": 9134, "loss": 0.8788, "learning_rate": 4.5894192603332254e-05, "epoch": 0.18500779988505434, "percentage": 18.5, "elapsed_time": "1 day, 7:13:43", "remaining_time": "5 days, 17:33:14", "throughput": 2717.84, "total_tokens": 305548544} {"current_steps": 1691, "total_steps": 9134, "loss": 0.6037, "learning_rate": 4.58894700086143e-05, "epoch": 0.18511727195599223, "percentage": 18.51, "elapsed_time": "1 day, 7:14:49", "remaining_time": "5 days, 17:32:07", "throughput": 2717.96, "total_tokens": 305742304} {"current_steps": 1692, "total_steps": 9134, "loss": 0.9564, "learning_rate": 4.5884744942711964e-05, "epoch": 0.18522674402693012, "percentage": 18.52, "elapsed_time": "1 day, 7:15:58", "remaining_time": "5 days, 17:31:12", "throughput": 2718.14, "total_tokens": 305950848} {"current_steps": 1693, "total_steps": 9134, "loss": 0.819, "learning_rate": 4.588001740618424e-05, "epoch": 0.18533621609786805, "percentage": 18.54, "elapsed_time": "1 day, 7:17:06", "remaining_time": "5 days, 17:30:10", "throughput": 2718.02, "total_tokens": 306120640} {"current_steps": 1694, "total_steps": 9134, "loss": 0.8601, "learning_rate": 4.587528739959036e-05, "epoch": 0.18544568816880594, "percentage": 18.55, "elapsed_time": "1 day, 7:18:12", "remaining_time": "5 days, 17:29:00", "throughput": 2718.04, "total_tokens": 306301632} {"current_steps": 1695, "total_steps": 9134, "loss": 0.6594, "learning_rate": 4.58705549234899e-05, "epoch": 0.18555516023974383, "percentage": 18.56, "elapsed_time": "1 day, 7:19:15", "remaining_time": "5 days, 17:27:38", "throughput": 2717.76, "total_tokens": 306441632} {"current_steps": 1696, "total_steps": 9134, "loss": 0.6408, "learning_rate": 4.5865819978442685e-05, "epoch": 0.18566463231068173, "percentage": 18.57, "elapsed_time": "1 day, 7:20:16", "remaining_time": "5 days, 17:26:08", "throughput": 2717.58, "total_tokens": 306586784} {"current_steps": 1697, "total_steps": 9134, "loss": 0.8256, "learning_rate": 4.586108256500885e-05, "epoch": 0.18577410438161965, "percentage": 18.58, "elapsed_time": "1 day, 7:21:22", "remaining_time": "5 days, 17:24:59", "throughput": 2717.57, "total_tokens": 306764864} {"current_steps": 1698, "total_steps": 9134, "loss": 0.5926, "learning_rate": 4.585634268374884e-05, "epoch": 0.18588357645255754, "percentage": 18.59, "elapsed_time": "1 day, 7:22:28", "remaining_time": "5 days, 17:23:50", "throughput": 2717.76, "total_tokens": 306965568} {"current_steps": 1699, "total_steps": 9134, "loss": 0.5739, "learning_rate": 4.585160033522335e-05, "epoch": 0.18599304852349544, "percentage": 18.6, "elapsed_time": "1 day, 7:23:34", "remaining_time": "5 days, 17:22:41", "throughput": 2717.66, "total_tokens": 307133792} {"current_steps": 1700, "total_steps": 9134, "loss": 0.7133, "learning_rate": 4.5846855519993404e-05, "epoch": 0.18610252059443336, "percentage": 18.61, "elapsed_time": "1 day, 7:24:39", "remaining_time": "5 days, 17:21:29", "throughput": 2717.4, "total_tokens": 307281632} {"current_steps": 1701, "total_steps": 9134, "loss": 0.7289, "learning_rate": 4.584210823862031e-05, "epoch": 0.18621199266537125, "percentage": 18.62, "elapsed_time": "1 day, 7:25:48", "remaining_time": "5 days, 17:20:32", "throughput": 2717.16, "total_tokens": 307441792} {"current_steps": 1702, "total_steps": 9134, "loss": 0.5245, "learning_rate": 4.583735849166564e-05, "epoch": 0.18632146473630914, "percentage": 18.63, "elapsed_time": "1 day, 7:26:53", "remaining_time": "5 days, 17:19:21", "throughput": 2717.05, "total_tokens": 307607328} {"current_steps": 1703, "total_steps": 9134, "loss": 0.7066, "learning_rate": 4.583260627969131e-05, "epoch": 0.18643093680724704, "percentage": 18.64, "elapsed_time": "1 day, 7:27:56", "remaining_time": "5 days, 17:17:58", "throughput": 2716.92, "total_tokens": 307763008} {"current_steps": 1704, "total_steps": 9134, "loss": 0.7144, "learning_rate": 4.5827851603259475e-05, "epoch": 0.18654040887818496, "percentage": 18.66, "elapsed_time": "1 day, 7:29:02", "remaining_time": "5 days, 17:16:52", "throughput": 2716.8, "total_tokens": 307930336} {"current_steps": 1705, "total_steps": 9134, "loss": 0.9109, "learning_rate": 4.582309446293261e-05, "epoch": 0.18664988094912285, "percentage": 18.67, "elapsed_time": "1 day, 7:30:07", "remaining_time": "5 days, 17:15:36", "throughput": 2716.72, "total_tokens": 308096320} {"current_steps": 1706, "total_steps": 9134, "loss": 0.6924, "learning_rate": 4.581833485927348e-05, "epoch": 0.18675935302006075, "percentage": 18.68, "elapsed_time": "1 day, 7:31:12", "remaining_time": "5 days, 17:14:22", "throughput": 2716.65, "total_tokens": 308263648} {"current_steps": 1707, "total_steps": 9134, "loss": 0.7552, "learning_rate": 4.5813572792845134e-05, "epoch": 0.18686882509099867, "percentage": 18.69, "elapsed_time": "1 day, 7:32:18", "remaining_time": "5 days, 17:13:16", "throughput": 2716.41, "total_tokens": 308417984} {"current_steps": 1708, "total_steps": 9134, "loss": 0.6805, "learning_rate": 4.580880826421091e-05, "epoch": 0.18697829716193656, "percentage": 18.7, "elapsed_time": "1 day, 7:33:28", "remaining_time": "5 days, 17:12:22", "throughput": 2716.54, "total_tokens": 308620256} {"current_steps": 1709, "total_steps": 9134, "loss": 0.7154, "learning_rate": 4.580404127393445e-05, "epoch": 0.18708776923287446, "percentage": 18.71, "elapsed_time": "1 day, 7:34:35", "remaining_time": "5 days, 17:11:19", "throughput": 2716.58, "total_tokens": 308807744} {"current_steps": 1710, "total_steps": 9134, "loss": 0.5956, "learning_rate": 4.579927182257968e-05, "epoch": 0.18719724130381238, "percentage": 18.72, "elapsed_time": "1 day, 7:35:44", "remaining_time": "5 days, 17:10:21", "throughput": 2716.41, "total_tokens": 308975072} {"current_steps": 1711, "total_steps": 9134, "loss": 0.8904, "learning_rate": 4.579449991071082e-05, "epoch": 0.18730671337475027, "percentage": 18.73, "elapsed_time": "1 day, 7:36:50", "remaining_time": "5 days, 17:09:17", "throughput": 2716.42, "total_tokens": 309158080} {"current_steps": 1712, "total_steps": 9134, "loss": 0.5257, "learning_rate": 4.578972553889237e-05, "epoch": 0.18741618544568817, "percentage": 18.74, "elapsed_time": "1 day, 7:37:56", "remaining_time": "5 days, 17:08:06", "throughput": 2716.45, "total_tokens": 309339968} {"current_steps": 1713, "total_steps": 9134, "loss": 0.8125, "learning_rate": 4.578494870768912e-05, "epoch": 0.18752565751662606, "percentage": 18.75, "elapsed_time": "1 day, 7:39:05", "remaining_time": "5 days, 17:07:11", "throughput": 2716.42, "total_tokens": 309524096} {"current_steps": 1714, "total_steps": 9134, "loss": 0.9795, "learning_rate": 4.578016941766619e-05, "epoch": 0.18763512958756398, "percentage": 18.77, "elapsed_time": "1 day, 7:40:15", "remaining_time": "5 days, 17:06:18", "throughput": 2716.47, "total_tokens": 309719424} {"current_steps": 1715, "total_steps": 9134, "loss": 0.5501, "learning_rate": 4.5775387669388935e-05, "epoch": 0.18774460165850188, "percentage": 18.78, "elapsed_time": "1 day, 7:41:22", "remaining_time": "5 days, 17:05:17", "throughput": 2716.57, "total_tokens": 309914976} {"current_steps": 1716, "total_steps": 9134, "loss": 0.7762, "learning_rate": 4.5770603463423035e-05, "epoch": 0.18785407372943977, "percentage": 18.79, "elapsed_time": "1 day, 7:42:30", "remaining_time": "5 days, 17:04:13", "throughput": 2716.61, "total_tokens": 310101344} {"current_steps": 1717, "total_steps": 9134, "loss": 0.7358, "learning_rate": 4.576581680033445e-05, "epoch": 0.1879635458003777, "percentage": 18.8, "elapsed_time": "1 day, 7:43:39", "remaining_time": "5 days, 17:03:17", "throughput": 2716.59, "total_tokens": 310286816} {"current_steps": 1718, "total_steps": 9134, "loss": 0.7913, "learning_rate": 4.576102768068944e-05, "epoch": 0.18807301787131558, "percentage": 18.81, "elapsed_time": "1 day, 7:44:47", "remaining_time": "5 days, 17:02:17", "throughput": 2716.51, "total_tokens": 310462432} {"current_steps": 1719, "total_steps": 9134, "loss": 0.6864, "learning_rate": 4.5756236105054534e-05, "epoch": 0.18818248994225348, "percentage": 18.82, "elapsed_time": "1 day, 7:45:47", "remaining_time": "5 days, 17:00:45", "throughput": 2716.28, "total_tokens": 310600864} {"current_steps": 1720, "total_steps": 9134, "loss": 0.7649, "learning_rate": 4.575144207399658e-05, "epoch": 0.18829196201319137, "percentage": 18.83, "elapsed_time": "1 day, 7:46:56", "remaining_time": "5 days, 16:59:49", "throughput": 2716.34, "total_tokens": 310794624} {"current_steps": 1721, "total_steps": 9134, "loss": 0.556, "learning_rate": 4.574664558808271e-05, "epoch": 0.1884014340841293, "percentage": 18.84, "elapsed_time": "1 day, 7:48:02", "remaining_time": "5 days, 16:58:40", "throughput": 2716.14, "total_tokens": 310951424} {"current_steps": 1722, "total_steps": 9134, "loss": 0.7297, "learning_rate": 4.574184664788031e-05, "epoch": 0.1885109061550672, "percentage": 18.85, "elapsed_time": "1 day, 7:49:10", "remaining_time": "5 days, 16:57:39", "throughput": 2716.1, "total_tokens": 311130848} {"current_steps": 1723, "total_steps": 9134, "loss": 0.7508, "learning_rate": 4.573704525395711e-05, "epoch": 0.18862037822600508, "percentage": 18.86, "elapsed_time": "1 day, 7:50:19", "remaining_time": "5 days, 16:56:42", "throughput": 2716.21, "total_tokens": 311330656} {"current_steps": 1724, "total_steps": 9134, "loss": 0.7034, "learning_rate": 4.573224140688111e-05, "epoch": 0.188729850296943, "percentage": 18.87, "elapsed_time": "1 day, 7:51:21", "remaining_time": "5 days, 16:55:19", "throughput": 2716.04, "total_tokens": 311480288} {"current_steps": 1725, "total_steps": 9134, "loss": 0.5854, "learning_rate": 4.5727435107220576e-05, "epoch": 0.1888393223678809, "percentage": 18.89, "elapsed_time": "1 day, 7:52:25", "remaining_time": "5 days, 16:53:58", "throughput": 2716.05, "total_tokens": 311653216} {"current_steps": 1726, "total_steps": 9134, "loss": 0.6283, "learning_rate": 4.5722626355544085e-05, "epoch": 0.1889487944388188, "percentage": 18.9, "elapsed_time": "1 day, 7:53:28", "remaining_time": "5 days, 16:52:37", "throughput": 2715.73, "total_tokens": 311787616} {"current_steps": 1727, "total_steps": 9134, "loss": 0.8857, "learning_rate": 4.5717815152420515e-05, "epoch": 0.1890582665097567, "percentage": 18.91, "elapsed_time": "1 day, 7:54:34", "remaining_time": "5 days, 16:51:29", "throughput": 2715.86, "total_tokens": 311982944} {"current_steps": 1728, "total_steps": 9134, "loss": 0.8558, "learning_rate": 4.5713001498419025e-05, "epoch": 0.1891677385806946, "percentage": 18.92, "elapsed_time": "1 day, 7:55:41", "remaining_time": "5 days, 16:50:26", "throughput": 2715.84, "total_tokens": 312163040} {"current_steps": 1729, "total_steps": 9134, "loss": 0.7916, "learning_rate": 4.570818539410905e-05, "epoch": 0.1892772106516325, "percentage": 18.93, "elapsed_time": "1 day, 7:56:48", "remaining_time": "5 days, 16:49:22", "throughput": 2715.81, "total_tokens": 312342240} {"current_steps": 1730, "total_steps": 9134, "loss": 0.6366, "learning_rate": 4.5703366840060335e-05, "epoch": 0.1893866827225704, "percentage": 18.94, "elapsed_time": "1 day, 7:57:54", "remaining_time": "5 days, 16:48:11", "throughput": 2715.75, "total_tokens": 312512928} {"current_steps": 1731, "total_steps": 9134, "loss": 0.7346, "learning_rate": 4.5698545836842896e-05, "epoch": 0.18949615479350831, "percentage": 18.95, "elapsed_time": "1 day, 7:59:02", "remaining_time": "5 days, 16:47:10", "throughput": 2715.58, "total_tokens": 312678016} {"current_steps": 1732, "total_steps": 9134, "loss": 0.7743, "learning_rate": 4.569372238502705e-05, "epoch": 0.1896056268644462, "percentage": 18.96, "elapsed_time": "1 day, 8:00:10", "remaining_time": "5 days, 16:46:10", "throughput": 2715.37, "total_tokens": 312838400} {"current_steps": 1733, "total_steps": 9134, "loss": 0.7329, "learning_rate": 4.568889648518341e-05, "epoch": 0.1897150989353841, "percentage": 18.97, "elapsed_time": "1 day, 8:01:12", "remaining_time": "5 days, 16:44:46", "throughput": 2715.25, "total_tokens": 312994528} {"current_steps": 1734, "total_steps": 9134, "loss": 0.8068, "learning_rate": 4.568406813788287e-05, "epoch": 0.18982457100632202, "percentage": 18.98, "elapsed_time": "1 day, 8:02:16", "remaining_time": "5 days, 16:43:30", "throughput": 2715.28, "total_tokens": 313172384} {"current_steps": 1735, "total_steps": 9134, "loss": 0.7402, "learning_rate": 4.5679237343696604e-05, "epoch": 0.18993404307725992, "percentage": 18.99, "elapsed_time": "1 day, 8:03:24", "remaining_time": "5 days, 16:42:30", "throughput": 2715.31, "total_tokens": 313359872} {"current_steps": 1736, "total_steps": 9134, "loss": 0.7864, "learning_rate": 4.567440410319609e-05, "epoch": 0.1900435151481978, "percentage": 19.01, "elapsed_time": "1 day, 8:04:34", "remaining_time": "5 days, 16:41:35", "throughput": 2715.07, "total_tokens": 313520704} {"current_steps": 1737, "total_steps": 9134, "loss": 0.9233, "learning_rate": 4.56695684169531e-05, "epoch": 0.1901529872191357, "percentage": 19.02, "elapsed_time": "1 day, 8:05:40", "remaining_time": "5 days, 16:40:29", "throughput": 2715.17, "total_tokens": 313712224} {"current_steps": 1738, "total_steps": 9134, "loss": 0.8014, "learning_rate": 4.5664730285539684e-05, "epoch": 0.19026245929007363, "percentage": 19.03, "elapsed_time": "1 day, 8:06:47", "remaining_time": "5 days, 16:39:22", "throughput": 2715.24, "total_tokens": 313900832} {"current_steps": 1739, "total_steps": 9134, "loss": 0.7296, "learning_rate": 4.565988970952817e-05, "epoch": 0.19037193136101152, "percentage": 19.04, "elapsed_time": "1 day, 8:07:53", "remaining_time": "5 days, 16:38:16", "throughput": 2715.28, "total_tokens": 314086304} {"current_steps": 1740, "total_steps": 9134, "loss": 0.761, "learning_rate": 4.5655046689491204e-05, "epoch": 0.19048140343194941, "percentage": 19.05, "elapsed_time": "1 day, 8:09:02", "remaining_time": "5 days, 16:37:19", "throughput": 2715.2, "total_tokens": 314264384} {"current_steps": 1741, "total_steps": 9134, "loss": 0.7569, "learning_rate": 4.56502012260017e-05, "epoch": 0.19059087550288734, "percentage": 19.06, "elapsed_time": "1 day, 8:10:07", "remaining_time": "5 days, 16:36:05", "throughput": 2714.89, "total_tokens": 314404608} {"current_steps": 1742, "total_steps": 9134, "loss": 0.6949, "learning_rate": 4.564535331963287e-05, "epoch": 0.19070034757382523, "percentage": 19.07, "elapsed_time": "1 day, 8:11:13", "remaining_time": "5 days, 16:34:57", "throughput": 2714.82, "total_tokens": 314576192} {"current_steps": 1743, "total_steps": 9134, "loss": 0.6304, "learning_rate": 4.56405029709582e-05, "epoch": 0.19080981964476312, "percentage": 19.08, "elapsed_time": "1 day, 8:12:19", "remaining_time": "5 days, 16:33:49", "throughput": 2714.68, "total_tokens": 314738592} {"current_steps": 1744, "total_steps": 9134, "loss": 0.6863, "learning_rate": 4.5635650180551494e-05, "epoch": 0.19091929171570104, "percentage": 19.09, "elapsed_time": "1 day, 8:13:26", "remaining_time": "5 days, 16:32:43", "throughput": 2714.72, "total_tokens": 314924960} {"current_steps": 1745, "total_steps": 9134, "loss": 0.5743, "learning_rate": 4.5630794948986814e-05, "epoch": 0.19102876378663894, "percentage": 19.1, "elapsed_time": "1 day, 8:14:25", "remaining_time": "5 days, 16:31:07", "throughput": 2714.47, "total_tokens": 315058016} {"current_steps": 1746, "total_steps": 9134, "loss": 0.6203, "learning_rate": 4.562593727683854e-05, "epoch": 0.19113823585757683, "percentage": 19.12, "elapsed_time": "1 day, 8:15:33", "remaining_time": "5 days, 16:30:06", "throughput": 2714.58, "total_tokens": 315254912} {"current_steps": 1747, "total_steps": 9134, "loss": 0.6785, "learning_rate": 4.562107716468131e-05, "epoch": 0.19124770792851473, "percentage": 19.13, "elapsed_time": "1 day, 8:16:37", "remaining_time": "5 days, 16:28:50", "throughput": 2714.57, "total_tokens": 315426944} {"current_steps": 1748, "total_steps": 9134, "loss": 0.6488, "learning_rate": 4.561621461309007e-05, "epoch": 0.19135717999945265, "percentage": 19.14, "elapsed_time": "1 day, 8:17:43", "remaining_time": "5 days, 16:27:40", "throughput": 2714.71, "total_tokens": 315621824} {"current_steps": 1749, "total_steps": 9134, "loss": 0.7032, "learning_rate": 4.561134962264006e-05, "epoch": 0.19146665207039054, "percentage": 19.15, "elapsed_time": "1 day, 8:18:52", "remaining_time": "5 days, 16:26:42", "throughput": 2714.79, "total_tokens": 315816928} {"current_steps": 1750, "total_steps": 9134, "loss": 0.6696, "learning_rate": 4.560648219390678e-05, "epoch": 0.19157612414132844, "percentage": 19.16, "elapsed_time": "1 day, 8:20:00", "remaining_time": "5 days, 16:25:44", "throughput": 2714.61, "total_tokens": 315982688} {"current_steps": 1751, "total_steps": 9134, "loss": 0.8413, "learning_rate": 4.560161232746606e-05, "epoch": 0.19168559621226636, "percentage": 19.17, "elapsed_time": "1 day, 8:21:09", "remaining_time": "5 days, 16:24:47", "throughput": 2714.83, "total_tokens": 316194816} {"current_steps": 1752, "total_steps": 9134, "loss": 0.8308, "learning_rate": 4.5596740023893986e-05, "epoch": 0.19179506828320425, "percentage": 19.18, "elapsed_time": "1 day, 8:22:17", "remaining_time": "5 days, 16:23:48", "throughput": 2715.09, "total_tokens": 316410752} {"current_steps": 1753, "total_steps": 9134, "loss": 0.54, "learning_rate": 4.559186528376694e-05, "epoch": 0.19190454035414214, "percentage": 19.19, "elapsed_time": "1 day, 8:23:24", "remaining_time": "5 days, 16:22:41", "throughput": 2715.11, "total_tokens": 316593088} {"current_steps": 1754, "total_steps": 9134, "loss": 0.7964, "learning_rate": 4.558698810766159e-05, "epoch": 0.19201401242508004, "percentage": 19.2, "elapsed_time": "1 day, 8:24:27", "remaining_time": "5 days, 16:21:19", "throughput": 2715.14, "total_tokens": 316767808} {"current_steps": 1755, "total_steps": 9134, "loss": 0.4845, "learning_rate": 4.558210849615491e-05, "epoch": 0.19212348449601796, "percentage": 19.21, "elapsed_time": "1 day, 8:25:34", "remaining_time": "5 days, 16:20:16", "throughput": 2715.01, "total_tokens": 316934688} {"current_steps": 1756, "total_steps": 9134, "loss": 0.7998, "learning_rate": 4.557722644982414e-05, "epoch": 0.19223295656695585, "percentage": 19.22, "elapsed_time": "1 day, 8:26:38", "remaining_time": "5 days, 16:19:00", "throughput": 2715.0, "total_tokens": 317108288} {"current_steps": 1757, "total_steps": 9134, "loss": 0.6236, "learning_rate": 4.5572341969246814e-05, "epoch": 0.19234242863789375, "percentage": 19.24, "elapsed_time": "1 day, 8:27:45", "remaining_time": "5 days, 16:17:54", "throughput": 2714.95, "total_tokens": 317283456} {"current_steps": 1758, "total_steps": 9134, "loss": 0.8564, "learning_rate": 4.556745505500076e-05, "epoch": 0.19245190070883167, "percentage": 19.25, "elapsed_time": "1 day, 8:28:53", "remaining_time": "5 days, 16:16:54", "throughput": 2714.99, "total_tokens": 317472960} {"current_steps": 1759, "total_steps": 9134, "loss": 0.5888, "learning_rate": 4.55625657076641e-05, "epoch": 0.19256137277976956, "percentage": 19.26, "elapsed_time": "1 day, 8:30:01", "remaining_time": "5 days, 16:15:54", "throughput": 2715.06, "total_tokens": 317666496} {"current_steps": 1760, "total_steps": 9134, "loss": 0.8448, "learning_rate": 4.555767392781522e-05, "epoch": 0.19267084485070746, "percentage": 19.27, "elapsed_time": "1 day, 8:31:10", "remaining_time": "5 days, 16:15:00", "throughput": 2715.14, "total_tokens": 317863840} {"current_steps": 1761, "total_steps": 9134, "loss": 0.7811, "learning_rate": 4.5552779716032815e-05, "epoch": 0.19278031692164538, "percentage": 19.28, "elapsed_time": "1 day, 8:32:17", "remaining_time": "5 days, 16:13:55", "throughput": 2715.11, "total_tokens": 318042368} {"current_steps": 1762, "total_steps": 9134, "loss": 0.8339, "learning_rate": 4.554788307289585e-05, "epoch": 0.19288978899258327, "percentage": 19.29, "elapsed_time": "1 day, 8:33:27", "remaining_time": "5 days, 16:13:00", "throughput": 2715.31, "total_tokens": 318253600} {"current_steps": 1763, "total_steps": 9134, "loss": 0.7666, "learning_rate": 4.5542983998983605e-05, "epoch": 0.19299926106352117, "percentage": 19.3, "elapsed_time": "1 day, 8:34:36", "remaining_time": "5 days, 16:12:04", "throughput": 2715.24, "total_tokens": 318432576} {"current_steps": 1764, "total_steps": 9134, "loss": 0.4976, "learning_rate": 4.5538082494875626e-05, "epoch": 0.19310873313445906, "percentage": 19.31, "elapsed_time": "1 day, 8:35:41", "remaining_time": "5 days, 16:10:52", "throughput": 2715.01, "total_tokens": 318582880} {"current_steps": 1765, "total_steps": 9134, "loss": 0.8529, "learning_rate": 4.553317856115176e-05, "epoch": 0.19321820520539698, "percentage": 19.32, "elapsed_time": "1 day, 8:36:50", "remaining_time": "5 days, 16:09:56", "throughput": 2715.11, "total_tokens": 318781568} {"current_steps": 1766, "total_steps": 9134, "loss": 0.7746, "learning_rate": 4.552827219839211e-05, "epoch": 0.19332767727633487, "percentage": 19.33, "elapsed_time": "1 day, 8:37:55", "remaining_time": "5 days, 16:08:45", "throughput": 2715.11, "total_tokens": 318959872} {"current_steps": 1767, "total_steps": 9134, "loss": 0.5816, "learning_rate": 4.55233634071771e-05, "epoch": 0.19343714934727277, "percentage": 19.35, "elapsed_time": "1 day, 8:39:02", "remaining_time": "5 days, 16:07:40", "throughput": 2715.18, "total_tokens": 319149152} {"current_steps": 1768, "total_steps": 9134, "loss": 0.89, "learning_rate": 4.5518452188087444e-05, "epoch": 0.1935466214182107, "percentage": 19.36, "elapsed_time": "1 day, 8:40:06", "remaining_time": "5 days, 16:06:21", "throughput": 2715.09, "total_tokens": 319311104} {"current_steps": 1769, "total_steps": 9134, "loss": 0.7718, "learning_rate": 4.551353854170411e-05, "epoch": 0.19365609348914858, "percentage": 19.37, "elapsed_time": "1 day, 8:41:12", "remaining_time": "5 days, 16:05:12", "throughput": 2715.08, "total_tokens": 319489184} {"current_steps": 1770, "total_steps": 9134, "loss": 0.7554, "learning_rate": 4.550862246860839e-05, "epoch": 0.19376556556008648, "percentage": 19.38, "elapsed_time": "1 day, 8:42:21", "remaining_time": "5 days, 16:04:19", "throughput": 2715.09, "total_tokens": 319679584} {"current_steps": 1771, "total_steps": 9134, "loss": 0.7449, "learning_rate": 4.5503703969381826e-05, "epoch": 0.19387503763102437, "percentage": 19.39, "elapsed_time": "1 day, 8:43:30", "remaining_time": "5 days, 16:03:21", "throughput": 2715.2, "total_tokens": 319879392} {"current_steps": 1772, "total_steps": 9134, "loss": 0.6338, "learning_rate": 4.5498783044606285e-05, "epoch": 0.1939845097019623, "percentage": 19.4, "elapsed_time": "1 day, 8:44:36", "remaining_time": "5 days, 16:02:13", "throughput": 2715.08, "total_tokens": 320044256} {"current_steps": 1773, "total_steps": 9134, "loss": 0.6581, "learning_rate": 4.5493859694863894e-05, "epoch": 0.1940939817729002, "percentage": 19.41, "elapsed_time": "1 day, 8:45:45", "remaining_time": "5 days, 16:01:18", "throughput": 2715.15, "total_tokens": 320241152} {"current_steps": 1774, "total_steps": 9134, "loss": 0.8496, "learning_rate": 4.5488933920737087e-05, "epoch": 0.19420345384383808, "percentage": 19.42, "elapsed_time": "1 day, 8:46:48", "remaining_time": "5 days, 15:59:55", "throughput": 2714.99, "total_tokens": 320391680} {"current_steps": 1775, "total_steps": 9134, "loss": 0.7812, "learning_rate": 4.5484005722808566e-05, "epoch": 0.194312925914776, "percentage": 19.43, "elapsed_time": "1 day, 8:47:57", "remaining_time": "5 days, 15:59:00", "throughput": 2715.1, "total_tokens": 320592832} {"current_steps": 1776, "total_steps": 9134, "loss": 0.7774, "learning_rate": 4.5479075101661316e-05, "epoch": 0.1944223979857139, "percentage": 19.44, "elapsed_time": "1 day, 8:49:00", "remaining_time": "5 days, 15:57:38", "throughput": 2715.05, "total_tokens": 320757696} {"current_steps": 1777, "total_steps": 9134, "loss": 0.664, "learning_rate": 4.5474142057878636e-05, "epoch": 0.1945318700566518, "percentage": 19.45, "elapsed_time": "1 day, 8:50:09", "remaining_time": "5 days, 15:56:43", "throughput": 2715.24, "total_tokens": 320967584} {"current_steps": 1778, "total_steps": 9134, "loss": 0.806, "learning_rate": 4.546920659204409e-05, "epoch": 0.1946413421275897, "percentage": 19.47, "elapsed_time": "1 day, 8:51:15", "remaining_time": "5 days, 15:55:33", "throughput": 2715.16, "total_tokens": 321136704} {"current_steps": 1779, "total_steps": 9134, "loss": 0.7577, "learning_rate": 4.546426870474154e-05, "epoch": 0.1947508141985276, "percentage": 19.48, "elapsed_time": "1 day, 8:52:25", "remaining_time": "5 days, 15:54:39", "throughput": 2715.36, "total_tokens": 321349504} {"current_steps": 1780, "total_steps": 9134, "loss": 0.7678, "learning_rate": 4.5459328396555114e-05, "epoch": 0.1948602862694655, "percentage": 19.49, "elapsed_time": "1 day, 8:53:34", "remaining_time": "5 days, 15:53:43", "throughput": 2715.54, "total_tokens": 321558720} {"current_steps": 1781, "total_steps": 9134, "loss": 0.693, "learning_rate": 4.545438566806925e-05, "epoch": 0.1949697583404034, "percentage": 19.5, "elapsed_time": "1 day, 8:54:40", "remaining_time": "5 days, 15:52:35", "throughput": 2715.56, "total_tokens": 321740160} {"current_steps": 1782, "total_steps": 9134, "loss": 0.7572, "learning_rate": 4.5449440519868675e-05, "epoch": 0.19507923041134131, "percentage": 19.51, "elapsed_time": "1 day, 8:55:46", "remaining_time": "5 days, 15:51:25", "throughput": 2715.65, "total_tokens": 321929888} {"current_steps": 1783, "total_steps": 9134, "loss": 0.5926, "learning_rate": 4.544449295253837e-05, "epoch": 0.1951887024822792, "percentage": 19.52, "elapsed_time": "1 day, 8:56:46", "remaining_time": "5 days, 15:49:53", "throughput": 2715.33, "total_tokens": 322055328} {"current_steps": 1784, "total_steps": 9134, "loss": 0.708, "learning_rate": 4.543954296666363e-05, "epoch": 0.1952981745532171, "percentage": 19.53, "elapsed_time": "1 day, 8:57:50", "remaining_time": "5 days, 15:48:35", "throughput": 2715.24, "total_tokens": 322217728} {"current_steps": 1785, "total_steps": 9134, "loss": 0.6501, "learning_rate": 4.5434590562830035e-05, "epoch": 0.19540764662415502, "percentage": 19.54, "elapsed_time": "1 day, 8:58:57", "remaining_time": "5 days, 15:47:32", "throughput": 2715.22, "total_tokens": 322398048} {"current_steps": 1786, "total_steps": 9134, "loss": 0.7077, "learning_rate": 4.542963574162344e-05, "epoch": 0.19551711869509292, "percentage": 19.55, "elapsed_time": "1 day, 9:00:01", "remaining_time": "5 days, 15:46:17", "throughput": 2715.13, "total_tokens": 322562688} {"current_steps": 1787, "total_steps": 9134, "loss": 0.6376, "learning_rate": 4.542467850363e-05, "epoch": 0.1956265907660308, "percentage": 19.56, "elapsed_time": "1 day, 9:01:08", "remaining_time": "5 days, 15:45:10", "throughput": 2715.14, "total_tokens": 322744352} {"current_steps": 1788, "total_steps": 9134, "loss": 1.2777, "learning_rate": 4.541971884943613e-05, "epoch": 0.1957360628369687, "percentage": 19.58, "elapsed_time": "1 day, 9:02:18", "remaining_time": "5 days, 15:44:17", "throughput": 2715.39, "total_tokens": 322963424} {"current_steps": 1789, "total_steps": 9134, "loss": 0.8742, "learning_rate": 4.5414756779628556e-05, "epoch": 0.19584553490790663, "percentage": 19.59, "elapsed_time": "1 day, 9:03:27", "remaining_time": "5 days, 15:43:21", "throughput": 2715.38, "total_tokens": 323149792} {"current_steps": 1790, "total_steps": 9134, "loss": 0.6351, "learning_rate": 4.5409792294794284e-05, "epoch": 0.19595500697884452, "percentage": 19.6, "elapsed_time": "1 day, 9:04:34", "remaining_time": "5 days, 15:42:19", "throughput": 2715.42, "total_tokens": 323338176} {"current_steps": 1791, "total_steps": 9134, "loss": 0.6919, "learning_rate": 4.54048253955206e-05, "epoch": 0.19606447904978241, "percentage": 19.61, "elapsed_time": "1 day, 9:05:37", "remaining_time": "5 days, 15:40:56", "throughput": 2715.35, "total_tokens": 323499904} {"current_steps": 1792, "total_steps": 9134, "loss": 0.787, "learning_rate": 4.5399856082395074e-05, "epoch": 0.19617395112072034, "percentage": 19.62, "elapsed_time": "1 day, 9:06:44", "remaining_time": "5 days, 15:39:53", "throughput": 2715.36, "total_tokens": 323684480} {"current_steps": 1793, "total_steps": 9134, "loss": 0.6584, "learning_rate": 4.5394884356005574e-05, "epoch": 0.19628342319165823, "percentage": 19.63, "elapsed_time": "1 day, 9:07:50", "remaining_time": "5 days, 15:38:45", "throughput": 2715.41, "total_tokens": 323868832} {"current_steps": 1794, "total_steps": 9134, "loss": 0.9239, "learning_rate": 4.538991021694025e-05, "epoch": 0.19639289526259612, "percentage": 19.64, "elapsed_time": "1 day, 9:08:56", "remaining_time": "5 days, 15:37:36", "throughput": 2715.35, "total_tokens": 324041312} {"current_steps": 1795, "total_steps": 9134, "loss": 0.764, "learning_rate": 4.5384933665787524e-05, "epoch": 0.19650236733353404, "percentage": 19.65, "elapsed_time": "1 day, 9:10:06", "remaining_time": "5 days, 15:36:42", "throughput": 2715.52, "total_tokens": 324250304} {"current_steps": 1796, "total_steps": 9134, "loss": 0.7487, "learning_rate": 4.537995470313611e-05, "epoch": 0.19661183940447194, "percentage": 19.66, "elapsed_time": "1 day, 9:11:10", "remaining_time": "5 days, 15:35:24", "throughput": 2715.42, "total_tokens": 324412032} {"current_steps": 1797, "total_steps": 9134, "loss": 0.6143, "learning_rate": 4.537497332957501e-05, "epoch": 0.19672131147540983, "percentage": 19.67, "elapsed_time": "1 day, 9:12:14", "remaining_time": "5 days, 15:34:11", "throughput": 2715.45, "total_tokens": 324591008} {"current_steps": 1798, "total_steps": 9134, "loss": 0.8605, "learning_rate": 4.536998954569353e-05, "epoch": 0.19683078354634773, "percentage": 19.68, "elapsed_time": "1 day, 9:13:20", "remaining_time": "5 days, 15:33:00", "throughput": 2715.35, "total_tokens": 324757888} {"current_steps": 1799, "total_steps": 9134, "loss": 0.5422, "learning_rate": 4.536500335208121e-05, "epoch": 0.19694025561728565, "percentage": 19.7, "elapsed_time": "1 day, 9:14:24", "remaining_time": "5 days, 15:31:44", "throughput": 2715.36, "total_tokens": 324932160} {"current_steps": 1800, "total_steps": 9134, "loss": 0.7896, "learning_rate": 4.536001474932793e-05, "epoch": 0.19704972768822354, "percentage": 19.71, "elapsed_time": "1 day, 9:15:33", "remaining_time": "5 days, 15:30:48", "throughput": 2715.48, "total_tokens": 325134880} {"current_steps": 1801, "total_steps": 9134, "loss": 0.92, "learning_rate": 4.535502373802383e-05, "epoch": 0.19715919975916144, "percentage": 19.72, "elapsed_time": "1 day, 9:16:37", "remaining_time": "5 days, 15:29:30", "throughput": 2715.36, "total_tokens": 325292800} {"current_steps": 1802, "total_steps": 9134, "loss": 0.9008, "learning_rate": 4.535003031875934e-05, "epoch": 0.19726867183009936, "percentage": 19.73, "elapsed_time": "1 day, 9:17:45", "remaining_time": "5 days, 15:28:30", "throughput": 2715.41, "total_tokens": 325484096} {"current_steps": 1803, "total_steps": 9134, "loss": 0.6776, "learning_rate": 4.534503449212516e-05, "epoch": 0.19737814390103725, "percentage": 19.74, "elapsed_time": "1 day, 9:18:52", "remaining_time": "5 days, 15:27:25", "throughput": 2715.48, "total_tokens": 325674272} {"current_steps": 1804, "total_steps": 9134, "loss": 0.6254, "learning_rate": 4.534003625871229e-05, "epoch": 0.19748761597197514, "percentage": 19.75, "elapsed_time": "1 day, 9:20:01", "remaining_time": "5 days, 15:26:27", "throughput": 2715.5, "total_tokens": 325862656} {"current_steps": 1805, "total_steps": 9134, "loss": 0.8917, "learning_rate": 4.533503561911202e-05, "epoch": 0.19759708804291304, "percentage": 19.76, "elapsed_time": "1 day, 9:21:10", "remaining_time": "5 days, 15:25:33", "throughput": 2715.55, "total_tokens": 326057984} {"current_steps": 1806, "total_steps": 9134, "loss": 0.8582, "learning_rate": 4.5330032573915903e-05, "epoch": 0.19770656011385096, "percentage": 19.77, "elapsed_time": "1 day, 9:22:14", "remaining_time": "5 days, 15:24:17", "throughput": 2715.55, "total_tokens": 326232256} {"current_steps": 1807, "total_steps": 9134, "loss": 0.734, "learning_rate": 4.53250271237158e-05, "epoch": 0.19781603218478885, "percentage": 19.78, "elapsed_time": "1 day, 9:23:20", "remaining_time": "5 days, 15:23:07", "throughput": 2715.57, "total_tokens": 326412800} {"current_steps": 1808, "total_steps": 9134, "loss": 0.7288, "learning_rate": 4.532001926910385e-05, "epoch": 0.19792550425572675, "percentage": 19.79, "elapsed_time": "1 day, 9:24:25", "remaining_time": "5 days, 15:21:55", "throughput": 2715.56, "total_tokens": 326589312} {"current_steps": 1809, "total_steps": 9134, "loss": 0.812, "learning_rate": 4.531500901067246e-05, "epoch": 0.19803497632666467, "percentage": 19.81, "elapsed_time": "1 day, 9:25:34", "remaining_time": "5 days, 15:20:56", "throughput": 2715.57, "total_tokens": 326775008} {"current_steps": 1810, "total_steps": 9134, "loss": 0.7664, "learning_rate": 4.5309996349014336e-05, "epoch": 0.19814444839760256, "percentage": 19.82, "elapsed_time": "1 day, 9:26:38", "remaining_time": "5 days, 15:19:41", "throughput": 2715.59, "total_tokens": 326953536} {"current_steps": 1811, "total_steps": 9134, "loss": 0.684, "learning_rate": 4.5304981284722484e-05, "epoch": 0.19825392046854046, "percentage": 19.83, "elapsed_time": "1 day, 9:27:44", "remaining_time": "5 days, 15:18:31", "throughput": 2715.62, "total_tokens": 327135424} {"current_steps": 1812, "total_steps": 9134, "loss": 0.8002, "learning_rate": 4.5299963818390144e-05, "epoch": 0.19836339253947838, "percentage": 19.84, "elapsed_time": "1 day, 9:28:51", "remaining_time": "5 days, 15:17:28", "throughput": 2715.72, "total_tokens": 327329632} {"current_steps": 1813, "total_steps": 9134, "loss": 0.7857, "learning_rate": 4.5294943950610904e-05, "epoch": 0.19847286461041627, "percentage": 19.85, "elapsed_time": "1 day, 9:29:53", "remaining_time": "5 days, 15:16:04", "throughput": 2715.56, "total_tokens": 327479936} {"current_steps": 1814, "total_steps": 9134, "loss": 0.6425, "learning_rate": 4.528992168197859e-05, "epoch": 0.19858233668135417, "percentage": 19.86, "elapsed_time": "1 day, 9:31:01", "remaining_time": "5 days, 15:15:04", "throughput": 2715.59, "total_tokens": 327668320} {"current_steps": 1815, "total_steps": 9134, "loss": 0.7205, "learning_rate": 4.5284897013087326e-05, "epoch": 0.19869180875229206, "percentage": 19.87, "elapsed_time": "1 day, 9:32:06", "remaining_time": "5 days, 15:13:51", "throughput": 2715.57, "total_tokens": 327841920} {"current_steps": 1816, "total_steps": 9134, "loss": 0.8387, "learning_rate": 4.527986994453152e-05, "epoch": 0.19880128082322998, "percentage": 19.88, "elapsed_time": "1 day, 9:33:16", "remaining_time": "5 days, 15:12:59", "throughput": 2715.68, "total_tokens": 328045536} {"current_steps": 1817, "total_steps": 9134, "loss": 0.5109, "learning_rate": 4.5274840476905873e-05, "epoch": 0.19891075289416787, "percentage": 19.89, "elapsed_time": "1 day, 9:34:21", "remaining_time": "5 days, 15:11:44", "throughput": 2715.58, "total_tokens": 328208832} {"current_steps": 1818, "total_steps": 9134, "loss": 0.8093, "learning_rate": 4.526980861080535e-05, "epoch": 0.19902022496510577, "percentage": 19.9, "elapsed_time": "1 day, 9:35:30", "remaining_time": "5 days, 15:10:49", "throughput": 2715.59, "total_tokens": 328397888} {"current_steps": 1819, "total_steps": 9134, "loss": 0.6252, "learning_rate": 4.5264774346825226e-05, "epoch": 0.1991296970360437, "percentage": 19.91, "elapsed_time": "1 day, 9:36:38", "remaining_time": "5 days, 15:09:47", "throughput": 2715.46, "total_tokens": 328565216} {"current_steps": 1820, "total_steps": 9134, "loss": 0.7201, "learning_rate": 4.5259737685561035e-05, "epoch": 0.19923916910698158, "percentage": 19.93, "elapsed_time": "1 day, 9:37:44", "remaining_time": "5 days, 15:08:38", "throughput": 2715.52, "total_tokens": 328753152} {"current_steps": 1821, "total_steps": 9134, "loss": 0.7332, "learning_rate": 4.52546986276086e-05, "epoch": 0.19934864117791948, "percentage": 19.94, "elapsed_time": "1 day, 9:38:51", "remaining_time": "5 days, 15:07:36", "throughput": 2715.65, "total_tokens": 328952512} {"current_steps": 1822, "total_steps": 9134, "loss": 0.5897, "learning_rate": 4.524965717356405e-05, "epoch": 0.19945811324885737, "percentage": 19.95, "elapsed_time": "1 day, 9:40:00", "remaining_time": "5 days, 15:06:37", "throughput": 2715.71, "total_tokens": 329144704} {"current_steps": 1823, "total_steps": 9134, "loss": 0.5396, "learning_rate": 4.524461332402375e-05, "epoch": 0.1995675853197953, "percentage": 19.96, "elapsed_time": "1 day, 9:41:08", "remaining_time": "5 days, 15:05:39", "throughput": 2715.66, "total_tokens": 329324800} {"current_steps": 1824, "total_steps": 9134, "loss": 0.6519, "learning_rate": 4.523956707958441e-05, "epoch": 0.1996770573907332, "percentage": 19.97, "elapsed_time": "1 day, 9:42:12", "remaining_time": "5 days, 15:04:20", "throughput": 2715.58, "total_tokens": 329487200} {"current_steps": 1825, "total_steps": 9134, "loss": 0.8408, "learning_rate": 4.523451844084297e-05, "epoch": 0.19978652946167108, "percentage": 19.98, "elapsed_time": "1 day, 9:43:17", "remaining_time": "5 days, 15:03:10", "throughput": 2715.69, "total_tokens": 329679392} {"current_steps": 1826, "total_steps": 9134, "loss": 0.6825, "learning_rate": 4.5229467408396686e-05, "epoch": 0.199896001532609, "percentage": 19.99, "elapsed_time": "1 day, 9:44:23", "remaining_time": "5 days, 15:02:00", "throughput": 2715.62, "total_tokens": 329848960} {"current_steps": 1827, "total_steps": 9134, "loss": 0.7168, "learning_rate": 4.5224413982843075e-05, "epoch": 0.2000054736035469, "percentage": 20.0, "elapsed_time": "1 day, 9:45:27", "remaining_time": "5 days, 15:00:43", "throughput": 2715.54, "total_tokens": 330012704} {"current_steps": 1828, "total_steps": 9134, "loss": 0.6705, "learning_rate": 4.521935816477995e-05, "epoch": 0.2001149456744848, "percentage": 20.01, "elapsed_time": "1 day, 9:46:34", "remaining_time": "5 days, 14:59:38", "throughput": 2715.66, "total_tokens": 330208704} {"current_steps": 1829, "total_steps": 9134, "loss": 0.5973, "learning_rate": 4.5214299954805404e-05, "epoch": 0.2002244177454227, "percentage": 20.02, "elapsed_time": "1 day, 9:47:36", "remaining_time": "5 days, 14:58:13", "throughput": 2715.54, "total_tokens": 330363040} {"current_steps": 1830, "total_steps": 9134, "loss": 0.6642, "learning_rate": 4.520923935351782e-05, "epoch": 0.2003338898163606, "percentage": 20.04, "elapsed_time": "1 day, 9:48:43", "remaining_time": "5 days, 14:57:10", "throughput": 2715.59, "total_tokens": 330551648} {"current_steps": 1831, "total_steps": 9134, "loss": 0.6393, "learning_rate": 4.520417636151586e-05, "epoch": 0.2004433618872985, "percentage": 20.05, "elapsed_time": "1 day, 9:49:50", "remaining_time": "5 days, 14:56:05", "throughput": 2715.59, "total_tokens": 330732640} {"current_steps": 1832, "total_steps": 9134, "loss": 0.728, "learning_rate": 4.5199110979398454e-05, "epoch": 0.2005528339582364, "percentage": 20.06, "elapsed_time": "1 day, 9:51:00", "remaining_time": "5 days, 14:55:11", "throughput": 2715.53, "total_tokens": 330914528} {"current_steps": 1833, "total_steps": 9134, "loss": 0.6575, "learning_rate": 4.5194043207764835e-05, "epoch": 0.20066230602917431, "percentage": 20.07, "elapsed_time": "1 day, 9:52:06", "remaining_time": "5 days, 14:54:03", "throughput": 2715.74, "total_tokens": 331119712} {"current_steps": 1834, "total_steps": 9134, "loss": 0.7018, "learning_rate": 4.5188973047214514e-05, "epoch": 0.2007717781001122, "percentage": 20.08, "elapsed_time": "1 day, 9:53:13", "remaining_time": "5 days, 14:52:58", "throughput": 2715.73, "total_tokens": 331300704} {"current_steps": 1835, "total_steps": 9134, "loss": 0.6257, "learning_rate": 4.518390049834727e-05, "epoch": 0.2008812501710501, "percentage": 20.09, "elapsed_time": "1 day, 9:54:22", "remaining_time": "5 days, 14:52:02", "throughput": 2715.76, "total_tokens": 331492224} {"current_steps": 1836, "total_steps": 9134, "loss": 0.7575, "learning_rate": 4.517882556176318e-05, "epoch": 0.20099072224198802, "percentage": 20.1, "elapsed_time": "1 day, 9:55:29", "remaining_time": "5 days, 14:50:58", "throughput": 2715.51, "total_tokens": 331644768} {"current_steps": 1837, "total_steps": 9134, "loss": 0.7399, "learning_rate": 4.51737482380626e-05, "epoch": 0.20110019431292592, "percentage": 20.11, "elapsed_time": "1 day, 9:56:35", "remaining_time": "5 days, 14:49:49", "throughput": 2715.54, "total_tokens": 331826432} {"current_steps": 1838, "total_steps": 9134, "loss": 0.6275, "learning_rate": 4.516866852784618e-05, "epoch": 0.2012096663838638, "percentage": 20.12, "elapsed_time": "1 day, 9:57:43", "remaining_time": "5 days, 14:48:47", "throughput": 2715.46, "total_tokens": 332001152} {"current_steps": 1839, "total_steps": 9134, "loss": 0.8783, "learning_rate": 4.516358643171482e-05, "epoch": 0.2013191384548017, "percentage": 20.13, "elapsed_time": "1 day, 9:58:52", "remaining_time": "5 days, 14:47:52", "throughput": 2715.52, "total_tokens": 332196928} {"current_steps": 1840, "total_steps": 9134, "loss": 0.6919, "learning_rate": 4.515850195026974e-05, "epoch": 0.20142861052573963, "percentage": 20.14, "elapsed_time": "1 day, 9:59:57", "remaining_time": "5 days, 14:46:40", "throughput": 2715.61, "total_tokens": 332383744} {"current_steps": 1841, "total_steps": 9134, "loss": 0.6655, "learning_rate": 4.5153415084112406e-05, "epoch": 0.20153808259667752, "percentage": 20.16, "elapsed_time": "1 day, 10:01:06", "remaining_time": "5 days, 14:45:43", "throughput": 2715.63, "total_tokens": 332574592} {"current_steps": 1842, "total_steps": 9134, "loss": 0.7179, "learning_rate": 4.5148325833844595e-05, "epoch": 0.20164755466761541, "percentage": 20.17, "elapsed_time": "1 day, 10:02:12", "remaining_time": "5 days, 14:44:35", "throughput": 2715.74, "total_tokens": 332767456} {"current_steps": 1843, "total_steps": 9134, "loss": 0.5503, "learning_rate": 4.514323420006836e-05, "epoch": 0.20175702673855334, "percentage": 20.18, "elapsed_time": "1 day, 10:03:12", "remaining_time": "5 days, 14:43:03", "throughput": 2715.53, "total_tokens": 332904992} {"current_steps": 1844, "total_steps": 9134, "loss": 1.0478, "learning_rate": 4.5138140183386025e-05, "epoch": 0.20186649880949123, "percentage": 20.19, "elapsed_time": "1 day, 10:04:22", "remaining_time": "5 days, 14:42:08", "throughput": 2715.67, "total_tokens": 333109952} {"current_steps": 1845, "total_steps": 9134, "loss": 0.7447, "learning_rate": 4.51330437844002e-05, "epoch": 0.20197597088042912, "percentage": 20.2, "elapsed_time": "1 day, 10:05:28", "remaining_time": "5 days, 14:41:00", "throughput": 2715.63, "total_tokens": 333285344} {"current_steps": 1846, "total_steps": 9134, "loss": 0.7165, "learning_rate": 4.512794500371379e-05, "epoch": 0.20208544295136704, "percentage": 20.21, "elapsed_time": "1 day, 10:06:34", "remaining_time": "5 days, 14:39:51", "throughput": 2715.75, "total_tokens": 333478432} {"current_steps": 1847, "total_steps": 9134, "loss": 0.8159, "learning_rate": 4.5122843841929965e-05, "epoch": 0.20219491502230494, "percentage": 20.22, "elapsed_time": "1 day, 10:07:42", "remaining_time": "5 days, 14:38:51", "throughput": 2715.94, "total_tokens": 333687872} {"current_steps": 1848, "total_steps": 9134, "loss": 0.7467, "learning_rate": 4.5117740299652175e-05, "epoch": 0.20230438709324283, "percentage": 20.23, "elapsed_time": "1 day, 10:08:41", "remaining_time": "5 days, 14:37:15", "throughput": 2715.63, "total_tokens": 333809504} {"current_steps": 1849, "total_steps": 9134, "loss": 0.8614, "learning_rate": 4.511263437748416e-05, "epoch": 0.20241385916418073, "percentage": 20.24, "elapsed_time": "1 day, 10:09:48", "remaining_time": "5 days, 14:36:09", "throughput": 2715.37, "total_tokens": 333958464} {"current_steps": 1850, "total_steps": 9134, "loss": 0.7666, "learning_rate": 4.510752607602996e-05, "epoch": 0.20252333123511865, "percentage": 20.25, "elapsed_time": "1 day, 10:10:50", "remaining_time": "5 days, 14:34:44", "throughput": 2715.28, "total_tokens": 334115264} {"current_steps": 1851, "total_steps": 9134, "loss": 0.5959, "learning_rate": 4.510241539589386e-05, "epoch": 0.20263280330605654, "percentage": 20.26, "elapsed_time": "1 day, 10:11:57", "remaining_time": "5 days, 14:33:41", "throughput": 2715.24, "total_tokens": 334293792} {"current_steps": 1852, "total_steps": 9134, "loss": 0.662, "learning_rate": 4.509730233768045e-05, "epoch": 0.20274227537699444, "percentage": 20.28, "elapsed_time": "1 day, 10:13:00", "remaining_time": "5 days, 14:32:23", "throughput": 2715.25, "total_tokens": 334467616} {"current_steps": 1853, "total_steps": 9134, "loss": 0.551, "learning_rate": 4.5092186901994594e-05, "epoch": 0.20285174744793236, "percentage": 20.29, "elapsed_time": "1 day, 10:14:09", "remaining_time": "5 days, 14:31:24", "throughput": 2715.36, "total_tokens": 334666304} {"current_steps": 1854, "total_steps": 9134, "loss": 0.6095, "learning_rate": 4.5087069089441434e-05, "epoch": 0.20296121951887025, "percentage": 20.3, "elapsed_time": "1 day, 10:15:15", "remaining_time": "5 days, 14:30:15", "throughput": 2715.4, "total_tokens": 334850880} {"current_steps": 1855, "total_steps": 9134, "loss": 0.6165, "learning_rate": 4.50819489006264e-05, "epoch": 0.20307069158980814, "percentage": 20.31, "elapsed_time": "1 day, 10:16:21", "remaining_time": "5 days, 14:29:06", "throughput": 2715.27, "total_tokens": 335013728} {"current_steps": 1856, "total_steps": 9134, "loss": 0.8556, "learning_rate": 4.5076826336155196e-05, "epoch": 0.20318016366074607, "percentage": 20.32, "elapsed_time": "1 day, 10:17:23", "remaining_time": "5 days, 14:27:43", "throughput": 2714.95, "total_tokens": 335142752} {"current_steps": 1857, "total_steps": 9134, "loss": 0.8702, "learning_rate": 4.507170139663382e-05, "epoch": 0.20328963573168396, "percentage": 20.33, "elapsed_time": "1 day, 10:18:26", "remaining_time": "5 days, 14:26:23", "throughput": 2714.71, "total_tokens": 335284320} {"current_steps": 1858, "total_steps": 9134, "loss": 0.7581, "learning_rate": 4.506657408266855e-05, "epoch": 0.20339910780262185, "percentage": 20.34, "elapsed_time": "1 day, 10:19:32", "remaining_time": "5 days, 14:25:16", "throughput": 2714.57, "total_tokens": 335446944} {"current_steps": 1859, "total_steps": 9134, "loss": 1.0415, "learning_rate": 4.506144439486591e-05, "epoch": 0.20350857987355975, "percentage": 20.35, "elapsed_time": "1 day, 10:20:42", "remaining_time": "5 days, 14:24:23", "throughput": 2714.75, "total_tokens": 335659296} {"current_steps": 1860, "total_steps": 9134, "loss": 0.5702, "learning_rate": 4.5056312333832764e-05, "epoch": 0.20361805194449767, "percentage": 20.36, "elapsed_time": "1 day, 10:21:46", "remaining_time": "5 days, 14:23:05", "throughput": 2714.62, "total_tokens": 335815872} {"current_steps": 1861, "total_steps": 9134, "loss": 0.631, "learning_rate": 4.505117790017621e-05, "epoch": 0.20372752401543556, "percentage": 20.37, "elapsed_time": "1 day, 10:22:55", "remaining_time": "5 days, 14:22:09", "throughput": 2714.81, "total_tokens": 336027552} {"current_steps": 1862, "total_steps": 9134, "loss": 0.6895, "learning_rate": 4.504604109450363e-05, "epoch": 0.20383699608637346, "percentage": 20.39, "elapsed_time": "1 day, 10:24:02", "remaining_time": "5 days, 14:21:04", "throughput": 2714.86, "total_tokens": 336215264} {"current_steps": 1863, "total_steps": 9134, "loss": 0.8398, "learning_rate": 4.504090191742272e-05, "epoch": 0.20394646815731138, "percentage": 20.4, "elapsed_time": "1 day, 10:25:08", "remaining_time": "5 days, 14:19:54", "throughput": 2714.8, "total_tokens": 336386400} {"current_steps": 1864, "total_steps": 9134, "loss": 0.8084, "learning_rate": 4.503576036954142e-05, "epoch": 0.20405594022824927, "percentage": 20.41, "elapsed_time": "1 day, 10:26:15", "remaining_time": "5 days, 14:18:51", "throughput": 2714.93, "total_tokens": 336585760} {"current_steps": 1865, "total_steps": 9134, "loss": 0.8067, "learning_rate": 4.5030616451467964e-05, "epoch": 0.20416541229918717, "percentage": 20.42, "elapsed_time": "1 day, 10:27:25", "remaining_time": "5 days, 14:17:57", "throughput": 2715.07, "total_tokens": 336792064} {"current_steps": 1866, "total_steps": 9134, "loss": 0.7804, "learning_rate": 4.502547016381089e-05, "epoch": 0.20427488437012506, "percentage": 20.43, "elapsed_time": "1 day, 10:28:30", "remaining_time": "5 days, 14:16:45", "throughput": 2715.04, "total_tokens": 336964320} {"current_steps": 1867, "total_steps": 9134, "loss": 0.8149, "learning_rate": 4.5020321507178965e-05, "epoch": 0.20438435644106298, "percentage": 20.44, "elapsed_time": "1 day, 10:29:40", "remaining_time": "5 days, 14:15:51", "throughput": 2715.04, "total_tokens": 337153824} {"current_steps": 1868, "total_steps": 9134, "loss": 0.7003, "learning_rate": 4.501517048218128e-05, "epoch": 0.20449382851200087, "percentage": 20.45, "elapsed_time": "1 day, 10:30:45", "remaining_time": "5 days, 14:14:41", "throughput": 2714.95, "total_tokens": 337320480} {"current_steps": 1869, "total_steps": 9134, "loss": 0.7328, "learning_rate": 4.5010017089427195e-05, "epoch": 0.20460330058293877, "percentage": 20.46, "elapsed_time": "1 day, 10:31:50", "remaining_time": "5 days, 14:13:28", "throughput": 2714.81, "total_tokens": 337478848} {"current_steps": 1870, "total_steps": 9134, "loss": 0.6813, "learning_rate": 4.500486132952634e-05, "epoch": 0.2047127726538767, "percentage": 20.47, "elapsed_time": "1 day, 10:32:56", "remaining_time": "5 days, 14:12:19", "throughput": 2714.89, "total_tokens": 337669248} {"current_steps": 1871, "total_steps": 9134, "loss": 0.5509, "learning_rate": 4.499970320308863e-05, "epoch": 0.20482224472481458, "percentage": 20.48, "elapsed_time": "1 day, 10:33:56", "remaining_time": "5 days, 14:10:46", "throughput": 2714.71, "total_tokens": 337808128} {"current_steps": 1872, "total_steps": 9134, "loss": 0.5976, "learning_rate": 4.4994542710724264e-05, "epoch": 0.20493171679575248, "percentage": 20.49, "elapsed_time": "1 day, 10:35:02", "remaining_time": "5 days, 14:09:39", "throughput": 2714.63, "total_tokens": 337979264} {"current_steps": 1873, "total_steps": 9134, "loss": 0.619, "learning_rate": 4.498937985304371e-05, "epoch": 0.2050411888666904, "percentage": 20.51, "elapsed_time": "1 day, 10:36:09", "remaining_time": "5 days, 14:08:34", "throughput": 2714.57, "total_tokens": 338153088} {"current_steps": 1874, "total_steps": 9134, "loss": 0.7421, "learning_rate": 4.4984214630657744e-05, "epoch": 0.2051506609376283, "percentage": 20.52, "elapsed_time": "1 day, 10:37:18", "remaining_time": "5 days, 14:07:39", "throughput": 2714.62, "total_tokens": 338347744} {"current_steps": 1875, "total_steps": 9134, "loss": 1.0407, "learning_rate": 4.497904704417739e-05, "epoch": 0.2052601330085662, "percentage": 20.53, "elapsed_time": "1 day, 10:38:27", "remaining_time": "5 days, 14:06:41", "throughput": 2714.63, "total_tokens": 338535680} {"current_steps": 1876, "total_steps": 9134, "loss": 0.6343, "learning_rate": 4.4973877094213954e-05, "epoch": 0.20536960507950408, "percentage": 20.54, "elapsed_time": "1 day, 10:39:26", "remaining_time": "5 days, 14:05:05", "throughput": 2714.37, "total_tokens": 338662240} {"current_steps": 1877, "total_steps": 9134, "loss": 0.7782, "learning_rate": 4.496870478137906e-05, "epoch": 0.205479077150442, "percentage": 20.55, "elapsed_time": "1 day, 10:40:33", "remaining_time": "5 days, 14:03:59", "throughput": 2714.35, "total_tokens": 338840992} {"current_steps": 1878, "total_steps": 9134, "loss": 0.6019, "learning_rate": 4.496353010628455e-05, "epoch": 0.2055885492213799, "percentage": 20.56, "elapsed_time": "1 day, 10:41:41", "remaining_time": "5 days, 14:03:00", "throughput": 2714.39, "total_tokens": 339032064} {"current_steps": 1879, "total_steps": 9134, "loss": 0.6098, "learning_rate": 4.495835306954259e-05, "epoch": 0.2056980212923178, "percentage": 20.57, "elapsed_time": "1 day, 10:42:44", "remaining_time": "5 days, 14:01:41", "throughput": 2714.35, "total_tokens": 339198944} {"current_steps": 1880, "total_steps": 9134, "loss": 0.6677, "learning_rate": 4.495317367176562e-05, "epoch": 0.2058074933632557, "percentage": 20.58, "elapsed_time": "1 day, 10:43:49", "remaining_time": "5 days, 14:00:28", "throughput": 2714.23, "total_tokens": 339359552} {"current_steps": 1881, "total_steps": 9134, "loss": 0.8619, "learning_rate": 4.4947991913566355e-05, "epoch": 0.2059169654341936, "percentage": 20.59, "elapsed_time": "1 day, 10:44:56", "remaining_time": "5 days, 13:59:22", "throughput": 2714.26, "total_tokens": 339544128} {"current_steps": 1882, "total_steps": 9134, "loss": 1.0113, "learning_rate": 4.494280779555777e-05, "epoch": 0.2060264375051315, "percentage": 20.6, "elapsed_time": "1 day, 10:46:02", "remaining_time": "5 days, 13:58:14", "throughput": 2714.23, "total_tokens": 339720192} {"current_steps": 1883, "total_steps": 9134, "loss": 0.5132, "learning_rate": 4.493762131835315e-05, "epoch": 0.2061359095760694, "percentage": 20.62, "elapsed_time": "1 day, 10:47:08", "remaining_time": "5 days, 13:57:07", "throughput": 2714.17, "total_tokens": 339892448} {"current_steps": 1884, "total_steps": 9134, "loss": 0.5052, "learning_rate": 4.4932432482566045e-05, "epoch": 0.20624538164700731, "percentage": 20.63, "elapsed_time": "1 day, 10:48:12", "remaining_time": "5 days, 13:55:49", "throughput": 2714.04, "total_tokens": 340049024} {"current_steps": 1885, "total_steps": 9134, "loss": 0.7394, "learning_rate": 4.492724128881029e-05, "epoch": 0.2063548537179452, "percentage": 20.64, "elapsed_time": "1 day, 10:49:21", "remaining_time": "5 days, 13:54:51", "throughput": 2714.18, "total_tokens": 340253312} {"current_steps": 1886, "total_steps": 9134, "loss": 0.6585, "learning_rate": 4.492204773769997e-05, "epoch": 0.2064643257888831, "percentage": 20.65, "elapsed_time": "1 day, 10:50:24", "remaining_time": "5 days, 13:53:34", "throughput": 2714.15, "total_tokens": 340421088} {"current_steps": 1887, "total_steps": 9134, "loss": 0.6671, "learning_rate": 4.491685182984949e-05, "epoch": 0.20657379785982102, "percentage": 20.66, "elapsed_time": "1 day, 10:51:30", "remaining_time": "5 days, 13:52:25", "throughput": 2714.01, "total_tokens": 340583488} {"current_steps": 1888, "total_steps": 9134, "loss": 0.5914, "learning_rate": 4.4911653565873524e-05, "epoch": 0.20668326993075892, "percentage": 20.67, "elapsed_time": "1 day, 10:52:38", "remaining_time": "5 days, 13:51:23", "throughput": 2714.18, "total_tokens": 340788448} {"current_steps": 1889, "total_steps": 9134, "loss": 0.6703, "learning_rate": 4.4906452946386995e-05, "epoch": 0.2067927420016968, "percentage": 20.68, "elapsed_time": "1 day, 10:53:47", "remaining_time": "5 days, 13:50:25", "throughput": 2714.25, "total_tokens": 340983328} {"current_steps": 1890, "total_steps": 9134, "loss": 0.6257, "learning_rate": 4.490124997200514e-05, "epoch": 0.20690221407263473, "percentage": 20.69, "elapsed_time": "1 day, 10:54:56", "remaining_time": "5 days, 13:49:30", "throughput": 2714.35, "total_tokens": 341184256} {"current_steps": 1891, "total_steps": 9134, "loss": 0.7084, "learning_rate": 4.489604464334346e-05, "epoch": 0.20701168614357263, "percentage": 20.7, "elapsed_time": "1 day, 10:56:02", "remaining_time": "5 days, 13:48:21", "throughput": 2714.48, "total_tokens": 341379360} {"current_steps": 1892, "total_steps": 9134, "loss": 0.6465, "learning_rate": 4.489083696101773e-05, "epoch": 0.20712115821451052, "percentage": 20.71, "elapsed_time": "1 day, 10:57:04", "remaining_time": "5 days, 13:46:59", "throughput": 2714.22, "total_tokens": 341516224} {"current_steps": 1893, "total_steps": 9134, "loss": 0.7529, "learning_rate": 4.4885626925644016e-05, "epoch": 0.20723063028544841, "percentage": 20.72, "elapsed_time": "1 day, 10:58:10", "remaining_time": "5 days, 13:45:49", "throughput": 2714.06, "total_tokens": 341673920} {"current_steps": 1894, "total_steps": 9134, "loss": 0.7849, "learning_rate": 4.4880414537838643e-05, "epoch": 0.20734010235638634, "percentage": 20.74, "elapsed_time": "1 day, 10:59:14", "remaining_time": "5 days, 13:44:33", "throughput": 2713.98, "total_tokens": 341837888} {"current_steps": 1895, "total_steps": 9134, "loss": 0.6271, "learning_rate": 4.487519979821824e-05, "epoch": 0.20744957442732423, "percentage": 20.75, "elapsed_time": "1 day, 11:00:19", "remaining_time": "5 days, 13:43:19", "throughput": 2713.92, "total_tokens": 342005664} {"current_steps": 1896, "total_steps": 9134, "loss": 1.0387, "learning_rate": 4.486998270739971e-05, "epoch": 0.20755904649826212, "percentage": 20.76, "elapsed_time": "1 day, 11:01:25", "remaining_time": "5 days, 13:42:11", "throughput": 2713.87, "total_tokens": 342178592} {"current_steps": 1897, "total_steps": 9134, "loss": 0.8455, "learning_rate": 4.486476326600019e-05, "epoch": 0.20766851856920004, "percentage": 20.77, "elapsed_time": "1 day, 11:02:31", "remaining_time": "5 days, 13:41:04", "throughput": 2713.83, "total_tokens": 342353312} {"current_steps": 1898, "total_steps": 9134, "loss": 0.7172, "learning_rate": 4.4859541474637153e-05, "epoch": 0.20777799064013794, "percentage": 20.78, "elapsed_time": "1 day, 11:03:38", "remaining_time": "5 days, 13:40:01", "throughput": 2713.77, "total_tokens": 342528704} {"current_steps": 1899, "total_steps": 9134, "loss": 0.6398, "learning_rate": 4.4854317333928335e-05, "epoch": 0.20788746271107583, "percentage": 20.79, "elapsed_time": "1 day, 11:04:45", "remaining_time": "5 days, 13:38:55", "throughput": 2713.87, "total_tokens": 342722464} {"current_steps": 1900, "total_steps": 9134, "loss": 0.6009, "learning_rate": 4.484909084449172e-05, "epoch": 0.20799693478201373, "percentage": 20.8, "elapsed_time": "1 day, 11:05:51", "remaining_time": "5 days, 13:37:46", "throughput": 2713.83, "total_tokens": 342896960} {"current_steps": 1901, "total_steps": 9134, "loss": 0.8514, "learning_rate": 4.484386200694561e-05, "epoch": 0.20810640685295165, "percentage": 20.81, "elapsed_time": "1 day, 11:07:00", "remaining_time": "5 days, 13:36:48", "throughput": 2713.94, "total_tokens": 343096544} {"current_steps": 1902, "total_steps": 9134, "loss": 0.6413, "learning_rate": 4.4838630821908564e-05, "epoch": 0.20821587892388954, "percentage": 20.82, "elapsed_time": "1 day, 11:08:04", "remaining_time": "5 days, 13:35:33", "throughput": 2713.82, "total_tokens": 343256704} {"current_steps": 1903, "total_steps": 9134, "loss": 0.7912, "learning_rate": 4.483339728999941e-05, "epoch": 0.20832535099482744, "percentage": 20.83, "elapsed_time": "1 day, 11:09:14", "remaining_time": "5 days, 13:34:38", "throughput": 2714.05, "total_tokens": 343473536} {"current_steps": 1904, "total_steps": 9134, "loss": 0.7125, "learning_rate": 4.482816141183728e-05, "epoch": 0.20843482306576536, "percentage": 20.85, "elapsed_time": "1 day, 11:10:13", "remaining_time": "5 days, 13:33:05", "throughput": 2713.85, "total_tokens": 343610624} {"current_steps": 1905, "total_steps": 9134, "loss": 0.7315, "learning_rate": 4.4822923188041555e-05, "epoch": 0.20854429513670325, "percentage": 20.86, "elapsed_time": "1 day, 11:11:17", "remaining_time": "5 days, 13:31:49", "throughput": 2713.81, "total_tokens": 343779296} {"current_steps": 1906, "total_steps": 9134, "loss": 0.7621, "learning_rate": 4.481768261923191e-05, "epoch": 0.20865376720764114, "percentage": 20.87, "elapsed_time": "1 day, 11:12:27", "remaining_time": "5 days, 13:30:55", "throughput": 2713.92, "total_tokens": 343981120} {"current_steps": 1907, "total_steps": 9134, "loss": 0.5179, "learning_rate": 4.48124397060283e-05, "epoch": 0.20876323927857907, "percentage": 20.88, "elapsed_time": "1 day, 11:13:33", "remaining_time": "5 days, 13:29:47", "throughput": 2713.96, "total_tokens": 344165920} {"current_steps": 1908, "total_steps": 9134, "loss": 0.7012, "learning_rate": 4.4807194449050936e-05, "epoch": 0.20887271134951696, "percentage": 20.89, "elapsed_time": "1 day, 11:14:42", "remaining_time": "5 days, 13:28:50", "throughput": 2714.15, "total_tokens": 344377376} {"current_steps": 1909, "total_steps": 9134, "loss": 0.7162, "learning_rate": 4.480194684892035e-05, "epoch": 0.20898218342045485, "percentage": 20.9, "elapsed_time": "1 day, 11:15:46", "remaining_time": "5 days, 13:27:36", "throughput": 2714.0, "total_tokens": 344533952} {"current_steps": 1910, "total_steps": 9134, "loss": 0.8421, "learning_rate": 4.4796696906257294e-05, "epoch": 0.20909165549139275, "percentage": 20.91, "elapsed_time": "1 day, 11:16:52", "remaining_time": "5 days, 13:26:27", "throughput": 2714.01, "total_tokens": 344714272} {"current_steps": 1911, "total_steps": 9134, "loss": 0.6532, "learning_rate": 4.479144462168284e-05, "epoch": 0.20920112756233067, "percentage": 20.92, "elapsed_time": "1 day, 11:18:00", "remaining_time": "5 days, 13:25:24", "throughput": 2713.92, "total_tokens": 344885632} {"current_steps": 1912, "total_steps": 9134, "loss": 0.7443, "learning_rate": 4.478618999581833e-05, "epoch": 0.20931059963326856, "percentage": 20.93, "elapsed_time": "1 day, 11:19:06", "remaining_time": "5 days, 13:24:17", "throughput": 2714.0, "total_tokens": 345076032} {"current_steps": 1913, "total_steps": 9134, "loss": 0.5801, "learning_rate": 4.4780933029285365e-05, "epoch": 0.20942007170420646, "percentage": 20.94, "elapsed_time": "1 day, 11:20:12", "remaining_time": "5 days, 13:23:09", "throughput": 2713.99, "total_tokens": 345253664} {"current_steps": 1914, "total_steps": 9134, "loss": 0.7066, "learning_rate": 4.4775673722705836e-05, "epoch": 0.20952954377514438, "percentage": 20.95, "elapsed_time": "1 day, 11:21:19", "remaining_time": "5 days, 13:22:04", "throughput": 2714.08, "total_tokens": 345447200} {"current_steps": 1915, "total_steps": 9134, "loss": 0.8532, "learning_rate": 4.47704120767019e-05, "epoch": 0.20963901584608227, "percentage": 20.97, "elapsed_time": "1 day, 11:22:29", "remaining_time": "5 days, 13:21:09", "throughput": 2714.25, "total_tokens": 345657984} {"current_steps": 1916, "total_steps": 9134, "loss": 0.7004, "learning_rate": 4.476514809189603e-05, "epoch": 0.20974848791702017, "percentage": 20.98, "elapsed_time": "1 day, 11:23:38", "remaining_time": "5 days, 13:20:15", "throughput": 2714.43, "total_tokens": 345868992} {"current_steps": 1917, "total_steps": 9134, "loss": 0.8298, "learning_rate": 4.4759881768910915e-05, "epoch": 0.20985795998795806, "percentage": 20.99, "elapsed_time": "1 day, 11:24:47", "remaining_time": "5 days, 13:19:17", "throughput": 2714.51, "total_tokens": 346066112} {"current_steps": 1918, "total_steps": 9134, "loss": 0.6776, "learning_rate": 4.475461310836957e-05, "epoch": 0.20996743205889598, "percentage": 21.0, "elapsed_time": "1 day, 11:25:54", "remaining_time": "5 days, 13:18:13", "throughput": 2714.51, "total_tokens": 346249120} {"current_steps": 1919, "total_steps": 9134, "loss": 0.8439, "learning_rate": 4.4749342110895244e-05, "epoch": 0.21007690412983387, "percentage": 21.01, "elapsed_time": "1 day, 11:26:58", "remaining_time": "5 days, 13:16:54", "throughput": 2714.42, "total_tokens": 346409280} {"current_steps": 1920, "total_steps": 9134, "loss": 0.5991, "learning_rate": 4.4744068777111506e-05, "epoch": 0.21018637620077177, "percentage": 21.02, "elapsed_time": "1 day, 11:28:00", "remaining_time": "5 days, 13:15:32", "throughput": 2714.27, "total_tokens": 346559136} {"current_steps": 1921, "total_steps": 9134, "loss": 0.5326, "learning_rate": 4.4738793107642174e-05, "epoch": 0.2102958482717097, "percentage": 21.03, "elapsed_time": "1 day, 11:29:07", "remaining_time": "5 days, 13:14:27", "throughput": 2714.22, "total_tokens": 346733856} {"current_steps": 1922, "total_steps": 9134, "loss": 0.6439, "learning_rate": 4.4733515103111356e-05, "epoch": 0.21040532034264758, "percentage": 21.04, "elapsed_time": "1 day, 11:30:11", "remaining_time": "5 days, 13:13:12", "throughput": 2714.21, "total_tokens": 346907232} {"current_steps": 1923, "total_steps": 9134, "loss": 0.859, "learning_rate": 4.472823476414343e-05, "epoch": 0.21051479241358548, "percentage": 21.05, "elapsed_time": "1 day, 11:31:18", "remaining_time": "5 days, 13:12:08", "throughput": 2714.2, "total_tokens": 347088448} {"current_steps": 1924, "total_steps": 9134, "loss": 0.7572, "learning_rate": 4.4722952091363034e-05, "epoch": 0.2106242644845234, "percentage": 21.06, "elapsed_time": "1 day, 11:32:28", "remaining_time": "5 days, 13:11:13", "throughput": 2714.32, "total_tokens": 347292288} {"current_steps": 1925, "total_steps": 9134, "loss": 0.8705, "learning_rate": 4.471766708539512e-05, "epoch": 0.2107337365554613, "percentage": 21.08, "elapsed_time": "1 day, 11:33:33", "remaining_time": "5 days, 13:10:02", "throughput": 2714.39, "total_tokens": 347478880} {"current_steps": 1926, "total_steps": 9134, "loss": 0.8501, "learning_rate": 4.4712379746864876e-05, "epoch": 0.2108432086263992, "percentage": 21.09, "elapsed_time": "1 day, 11:34:34", "remaining_time": "5 days, 13:08:33", "throughput": 2714.13, "total_tokens": 347609472} {"current_steps": 1927, "total_steps": 9134, "loss": 0.8559, "learning_rate": 4.4707090076397795e-05, "epoch": 0.21095268069733708, "percentage": 21.1, "elapsed_time": "1 day, 11:35:37", "remaining_time": "5 days, 13:07:17", "throughput": 2714.09, "total_tokens": 347778368} {"current_steps": 1928, "total_steps": 9134, "loss": 0.6504, "learning_rate": 4.4701798074619626e-05, "epoch": 0.211062152768275, "percentage": 21.11, "elapsed_time": "1 day, 11:36:45", "remaining_time": "5 days, 13:06:14", "throughput": 2714.08, "total_tokens": 347960256} {"current_steps": 1929, "total_steps": 9134, "loss": 0.6153, "learning_rate": 4.4696503742156414e-05, "epoch": 0.2111716248392129, "percentage": 21.12, "elapsed_time": "1 day, 11:37:51", "remaining_time": "5 days, 13:05:04", "throughput": 2714.08, "total_tokens": 348138336} {"current_steps": 1930, "total_steps": 9134, "loss": 0.8939, "learning_rate": 4.469120707963447e-05, "epoch": 0.2112810969101508, "percentage": 21.13, "elapsed_time": "1 day, 11:38:56", "remaining_time": "5 days, 13:03:55", "throughput": 2713.86, "total_tokens": 348288416} {"current_steps": 1931, "total_steps": 9134, "loss": 0.5701, "learning_rate": 4.468590808768036e-05, "epoch": 0.2113905689810887, "percentage": 21.14, "elapsed_time": "1 day, 11:40:02", "remaining_time": "5 days, 13:02:46", "throughput": 2713.83, "total_tokens": 348462464} {"current_steps": 1932, "total_steps": 9134, "loss": 0.6949, "learning_rate": 4.4680606766920954e-05, "epoch": 0.2115000410520266, "percentage": 21.15, "elapsed_time": "1 day, 11:41:11", "remaining_time": "5 days, 13:01:48", "throughput": 2713.77, "total_tokens": 348642112} {"current_steps": 1933, "total_steps": 9134, "loss": 0.9169, "learning_rate": 4.46753031179834e-05, "epoch": 0.2116095131229645, "percentage": 21.16, "elapsed_time": "1 day, 11:42:19", "remaining_time": "5 days, 13:00:47", "throughput": 2713.82, "total_tokens": 348832736} {"current_steps": 1934, "total_steps": 9134, "loss": 0.688, "learning_rate": 4.4669997141495095e-05, "epoch": 0.2117189851939024, "percentage": 21.17, "elapsed_time": "1 day, 11:43:28", "remaining_time": "5 days, 12:59:50", "throughput": 2713.88, "total_tokens": 349028512} {"current_steps": 1935, "total_steps": 9134, "loss": 0.77, "learning_rate": 4.466468883808373e-05, "epoch": 0.21182845726484031, "percentage": 21.18, "elapsed_time": "1 day, 11:44:35", "remaining_time": "5 days, 12:58:46", "throughput": 2713.9, "total_tokens": 349212192} {"current_steps": 1936, "total_steps": 9134, "loss": 0.7475, "learning_rate": 4.4659378208377276e-05, "epoch": 0.2119379293357782, "percentage": 21.2, "elapsed_time": "1 day, 11:45:43", "remaining_time": "5 days, 12:57:44", "throughput": 2713.9, "total_tokens": 349396768} {"current_steps": 1937, "total_steps": 9134, "loss": 0.7057, "learning_rate": 4.465406525300395e-05, "epoch": 0.2120474014067161, "percentage": 21.21, "elapsed_time": "1 day, 11:46:51", "remaining_time": "5 days, 12:56:43", "throughput": 2713.85, "total_tokens": 349573952} {"current_steps": 1938, "total_steps": 9134, "loss": 0.9661, "learning_rate": 4.4648749972592286e-05, "epoch": 0.21215687347765402, "percentage": 21.22, "elapsed_time": "1 day, 11:47:55", "remaining_time": "5 days, 12:55:30", "throughput": 2713.94, "total_tokens": 349761664} {"current_steps": 1939, "total_steps": 9134, "loss": 0.6221, "learning_rate": 4.464343236777106e-05, "epoch": 0.21226634554859192, "percentage": 21.23, "elapsed_time": "1 day, 11:49:01", "remaining_time": "5 days, 12:54:18", "throughput": 2713.81, "total_tokens": 349921152} {"current_steps": 1940, "total_steps": 9134, "loss": 0.8982, "learning_rate": 4.463811243916933e-05, "epoch": 0.2123758176195298, "percentage": 21.24, "elapsed_time": "1 day, 11:50:08", "remaining_time": "5 days, 12:53:13", "throughput": 2713.75, "total_tokens": 350095424} {"current_steps": 1941, "total_steps": 9134, "loss": 0.8376, "learning_rate": 4.463279018741645e-05, "epoch": 0.21248528969046773, "percentage": 21.25, "elapsed_time": "1 day, 11:51:14", "remaining_time": "5 days, 12:52:05", "throughput": 2713.76, "total_tokens": 350275744} {"current_steps": 1942, "total_steps": 9134, "loss": 0.6347, "learning_rate": 4.4627465613142014e-05, "epoch": 0.21259476176140563, "percentage": 21.26, "elapsed_time": "1 day, 11:52:20", "remaining_time": "5 days, 12:50:57", "throughput": 2713.72, "total_tokens": 350449792} {"current_steps": 1943, "total_steps": 9134, "loss": 0.6734, "learning_rate": 4.462213871697592e-05, "epoch": 0.21270423383234352, "percentage": 21.27, "elapsed_time": "1 day, 11:53:28", "remaining_time": "5 days, 12:49:57", "throughput": 2713.79, "total_tokens": 350644000} {"current_steps": 1944, "total_steps": 9134, "loss": 0.798, "learning_rate": 4.4616809499548334e-05, "epoch": 0.2128137059032814, "percentage": 21.28, "elapsed_time": "1 day, 11:54:31", "remaining_time": "5 days, 12:48:39", "throughput": 2713.83, "total_tokens": 350821856} {"current_steps": 1945, "total_steps": 9134, "loss": 0.74, "learning_rate": 4.461147796148968e-05, "epoch": 0.21292317797421934, "percentage": 21.29, "elapsed_time": "1 day, 11:55:35", "remaining_time": "5 days, 12:47:23", "throughput": 2713.75, "total_tokens": 350984928} {"current_steps": 1946, "total_steps": 9134, "loss": 0.6716, "learning_rate": 4.460614410343067e-05, "epoch": 0.21303265004515723, "percentage": 21.31, "elapsed_time": "1 day, 11:56:42", "remaining_time": "5 days, 12:46:17", "throughput": 2713.66, "total_tokens": 351154496} {"current_steps": 1947, "total_steps": 9134, "loss": 0.703, "learning_rate": 4.46008079260023e-05, "epoch": 0.21314212211609512, "percentage": 21.32, "elapsed_time": "1 day, 11:57:48", "remaining_time": "5 days, 12:45:08", "throughput": 2713.55, "total_tokens": 351318240} {"current_steps": 1948, "total_steps": 9134, "loss": 0.6723, "learning_rate": 4.4595469429835826e-05, "epoch": 0.21325159418703304, "percentage": 21.33, "elapsed_time": "1 day, 11:58:53", "remaining_time": "5 days, 12:43:58", "throughput": 2713.54, "total_tokens": 351494752} {"current_steps": 1949, "total_steps": 9134, "loss": 0.7073, "learning_rate": 4.4590128615562765e-05, "epoch": 0.21336106625797094, "percentage": 21.34, "elapsed_time": "1 day, 11:59:59", "remaining_time": "5 days, 12:42:50", "throughput": 2713.53, "total_tokens": 351673952} {"current_steps": 1950, "total_steps": 9134, "loss": 0.6136, "learning_rate": 4.458478548381495e-05, "epoch": 0.21347053832890883, "percentage": 21.35, "elapsed_time": "1 day, 12:01:06", "remaining_time": "5 days, 12:41:44", "throughput": 2713.5, "total_tokens": 351849120} {"current_steps": 1951, "total_steps": 9134, "loss": 0.4825, "learning_rate": 4.4579440035224446e-05, "epoch": 0.21358001039984673, "percentage": 21.36, "elapsed_time": "1 day, 12:02:11", "remaining_time": "5 days, 12:40:31", "throughput": 2713.4, "total_tokens": 352012864} {"current_steps": 1952, "total_steps": 9134, "loss": 0.7573, "learning_rate": 4.457409227042362e-05, "epoch": 0.21368948247078465, "percentage": 21.37, "elapsed_time": "1 day, 12:03:18", "remaining_time": "5 days, 12:39:28", "throughput": 2713.56, "total_tokens": 352215584} {"current_steps": 1953, "total_steps": 9134, "loss": 0.514, "learning_rate": 4.456874219004509e-05, "epoch": 0.21379895454172254, "percentage": 21.38, "elapsed_time": "1 day, 12:04:26", "remaining_time": "5 days, 12:38:25", "throughput": 2713.6, "total_tokens": 352405536} {"current_steps": 1954, "total_steps": 9134, "loss": 0.7939, "learning_rate": 4.4563389794721776e-05, "epoch": 0.21390842661266044, "percentage": 21.39, "elapsed_time": "1 day, 12:05:35", "remaining_time": "5 days, 12:37:31", "throughput": 2713.72, "total_tokens": 352610272} {"current_steps": 1955, "total_steps": 9134, "loss": 0.8915, "learning_rate": 4.455803508508685e-05, "epoch": 0.21401789868359836, "percentage": 21.4, "elapsed_time": "1 day, 12:06:42", "remaining_time": "5 days, 12:36:24", "throughput": 2713.68, "total_tokens": 352784544} {"current_steps": 1956, "total_steps": 9134, "loss": 0.8095, "learning_rate": 4.455267806177376e-05, "epoch": 0.21412737075453625, "percentage": 21.41, "elapsed_time": "1 day, 12:07:48", "remaining_time": "5 days, 12:35:18", "throughput": 2713.61, "total_tokens": 352955680} {"current_steps": 1957, "total_steps": 9134, "loss": 0.76, "learning_rate": 4.454731872541622e-05, "epoch": 0.21423684282547414, "percentage": 21.43, "elapsed_time": "1 day, 12:08:54", "remaining_time": "5 days, 12:34:09", "throughput": 2713.42, "total_tokens": 353110240} {"current_steps": 1958, "total_steps": 9134, "loss": 0.8617, "learning_rate": 4.454195707664825e-05, "epoch": 0.21434631489641207, "percentage": 21.44, "elapsed_time": "1 day, 12:09:59", "remaining_time": "5 days, 12:32:55", "throughput": 2713.52, "total_tokens": 353297952} {"current_steps": 1959, "total_steps": 9134, "loss": 0.658, "learning_rate": 4.4536593116104125e-05, "epoch": 0.21445578696734996, "percentage": 21.45, "elapsed_time": "1 day, 12:10:59", "remaining_time": "5 days, 12:31:27", "throughput": 2713.37, "total_tokens": 353442880} {"current_steps": 1960, "total_steps": 9134, "loss": 0.6638, "learning_rate": 4.453122684441837e-05, "epoch": 0.21456525903828785, "percentage": 21.46, "elapsed_time": "1 day, 12:12:04", "remaining_time": "5 days, 12:30:15", "throughput": 2713.41, "total_tokens": 353624320} {"current_steps": 1961, "total_steps": 9134, "loss": 0.723, "learning_rate": 4.452585826222583e-05, "epoch": 0.21467473110922575, "percentage": 21.47, "elapsed_time": "1 day, 12:13:12", "remaining_time": "5 days, 12:29:14", "throughput": 2713.56, "total_tokens": 353829056} {"current_steps": 1962, "total_steps": 9134, "loss": 0.7129, "learning_rate": 4.4520487370161576e-05, "epoch": 0.21478420318016367, "percentage": 21.48, "elapsed_time": "1 day, 12:14:22", "remaining_time": "5 days, 12:28:18", "throughput": 2713.54, "total_tokens": 354013632} {"current_steps": 1963, "total_steps": 9134, "loss": 0.8509, "learning_rate": 4.451511416886099e-05, "epoch": 0.21489367525110156, "percentage": 21.49, "elapsed_time": "1 day, 12:15:32", "remaining_time": "5 days, 12:27:24", "throughput": 2713.84, "total_tokens": 354243008} {"current_steps": 1964, "total_steps": 9134, "loss": 0.7095, "learning_rate": 4.45097386589597e-05, "epoch": 0.21500314732203946, "percentage": 21.5, "elapsed_time": "1 day, 12:16:35", "remaining_time": "5 days, 12:26:07", "throughput": 2713.8, "total_tokens": 354410336} {"current_steps": 1965, "total_steps": 9134, "loss": 0.8761, "learning_rate": 4.450436084109362e-05, "epoch": 0.21511261939297738, "percentage": 21.51, "elapsed_time": "1 day, 12:17:41", "remaining_time": "5 days, 12:24:59", "throughput": 2713.82, "total_tokens": 354592448} {"current_steps": 1966, "total_steps": 9134, "loss": 0.6093, "learning_rate": 4.449898071589894e-05, "epoch": 0.21522209146391527, "percentage": 21.52, "elapsed_time": "1 day, 12:18:45", "remaining_time": "5 days, 12:23:43", "throughput": 2713.79, "total_tokens": 354762240} {"current_steps": 1967, "total_steps": 9134, "loss": 0.7803, "learning_rate": 4.449359828401212e-05, "epoch": 0.21533156353485317, "percentage": 21.53, "elapsed_time": "1 day, 12:19:54", "remaining_time": "5 days, 12:22:46", "throughput": 2713.72, "total_tokens": 354939648} {"current_steps": 1968, "total_steps": 9134, "loss": 0.8137, "learning_rate": 4.4488213546069884e-05, "epoch": 0.21544103560579106, "percentage": 21.55, "elapsed_time": "1 day, 12:21:01", "remaining_time": "5 days, 12:21:38", "throughput": 2713.68, "total_tokens": 355115488} {"current_steps": 1969, "total_steps": 9134, "loss": 0.6437, "learning_rate": 4.448282650270924e-05, "epoch": 0.21555050767672898, "percentage": 21.56, "elapsed_time": "1 day, 12:22:00", "remaining_time": "5 days, 12:20:06", "throughput": 2713.52, "total_tokens": 355254816} {"current_steps": 1970, "total_steps": 9134, "loss": 0.6666, "learning_rate": 4.447743715456747e-05, "epoch": 0.21565997974766687, "percentage": 21.57, "elapsed_time": "1 day, 12:23:04", "remaining_time": "5 days, 12:18:52", "throughput": 2713.42, "total_tokens": 355415872} {"current_steps": 1971, "total_steps": 9134, "loss": 0.7389, "learning_rate": 4.4472045502282115e-05, "epoch": 0.21576945181860477, "percentage": 21.58, "elapsed_time": "1 day, 12:24:13", "remaining_time": "5 days, 12:17:52", "throughput": 2713.45, "total_tokens": 355606720} {"current_steps": 1972, "total_steps": 9134, "loss": 1.0017, "learning_rate": 4.4466651546491006e-05, "epoch": 0.2158789238895427, "percentage": 21.59, "elapsed_time": "1 day, 12:25:22", "remaining_time": "5 days, 12:16:55", "throughput": 2713.57, "total_tokens": 355809664} {"current_steps": 1973, "total_steps": 9134, "loss": 0.8947, "learning_rate": 4.4461255287832235e-05, "epoch": 0.21598839596048058, "percentage": 21.6, "elapsed_time": "1 day, 12:26:26", "remaining_time": "5 days, 12:15:42", "throughput": 2713.62, "total_tokens": 355991552} {"current_steps": 1974, "total_steps": 9134, "loss": 0.806, "learning_rate": 4.4455856726944155e-05, "epoch": 0.21609786803141848, "percentage": 21.61, "elapsed_time": "1 day, 12:27:36", "remaining_time": "5 days, 12:14:46", "throughput": 2713.83, "total_tokens": 356207040} {"current_steps": 1975, "total_steps": 9134, "loss": 0.8259, "learning_rate": 4.445045586446543e-05, "epoch": 0.2162073401023564, "percentage": 21.62, "elapsed_time": "1 day, 12:28:43", "remaining_time": "5 days, 12:13:42", "throughput": 2713.9, "total_tokens": 356398784} {"current_steps": 1976, "total_steps": 9134, "loss": 0.6571, "learning_rate": 4.4445052701034955e-05, "epoch": 0.2163168121732943, "percentage": 21.63, "elapsed_time": "1 day, 12:29:50", "remaining_time": "5 days, 12:12:39", "throughput": 2714.01, "total_tokens": 356596800} {"current_steps": 1977, "total_steps": 9134, "loss": 0.9279, "learning_rate": 4.443964723729191e-05, "epoch": 0.2164262842442322, "percentage": 21.64, "elapsed_time": "1 day, 12:30:59", "remaining_time": "5 days, 12:11:40", "throughput": 2714.05, "total_tokens": 356788096} {"current_steps": 1978, "total_steps": 9134, "loss": 0.8563, "learning_rate": 4.443423947387577e-05, "epoch": 0.21653575631517008, "percentage": 21.66, "elapsed_time": "1 day, 12:32:06", "remaining_time": "5 days, 12:10:37", "throughput": 2714.07, "total_tokens": 356972672} {"current_steps": 1979, "total_steps": 9134, "loss": 0.6347, "learning_rate": 4.4428829411426254e-05, "epoch": 0.216645228386108, "percentage": 21.67, "elapsed_time": "1 day, 12:33:15", "remaining_time": "5 days, 12:09:40", "throughput": 2714.1, "total_tokens": 357163968} {"current_steps": 1980, "total_steps": 9134, "loss": 0.7792, "learning_rate": 4.442341705058335e-05, "epoch": 0.2167547004570459, "percentage": 21.68, "elapsed_time": "1 day, 12:34:25", "remaining_time": "5 days, 12:08:44", "throughput": 2714.12, "total_tokens": 357355936} {"current_steps": 1981, "total_steps": 9134, "loss": 0.8749, "learning_rate": 4.4418002391987345e-05, "epoch": 0.2168641725279838, "percentage": 21.69, "elapsed_time": "1 day, 12:35:32", "remaining_time": "5 days, 12:07:40", "throughput": 2714.25, "total_tokens": 357555072} {"current_steps": 1982, "total_steps": 9134, "loss": 0.7566, "learning_rate": 4.441258543627879e-05, "epoch": 0.2169736445989217, "percentage": 21.7, "elapsed_time": "1 day, 12:36:36", "remaining_time": "5 days, 12:06:23", "throughput": 2714.19, "total_tokens": 357720608} {"current_steps": 1983, "total_steps": 9134, "loss": 0.8343, "learning_rate": 4.440716618409847e-05, "epoch": 0.2170831166698596, "percentage": 21.71, "elapsed_time": "1 day, 12:37:42", "remaining_time": "5 days, 12:05:15", "throughput": 2714.23, "total_tokens": 357904512} {"current_steps": 1984, "total_steps": 9134, "loss": 0.6336, "learning_rate": 4.4401744636087495e-05, "epoch": 0.2171925887407975, "percentage": 21.72, "elapsed_time": "1 day, 12:38:46", "remaining_time": "5 days, 12:03:59", "throughput": 2714.2, "total_tokens": 358073632} {"current_steps": 1985, "total_steps": 9134, "loss": 0.7854, "learning_rate": 4.439632079288722e-05, "epoch": 0.2173020608117354, "percentage": 21.73, "elapsed_time": "1 day, 12:39:55", "remaining_time": "5 days, 12:03:04", "throughput": 2714.36, "total_tokens": 358283744} {"current_steps": 1986, "total_steps": 9134, "loss": 0.6696, "learning_rate": 4.439089465513928e-05, "epoch": 0.21741153288267331, "percentage": 21.74, "elapsed_time": "1 day, 12:40:59", "remaining_time": "5 days, 12:01:46", "throughput": 2714.22, "total_tokens": 358437856} {"current_steps": 1987, "total_steps": 9134, "loss": 0.8466, "learning_rate": 4.438546622348557e-05, "epoch": 0.2175210049536112, "percentage": 21.75, "elapsed_time": "1 day, 12:42:06", "remaining_time": "5 days, 12:00:43", "throughput": 2714.21, "total_tokens": 358619072} {"current_steps": 1988, "total_steps": 9134, "loss": 0.5911, "learning_rate": 4.438003549856826e-05, "epoch": 0.2176304770245491, "percentage": 21.76, "elapsed_time": "1 day, 12:43:12", "remaining_time": "5 days, 11:59:36", "throughput": 2714.05, "total_tokens": 358778112} {"current_steps": 1989, "total_steps": 9134, "loss": 0.858, "learning_rate": 4.4374602481029807e-05, "epoch": 0.21773994909548702, "percentage": 21.78, "elapsed_time": "1 day, 12:44:22", "remaining_time": "5 days, 11:58:41", "throughput": 2714.23, "total_tokens": 358991136} {"current_steps": 1990, "total_steps": 9134, "loss": 0.6973, "learning_rate": 4.43691671715129e-05, "epoch": 0.21784942116642492, "percentage": 21.79, "elapsed_time": "1 day, 12:45:22", "remaining_time": "5 days, 11:57:11", "throughput": 2714.04, "total_tokens": 359128672} {"current_steps": 1991, "total_steps": 9134, "loss": 0.6666, "learning_rate": 4.436372957066056e-05, "epoch": 0.2179588932373628, "percentage": 21.8, "elapsed_time": "1 day, 12:46:29", "remaining_time": "5 days, 11:56:05", "throughput": 2713.96, "total_tokens": 359299360} {"current_steps": 1992, "total_steps": 9134, "loss": 0.7876, "learning_rate": 4.4358289679116026e-05, "epoch": 0.21806836530830073, "percentage": 21.81, "elapsed_time": "1 day, 12:47:36", "remaining_time": "5 days, 11:55:01", "throughput": 2714.03, "total_tokens": 359490208} {"current_steps": 1993, "total_steps": 9134, "loss": 0.6753, "learning_rate": 4.435284749752283e-05, "epoch": 0.21817783737923863, "percentage": 21.82, "elapsed_time": "1 day, 12:48:40", "remaining_time": "5 days, 11:53:44", "throughput": 2714.01, "total_tokens": 359661120} {"current_steps": 1994, "total_steps": 9134, "loss": 0.8226, "learning_rate": 4.434740302652477e-05, "epoch": 0.21828730945017652, "percentage": 21.83, "elapsed_time": "1 day, 12:49:45", "remaining_time": "5 days, 11:52:35", "throughput": 2714.02, "total_tokens": 359840096} {"current_steps": 1995, "total_steps": 9134, "loss": 0.569, "learning_rate": 4.434195626676592e-05, "epoch": 0.2183967815211144, "percentage": 21.84, "elapsed_time": "1 day, 12:50:51", "remaining_time": "5 days, 11:51:27", "throughput": 2714.02, "total_tokens": 360019520} {"current_steps": 1996, "total_steps": 9134, "loss": 0.688, "learning_rate": 4.4336507218890624e-05, "epoch": 0.21850625359205234, "percentage": 21.85, "elapsed_time": "1 day, 12:51:57", "remaining_time": "5 days, 11:50:16", "throughput": 2714.06, "total_tokens": 360202528} {"current_steps": 1997, "total_steps": 9134, "loss": 0.7879, "learning_rate": 4.433105588354348e-05, "epoch": 0.21861572566299023, "percentage": 21.86, "elapsed_time": "1 day, 12:53:03", "remaining_time": "5 days, 11:49:10", "throughput": 2714.06, "total_tokens": 360382848} {"current_steps": 1998, "total_steps": 9134, "loss": 0.8162, "learning_rate": 4.4325602261369384e-05, "epoch": 0.21872519773392812, "percentage": 21.87, "elapsed_time": "1 day, 12:54:13", "remaining_time": "5 days, 11:48:14", "throughput": 2714.24, "total_tokens": 360595200} {"current_steps": 1999, "total_steps": 9134, "loss": 0.4785, "learning_rate": 4.432014635301348e-05, "epoch": 0.21883466980486604, "percentage": 21.89, "elapsed_time": "1 day, 12:55:18", "remaining_time": "5 days, 11:47:05", "throughput": 2714.14, "total_tokens": 360760960} {"current_steps": 2000, "total_steps": 9134, "loss": 0.8412, "learning_rate": 4.43146881591212e-05, "epoch": 0.21894414187580394, "percentage": 21.9, "elapsed_time": "1 day, 12:56:28", "remaining_time": "5 days, 11:46:08", "throughput": 2714.22, "total_tokens": 360958752} {"current_steps": 2001, "total_steps": 9134, "loss": 1.052, "learning_rate": 4.430922768033824e-05, "epoch": 0.21905361394674183, "percentage": 21.91, "elapsed_time": "1 day, 12:59:54", "remaining_time": "5 days, 11:53:21", "throughput": 2711.39, "total_tokens": 361143552} {"current_steps": 2002, "total_steps": 9134, "loss": 0.711, "learning_rate": 4.4303764917310555e-05, "epoch": 0.21916308601767973, "percentage": 21.92, "elapsed_time": "1 day, 13:01:02", "remaining_time": "5 days, 11:52:20", "throughput": 2711.49, "total_tokens": 361340224} {"current_steps": 2003, "total_steps": 9134, "loss": 0.6528, "learning_rate": 4.429829987068438e-05, "epoch": 0.21927255808861765, "percentage": 21.93, "elapsed_time": "1 day, 13:02:06", "remaining_time": "5 days, 11:51:04", "throughput": 2711.48, "total_tokens": 361512032} {"current_steps": 2004, "total_steps": 9134, "loss": 0.8474, "learning_rate": 4.4292832541106214e-05, "epoch": 0.21938203015955554, "percentage": 21.94, "elapsed_time": "1 day, 13:03:15", "remaining_time": "5 days, 11:50:04", "throughput": 2711.58, "total_tokens": 361712288} {"current_steps": 2005, "total_steps": 9134, "loss": 0.8661, "learning_rate": 4.428736292922285e-05, "epoch": 0.21949150223049343, "percentage": 21.95, "elapsed_time": "1 day, 13:04:22", "remaining_time": "5 days, 11:49:01", "throughput": 2711.66, "total_tokens": 361905600} {"current_steps": 2006, "total_steps": 9134, "loss": 0.6566, "learning_rate": 4.428189103568132e-05, "epoch": 0.21960097430143136, "percentage": 21.96, "elapsed_time": "1 day, 13:05:31", "remaining_time": "5 days, 11:48:04", "throughput": 2711.78, "total_tokens": 362109216} {"current_steps": 2007, "total_steps": 9134, "loss": 0.6232, "learning_rate": 4.427641686112894e-05, "epoch": 0.21971044637236925, "percentage": 21.97, "elapsed_time": "1 day, 13:06:38", "remaining_time": "5 days, 11:46:58", "throughput": 2711.92, "total_tokens": 362308576} {"current_steps": 2008, "total_steps": 9134, "loss": 0.6635, "learning_rate": 4.4270940406213304e-05, "epoch": 0.21981991844330714, "percentage": 21.98, "elapsed_time": "1 day, 13:07:44", "remaining_time": "5 days, 11:45:50", "throughput": 2711.87, "total_tokens": 362481952} {"current_steps": 2009, "total_steps": 9134, "loss": 0.6922, "learning_rate": 4.4265461671582254e-05, "epoch": 0.21992939051424507, "percentage": 21.99, "elapsed_time": "1 day, 13:08:49", "remaining_time": "5 days, 11:44:38", "throughput": 2711.66, "total_tokens": 362630912} {"current_steps": 2010, "total_steps": 9134, "loss": 1.0244, "learning_rate": 4.4259980657883916e-05, "epoch": 0.22003886258518296, "percentage": 22.01, "elapsed_time": "1 day, 13:09:58", "remaining_time": "5 days, 11:43:40", "throughput": 2711.94, "total_tokens": 362855136} {"current_steps": 2011, "total_steps": 9134, "loss": 0.7141, "learning_rate": 4.425449736576668e-05, "epoch": 0.22014833465612085, "percentage": 22.02, "elapsed_time": "1 day, 13:11:06", "remaining_time": "5 days, 11:42:35", "throughput": 2712.06, "total_tokens": 363052256} {"current_steps": 2012, "total_steps": 9134, "loss": 0.8426, "learning_rate": 4.424901179587922e-05, "epoch": 0.22025780672705875, "percentage": 22.03, "elapsed_time": "1 day, 13:12:09", "remaining_time": "5 days, 11:41:19", "throughput": 2711.99, "total_tokens": 363216000} {"current_steps": 2013, "total_steps": 9134, "loss": 0.6569, "learning_rate": 4.4243523948870465e-05, "epoch": 0.22036727879799667, "percentage": 22.04, "elapsed_time": "1 day, 13:13:12", "remaining_time": "5 days, 11:39:58", "throughput": 2711.89, "total_tokens": 363372352} {"current_steps": 2014, "total_steps": 9134, "loss": 0.6161, "learning_rate": 4.4238033825389605e-05, "epoch": 0.22047675086893456, "percentage": 22.05, "elapsed_time": "1 day, 13:14:21", "remaining_time": "5 days, 11:39:00", "throughput": 2712.06, "total_tokens": 363582464} {"current_steps": 2015, "total_steps": 9134, "loss": 0.6432, "learning_rate": 4.423254142608613e-05, "epoch": 0.22058622293987246, "percentage": 22.06, "elapsed_time": "1 day, 13:15:24", "remaining_time": "5 days, 11:37:41", "throughput": 2711.93, "total_tokens": 363736352} {"current_steps": 2016, "total_steps": 9134, "loss": 0.6241, "learning_rate": 4.422704675160976e-05, "epoch": 0.22069569501081038, "percentage": 22.07, "elapsed_time": "1 day, 13:16:32", "remaining_time": "5 days, 11:36:40", "throughput": 2712.13, "total_tokens": 363946688} {"current_steps": 2017, "total_steps": 9134, "loss": 0.6576, "learning_rate": 4.422154980261053e-05, "epoch": 0.22080516708174827, "percentage": 22.08, "elapsed_time": "1 day, 13:17:40", "remaining_time": "5 days, 11:35:37", "throughput": 2712.2, "total_tokens": 364140896} {"current_steps": 2018, "total_steps": 9134, "loss": 0.7891, "learning_rate": 4.4216050579738685e-05, "epoch": 0.22091463915268617, "percentage": 22.09, "elapsed_time": "1 day, 13:18:45", "remaining_time": "5 days, 11:34:28", "throughput": 2712.17, "total_tokens": 364314272} {"current_steps": 2019, "total_steps": 9134, "loss": 0.6892, "learning_rate": 4.42105490836448e-05, "epoch": 0.22102411122362406, "percentage": 22.1, "elapsed_time": "1 day, 13:19:54", "remaining_time": "5 days, 11:33:30", "throughput": 2712.44, "total_tokens": 364537376} {"current_steps": 2020, "total_steps": 9134, "loss": 0.7486, "learning_rate": 4.420504531497969e-05, "epoch": 0.22113358329456198, "percentage": 22.12, "elapsed_time": "1 day, 13:21:03", "remaining_time": "5 days, 11:32:32", "throughput": 2712.5, "total_tokens": 364732480} {"current_steps": 2021, "total_steps": 9134, "loss": 0.6361, "learning_rate": 4.419953927439443e-05, "epoch": 0.22124305536549987, "percentage": 22.13, "elapsed_time": "1 day, 13:22:10", "remaining_time": "5 days, 11:31:27", "throughput": 2712.49, "total_tokens": 364914144} {"current_steps": 2022, "total_steps": 9134, "loss": 0.5429, "learning_rate": 4.419403096254037e-05, "epoch": 0.22135252743643777, "percentage": 22.14, "elapsed_time": "1 day, 13:23:18", "remaining_time": "5 days, 11:30:26", "throughput": 2712.49, "total_tokens": 365098720} {"current_steps": 2023, "total_steps": 9134, "loss": 0.7161, "learning_rate": 4.4188520380069145e-05, "epoch": 0.2214619995073757, "percentage": 22.15, "elapsed_time": "1 day, 13:24:24", "remaining_time": "5 days, 11:29:16", "throughput": 2712.33, "total_tokens": 365254400} {"current_steps": 2024, "total_steps": 9134, "loss": 0.7134, "learning_rate": 4.418300752763264e-05, "epoch": 0.22157147157831358, "percentage": 22.16, "elapsed_time": "1 day, 13:25:28", "remaining_time": "5 days, 11:27:59", "throughput": 2712.14, "total_tokens": 365401120} {"current_steps": 2025, "total_steps": 9134, "loss": 0.6245, "learning_rate": 4.4177492405883016e-05, "epoch": 0.22168094364925148, "percentage": 22.17, "elapsed_time": "1 day, 13:26:35", "remaining_time": "5 days, 11:26:57", "throughput": 2712.22, "total_tokens": 365595776} {"current_steps": 2026, "total_steps": 9134, "loss": 0.5532, "learning_rate": 4.4171975015472705e-05, "epoch": 0.2217904157201894, "percentage": 22.18, "elapsed_time": "1 day, 13:27:40", "remaining_time": "5 days, 11:25:43", "throughput": 2712.21, "total_tokens": 365770048} {"current_steps": 2027, "total_steps": 9134, "loss": 0.6425, "learning_rate": 4.4166455357054394e-05, "epoch": 0.2218998877911273, "percentage": 22.19, "elapsed_time": "1 day, 13:28:42", "remaining_time": "5 days, 11:24:19", "throughput": 2712.15, "total_tokens": 365929312} {"current_steps": 2028, "total_steps": 9134, "loss": 0.5842, "learning_rate": 4.416093343128106e-05, "epoch": 0.2220093598620652, "percentage": 22.2, "elapsed_time": "1 day, 13:29:45", "remaining_time": "5 days, 11:23:01", "throughput": 2712.06, "total_tokens": 366089248} {"current_steps": 2029, "total_steps": 9134, "loss": 0.8142, "learning_rate": 4.415540923880593e-05, "epoch": 0.22211883193300308, "percentage": 22.21, "elapsed_time": "1 day, 13:30:50", "remaining_time": "5 days, 11:21:50", "throughput": 2712.19, "total_tokens": 366283232} {"current_steps": 2030, "total_steps": 9134, "loss": 1.0114, "learning_rate": 4.41498827802825e-05, "epoch": 0.222228304003941, "percentage": 22.22, "elapsed_time": "1 day, 13:31:55", "remaining_time": "5 days, 11:20:36", "throughput": 2712.25, "total_tokens": 366466240} {"current_steps": 2031, "total_steps": 9134, "loss": 0.8991, "learning_rate": 4.414435405636455e-05, "epoch": 0.2223377760748789, "percentage": 22.24, "elapsed_time": "1 day, 13:33:03", "remaining_time": "5 days, 11:19:35", "throughput": 2712.33, "total_tokens": 366662464} {"current_steps": 2032, "total_steps": 9134, "loss": 0.6525, "learning_rate": 4.4138823067706116e-05, "epoch": 0.2224472481458168, "percentage": 22.25, "elapsed_time": "1 day, 13:34:10", "remaining_time": "5 days, 11:18:31", "throughput": 2712.27, "total_tokens": 366836960} {"current_steps": 2033, "total_steps": 9134, "loss": 0.5975, "learning_rate": 4.413328981496149e-05, "epoch": 0.2225567202167547, "percentage": 22.26, "elapsed_time": "1 day, 13:35:09", "remaining_time": "5 days, 11:16:58", "throughput": 2712.07, "total_tokens": 366969120} {"current_steps": 2034, "total_steps": 9134, "loss": 0.7552, "learning_rate": 4.412775429878527e-05, "epoch": 0.2226661922876926, "percentage": 22.27, "elapsed_time": "1 day, 13:36:17", "remaining_time": "5 days, 11:15:55", "throughput": 2712.0, "total_tokens": 367142496} {"current_steps": 2035, "total_steps": 9134, "loss": 0.6497, "learning_rate": 4.412221651983227e-05, "epoch": 0.2227756643586305, "percentage": 22.28, "elapsed_time": "1 day, 13:37:20", "remaining_time": "5 days, 11:14:37", "throughput": 2712.0, "total_tokens": 367314528} {"current_steps": 2036, "total_steps": 9134, "loss": 0.7986, "learning_rate": 4.4116676478757616e-05, "epoch": 0.22288513642956842, "percentage": 22.29, "elapsed_time": "1 day, 13:38:22", "remaining_time": "5 days, 11:13:14", "throughput": 2712.01, "total_tokens": 367483200} {"current_steps": 2037, "total_steps": 9134, "loss": 0.9344, "learning_rate": 4.4111134176216685e-05, "epoch": 0.22299460850050631, "percentage": 22.3, "elapsed_time": "1 day, 13:39:30", "remaining_time": "5 days, 11:12:12", "throughput": 2712.07, "total_tokens": 367675392} {"current_steps": 2038, "total_steps": 9134, "loss": 0.803, "learning_rate": 4.410558961286511e-05, "epoch": 0.2231040805714442, "percentage": 22.31, "elapsed_time": "1 day, 13:40:35", "remaining_time": "5 days, 11:11:02", "throughput": 2712.04, "total_tokens": 367848544} {"current_steps": 2039, "total_steps": 9134, "loss": 0.4954, "learning_rate": 4.41000427893588e-05, "epoch": 0.2232135526423821, "percentage": 22.32, "elapsed_time": "1 day, 13:41:40", "remaining_time": "5 days, 11:09:48", "throughput": 2712.06, "total_tokens": 368026624} {"current_steps": 2040, "total_steps": 9134, "loss": 0.79, "learning_rate": 4.409449370635395e-05, "epoch": 0.22332302471332002, "percentage": 22.33, "elapsed_time": "1 day, 13:42:47", "remaining_time": "5 days, 11:08:43", "throughput": 2712.12, "total_tokens": 368216128} {"current_steps": 2041, "total_steps": 9134, "loss": 0.8221, "learning_rate": 4.4088942364506994e-05, "epoch": 0.22343249678425792, "percentage": 22.35, "elapsed_time": "1 day, 13:43:55", "remaining_time": "5 days, 11:07:43", "throughput": 2712.34, "total_tokens": 368432512} {"current_steps": 2042, "total_steps": 9134, "loss": 0.7129, "learning_rate": 4.408338876447465e-05, "epoch": 0.2235419688551958, "percentage": 22.36, "elapsed_time": "1 day, 13:45:04", "remaining_time": "5 days, 11:06:45", "throughput": 2712.58, "total_tokens": 368652032} {"current_steps": 2043, "total_steps": 9134, "loss": 0.7354, "learning_rate": 4.4077832906913895e-05, "epoch": 0.22365144092613373, "percentage": 22.37, "elapsed_time": "1 day, 13:46:13", "remaining_time": "5 days, 11:05:46", "throughput": 2712.72, "total_tokens": 368857440} {"current_steps": 2044, "total_steps": 9134, "loss": 1.0417, "learning_rate": 4.407227479248198e-05, "epoch": 0.22376091299707163, "percentage": 22.38, "elapsed_time": "1 day, 13:47:19", "remaining_time": "5 days, 11:04:39", "throughput": 2712.8, "total_tokens": 369048512} {"current_steps": 2045, "total_steps": 9134, "loss": 0.8381, "learning_rate": 4.406671442183642e-05, "epoch": 0.22387038506800952, "percentage": 22.39, "elapsed_time": "1 day, 13:48:25", "remaining_time": "5 days, 11:03:30", "throughput": 2712.9, "total_tokens": 369241600} {"current_steps": 2046, "total_steps": 9134, "loss": 0.7005, "learning_rate": 4.4061151795634985e-05, "epoch": 0.2239798571389474, "percentage": 22.4, "elapsed_time": "1 day, 13:49:31", "remaining_time": "5 days, 11:02:22", "throughput": 2713.08, "total_tokens": 369445440} {"current_steps": 2047, "total_steps": 9134, "loss": 0.6792, "learning_rate": 4.405558691453574e-05, "epoch": 0.22408932920988534, "percentage": 22.41, "elapsed_time": "1 day, 13:50:36", "remaining_time": "5 days, 11:01:08", "throughput": 2713.14, "total_tokens": 369628448} {"current_steps": 2048, "total_steps": 9134, "loss": 0.6395, "learning_rate": 4.4050019779196984e-05, "epoch": 0.22419880128082323, "percentage": 22.42, "elapsed_time": "1 day, 13:51:37", "remaining_time": "5 days, 10:59:43", "throughput": 2713.05, "total_tokens": 369781216} {"current_steps": 2049, "total_steps": 9134, "loss": 0.7212, "learning_rate": 4.4044450390277306e-05, "epoch": 0.22430827335176112, "percentage": 22.43, "elapsed_time": "1 day, 13:52:41", "remaining_time": "5 days, 10:58:30", "throughput": 2713.09, "total_tokens": 369962208} {"current_steps": 2050, "total_steps": 9134, "loss": 0.8673, "learning_rate": 4.403887874843556e-05, "epoch": 0.22441774542269904, "percentage": 22.44, "elapsed_time": "1 day, 13:53:51", "remaining_time": "5 days, 10:57:33", "throughput": 2713.2, "total_tokens": 370166048} {"current_steps": 2051, "total_steps": 9134, "loss": 0.7634, "learning_rate": 4.403330485433085e-05, "epoch": 0.22452721749363694, "percentage": 22.45, "elapsed_time": "1 day, 13:54:56", "remaining_time": "5 days, 10:56:23", "throughput": 2713.09, "total_tokens": 370328448} {"current_steps": 2052, "total_steps": 9134, "loss": 0.7397, "learning_rate": 4.4027728708622555e-05, "epoch": 0.22463668956457483, "percentage": 22.47, "elapsed_time": "1 day, 13:56:03", "remaining_time": "5 days, 10:55:16", "throughput": 2713.01, "total_tokens": 370497792} {"current_steps": 2053, "total_steps": 9134, "loss": 0.6868, "learning_rate": 4.4022150311970335e-05, "epoch": 0.22474616163551275, "percentage": 22.48, "elapsed_time": "1 day, 13:57:12", "remaining_time": "5 days, 10:54:17", "throughput": 2713.03, "total_tokens": 370686176} {"current_steps": 2054, "total_steps": 9134, "loss": 0.8084, "learning_rate": 4.4016569665034105e-05, "epoch": 0.22485563370645065, "percentage": 22.49, "elapsed_time": "1 day, 13:58:18", "remaining_time": "5 days, 10:53:11", "throughput": 2713.17, "total_tokens": 370887552} {"current_steps": 2055, "total_steps": 9134, "loss": 0.7042, "learning_rate": 4.401098676847402e-05, "epoch": 0.22496510577738854, "percentage": 22.5, "elapsed_time": "1 day, 13:59:22", "remaining_time": "5 days, 10:51:55", "throughput": 2713.16, "total_tokens": 371058912} {"current_steps": 2056, "total_steps": 9134, "loss": 0.702, "learning_rate": 4.400540162295056e-05, "epoch": 0.22507457784832643, "percentage": 22.51, "elapsed_time": "1 day, 14:00:24", "remaining_time": "5 days, 10:50:32", "throughput": 2713.02, "total_tokens": 371208096} {"current_steps": 2057, "total_steps": 9134, "loss": 0.5679, "learning_rate": 4.399981422912441e-05, "epoch": 0.22518404991926436, "percentage": 22.52, "elapsed_time": "1 day, 14:01:27", "remaining_time": "5 days, 10:49:13", "throughput": 2712.94, "total_tokens": 371367136} {"current_steps": 2058, "total_steps": 9134, "loss": 0.6447, "learning_rate": 4.3994224587656556e-05, "epoch": 0.22529352199020225, "percentage": 22.53, "elapsed_time": "1 day, 14:02:33", "remaining_time": "5 days, 10:48:06", "throughput": 2712.96, "total_tokens": 371550368} {"current_steps": 2059, "total_steps": 9134, "loss": 0.5606, "learning_rate": 4.398863269920825e-05, "epoch": 0.22540299406114014, "percentage": 22.54, "elapsed_time": "1 day, 14:03:36", "remaining_time": "5 days, 10:46:47", "throughput": 2712.95, "total_tokens": 371719040} {"current_steps": 2060, "total_steps": 9134, "loss": 0.9015, "learning_rate": 4.398303856444099e-05, "epoch": 0.22551246613207807, "percentage": 22.55, "elapsed_time": "1 day, 14:04:45", "remaining_time": "5 days, 10:45:48", "throughput": 2712.96, "total_tokens": 371906304} {"current_steps": 2061, "total_steps": 9134, "loss": 0.8008, "learning_rate": 4.397744218401657e-05, "epoch": 0.22562193820301596, "percentage": 22.56, "elapsed_time": "1 day, 14:05:54", "remaining_time": "5 days, 10:44:49", "throughput": 2713.01, "total_tokens": 372101408} {"current_steps": 2062, "total_steps": 9134, "loss": 0.6843, "learning_rate": 4.3971843558597e-05, "epoch": 0.22573141027395385, "percentage": 22.57, "elapsed_time": "1 day, 14:07:02", "remaining_time": "5 days, 10:43:50", "throughput": 2713.21, "total_tokens": 372314880} {"current_steps": 2063, "total_steps": 9134, "loss": 0.5991, "learning_rate": 4.396624268884462e-05, "epoch": 0.22584088234489175, "percentage": 22.59, "elapsed_time": "1 day, 14:08:11", "remaining_time": "5 days, 10:42:51", "throughput": 2713.06, "total_tokens": 372480640} {"current_steps": 2064, "total_steps": 9134, "loss": 0.9296, "learning_rate": 4.396063957542198e-05, "epoch": 0.22595035441582967, "percentage": 22.6, "elapsed_time": "1 day, 14:09:20", "remaining_time": "5 days, 10:41:53", "throughput": 2713.15, "total_tokens": 372680000} {"current_steps": 2065, "total_steps": 9134, "loss": 0.8449, "learning_rate": 4.3955034218991934e-05, "epoch": 0.22605982648676756, "percentage": 22.61, "elapsed_time": "1 day, 14:10:27", "remaining_time": "5 days, 10:40:46", "throughput": 2713.31, "total_tokens": 372882944} {"current_steps": 2066, "total_steps": 9134, "loss": 0.7749, "learning_rate": 4.394942662021756e-05, "epoch": 0.22616929855770546, "percentage": 22.62, "elapsed_time": "1 day, 14:11:33", "remaining_time": "5 days, 10:39:39", "throughput": 2713.35, "total_tokens": 373067968} {"current_steps": 2067, "total_steps": 9134, "loss": 0.7659, "learning_rate": 4.3943816779762256e-05, "epoch": 0.22627877062864338, "percentage": 22.63, "elapsed_time": "1 day, 14:12:33", "remaining_time": "5 days, 10:38:11", "throughput": 2713.28, "total_tokens": 373221184} {"current_steps": 2068, "total_steps": 9134, "loss": 0.9793, "learning_rate": 4.393820469828964e-05, "epoch": 0.22638824269958127, "percentage": 22.64, "elapsed_time": "1 day, 14:13:41", "remaining_time": "5 days, 10:37:07", "throughput": 2713.48, "total_tokens": 373432416} {"current_steps": 2069, "total_steps": 9134, "loss": 0.6913, "learning_rate": 4.39325903764636e-05, "epoch": 0.22649771477051917, "percentage": 22.65, "elapsed_time": "1 day, 14:14:47", "remaining_time": "5 days, 10:35:59", "throughput": 2713.45, "total_tokens": 373606688} {"current_steps": 2070, "total_steps": 9134, "loss": 0.681, "learning_rate": 4.392697381494832e-05, "epoch": 0.2266071868414571, "percentage": 22.66, "elapsed_time": "1 day, 14:15:54", "remaining_time": "5 days, 10:34:55", "throughput": 2713.48, "total_tokens": 373793728} {"current_steps": 2071, "total_steps": 9134, "loss": 0.6642, "learning_rate": 4.3921355014408226e-05, "epoch": 0.22671665891239498, "percentage": 22.67, "elapsed_time": "1 day, 14:16:57", "remaining_time": "5 days, 10:33:38", "throughput": 2713.39, "total_tokens": 373954112} {"current_steps": 2072, "total_steps": 9134, "loss": 0.8819, "learning_rate": 4.3915733975508e-05, "epoch": 0.22682613098333287, "percentage": 22.68, "elapsed_time": "1 day, 14:18:06", "remaining_time": "5 days, 10:32:37", "throughput": 2713.54, "total_tokens": 374159968} {"current_steps": 2073, "total_steps": 9134, "loss": 0.7061, "learning_rate": 4.39101106989126e-05, "epoch": 0.22693560305427077, "percentage": 22.7, "elapsed_time": "1 day, 14:19:15", "remaining_time": "5 days, 10:31:39", "throughput": 2713.46, "total_tokens": 374335584} {"current_steps": 2074, "total_steps": 9134, "loss": 0.7383, "learning_rate": 4.3904485185287256e-05, "epoch": 0.2270450751252087, "percentage": 22.71, "elapsed_time": "1 day, 14:20:19", "remaining_time": "5 days, 10:30:24", "throughput": 2713.53, "total_tokens": 374519040} {"current_steps": 2075, "total_steps": 9134, "loss": 0.8211, "learning_rate": 4.389885743529746e-05, "epoch": 0.22715454719614658, "percentage": 22.72, "elapsed_time": "1 day, 14:21:25", "remaining_time": "5 days, 10:29:17", "throughput": 2713.54, "total_tokens": 374700480} {"current_steps": 2076, "total_steps": 9134, "loss": 0.7222, "learning_rate": 4.389322744960895e-05, "epoch": 0.22726401926708448, "percentage": 22.73, "elapsed_time": "1 day, 14:22:31", "remaining_time": "5 days, 10:28:07", "throughput": 2713.42, "total_tokens": 374862432} {"current_steps": 2077, "total_steps": 9134, "loss": 0.7916, "learning_rate": 4.388759522888776e-05, "epoch": 0.2273734913380224, "percentage": 22.74, "elapsed_time": "1 day, 14:23:35", "remaining_time": "5 days, 10:26:53", "throughput": 2713.52, "total_tokens": 375050816} {"current_steps": 2078, "total_steps": 9134, "loss": 0.659, "learning_rate": 4.3881960773800154e-05, "epoch": 0.2274829634089603, "percentage": 22.75, "elapsed_time": "1 day, 14:24:39", "remaining_time": "5 days, 10:25:37", "throughput": 2713.5, "total_tokens": 375220384} {"current_steps": 2079, "total_steps": 9134, "loss": 0.8047, "learning_rate": 4.387632408501269e-05, "epoch": 0.2275924354798982, "percentage": 22.76, "elapsed_time": "1 day, 14:25:46", "remaining_time": "5 days, 10:24:32", "throughput": 2713.63, "total_tokens": 375421312} {"current_steps": 2080, "total_steps": 9134, "loss": 0.8133, "learning_rate": 4.3870685163192165e-05, "epoch": 0.22770190755083608, "percentage": 22.77, "elapsed_time": "1 day, 14:26:49", "remaining_time": "5 days, 10:23:13", "throughput": 2713.58, "total_tokens": 375584384} {"current_steps": 2081, "total_steps": 9134, "loss": 0.6045, "learning_rate": 4.386504400900566e-05, "epoch": 0.227811379621774, "percentage": 22.78, "elapsed_time": "1 day, 14:27:58", "remaining_time": "5 days, 10:22:15", "throughput": 2713.77, "total_tokens": 375797632} {"current_steps": 2082, "total_steps": 9134, "loss": 0.6957, "learning_rate": 4.3859400623120515e-05, "epoch": 0.2279208516927119, "percentage": 22.79, "elapsed_time": "1 day, 14:29:04", "remaining_time": "5 days, 10:21:09", "throughput": 2713.77, "total_tokens": 375979744} {"current_steps": 2083, "total_steps": 9134, "loss": 0.8164, "learning_rate": 4.3853755006204334e-05, "epoch": 0.2280303237636498, "percentage": 22.8, "elapsed_time": "1 day, 14:30:11", "remaining_time": "5 days, 10:20:01", "throughput": 2713.74, "total_tokens": 376154016} {"current_steps": 2084, "total_steps": 9134, "loss": 0.6439, "learning_rate": 4.384810715892498e-05, "epoch": 0.2281397958345877, "percentage": 22.82, "elapsed_time": "1 day, 14:31:20", "remaining_time": "5 days, 10:19:04", "throughput": 2713.69, "total_tokens": 376335904} {"current_steps": 2085, "total_steps": 9134, "loss": 0.6883, "learning_rate": 4.3842457081950575e-05, "epoch": 0.2282492679055256, "percentage": 22.83, "elapsed_time": "1 day, 14:32:25", "remaining_time": "5 days, 10:17:53", "throughput": 2713.73, "total_tokens": 376517568} {"current_steps": 2086, "total_steps": 9134, "loss": 0.6989, "learning_rate": 4.383680477594951e-05, "epoch": 0.2283587399764635, "percentage": 22.84, "elapsed_time": "1 day, 14:33:28", "remaining_time": "5 days, 10:16:33", "throughput": 2713.57, "total_tokens": 376665632} {"current_steps": 2087, "total_steps": 9134, "loss": 0.9081, "learning_rate": 4.3831150241590464e-05, "epoch": 0.22846821204740142, "percentage": 22.85, "elapsed_time": "1 day, 14:34:33", "remaining_time": "5 days, 10:15:21", "throughput": 2713.61, "total_tokens": 376847072} {"current_steps": 2088, "total_steps": 9134, "loss": 0.5016, "learning_rate": 4.382549347954233e-05, "epoch": 0.2285776841183393, "percentage": 22.86, "elapsed_time": "1 day, 14:35:38", "remaining_time": "5 days, 10:14:10", "throughput": 2713.66, "total_tokens": 377031872} {"current_steps": 2089, "total_steps": 9134, "loss": 0.7132, "learning_rate": 4.381983449047432e-05, "epoch": 0.2286871561892772, "percentage": 22.87, "elapsed_time": "1 day, 14:36:43", "remaining_time": "5 days, 10:13:00", "throughput": 2713.66, "total_tokens": 377209728} {"current_steps": 2090, "total_steps": 9134, "loss": 0.7477, "learning_rate": 4.381417327505586e-05, "epoch": 0.2287966282602151, "percentage": 22.88, "elapsed_time": "1 day, 14:37:50", "remaining_time": "5 days, 10:11:52", "throughput": 2713.8, "total_tokens": 377408864} {"current_steps": 2091, "total_steps": 9134, "loss": 0.4857, "learning_rate": 4.3808509833956666e-05, "epoch": 0.22890610033115302, "percentage": 22.89, "elapsed_time": "1 day, 14:38:57", "remaining_time": "5 days, 10:10:48", "throughput": 2713.94, "total_tokens": 377609344} {"current_steps": 2092, "total_steps": 9134, "loss": 0.6178, "learning_rate": 4.380284416784672e-05, "epoch": 0.22901557240209092, "percentage": 22.9, "elapsed_time": "1 day, 14:40:01", "remaining_time": "5 days, 10:09:35", "throughput": 2713.93, "total_tokens": 377783616} {"current_steps": 2093, "total_steps": 9134, "loss": 0.8217, "learning_rate": 4.3797176277396245e-05, "epoch": 0.2291250444730288, "percentage": 22.91, "elapsed_time": "1 day, 14:41:10", "remaining_time": "5 days, 10:08:36", "throughput": 2713.96, "total_tokens": 377975360} {"current_steps": 2094, "total_steps": 9134, "loss": 0.8519, "learning_rate": 4.3791506163275764e-05, "epoch": 0.22923451654396673, "percentage": 22.93, "elapsed_time": "1 day, 14:42:16", "remaining_time": "5 days, 10:07:25", "throughput": 2713.97, "total_tokens": 378153888} {"current_steps": 2095, "total_steps": 9134, "loss": 0.8439, "learning_rate": 4.378583382615601e-05, "epoch": 0.22934398861490463, "percentage": 22.94, "elapsed_time": "1 day, 14:43:21", "remaining_time": "5 days, 10:06:16", "throughput": 2713.87, "total_tokens": 378318528} {"current_steps": 2096, "total_steps": 9134, "loss": 0.682, "learning_rate": 4.378015926670804e-05, "epoch": 0.22945346068584252, "percentage": 22.95, "elapsed_time": "1 day, 14:44:30", "remaining_time": "5 days, 10:05:16", "throughput": 2713.88, "total_tokens": 378505120} {"current_steps": 2097, "total_steps": 9134, "loss": 0.8057, "learning_rate": 4.377448248560313e-05, "epoch": 0.2295629327567804, "percentage": 22.96, "elapsed_time": "1 day, 14:45:38", "remaining_time": "5 days, 10:04:15", "throughput": 2713.85, "total_tokens": 378686560} {"current_steps": 2098, "total_steps": 9134, "loss": 0.7287, "learning_rate": 4.376880348351283e-05, "epoch": 0.22967240482771833, "percentage": 22.97, "elapsed_time": "1 day, 14:46:43", "remaining_time": "5 days, 10:03:02", "throughput": 2713.67, "total_tokens": 378836416} {"current_steps": 2099, "total_steps": 9134, "loss": 0.5919, "learning_rate": 4.376312226110895e-05, "epoch": 0.22978187689865623, "percentage": 22.98, "elapsed_time": "1 day, 14:47:43", "remaining_time": "5 days, 10:01:37", "throughput": 2713.62, "total_tokens": 378994336} {"current_steps": 2100, "total_steps": 9134, "loss": 0.7046, "learning_rate": 4.375743881906359e-05, "epoch": 0.22989134896959412, "percentage": 22.99, "elapsed_time": "1 day, 14:48:46", "remaining_time": "5 days, 10:00:17", "throughput": 2713.51, "total_tokens": 379149568} {"current_steps": 2101, "total_steps": 9134, "loss": 1.1376, "learning_rate": 4.3751753158049065e-05, "epoch": 0.23000082104053204, "percentage": 23.0, "elapsed_time": "1 day, 14:49:52", "remaining_time": "5 days, 9:59:07", "throughput": 2713.5, "total_tokens": 379326304} {"current_steps": 2102, "total_steps": 9134, "loss": 0.7187, "learning_rate": 4.374606527873799e-05, "epoch": 0.23011029311146994, "percentage": 23.01, "elapsed_time": "1 day, 14:51:00", "remaining_time": "5 days, 9:58:08", "throughput": 2713.47, "total_tokens": 379507968} {"current_steps": 2103, "total_steps": 9134, "loss": 0.6193, "learning_rate": 4.3740375181803225e-05, "epoch": 0.23021976518240783, "percentage": 23.02, "elapsed_time": "1 day, 14:52:08", "remaining_time": "5 days, 9:57:06", "throughput": 2713.59, "total_tokens": 379709792} {"current_steps": 2104, "total_steps": 9134, "loss": 0.6533, "learning_rate": 4.373468286791792e-05, "epoch": 0.23032923725334575, "percentage": 23.03, "elapsed_time": "1 day, 14:53:16", "remaining_time": "5 days, 9:56:03", "throughput": 2713.53, "total_tokens": 379883616} {"current_steps": 2105, "total_steps": 9134, "loss": 0.8281, "learning_rate": 4.3728988337755426e-05, "epoch": 0.23043870932428365, "percentage": 23.05, "elapsed_time": "1 day, 14:54:25", "remaining_time": "5 days, 9:55:05", "throughput": 2713.37, "total_tokens": 380048704} {"current_steps": 2106, "total_steps": 9134, "loss": 0.6358, "learning_rate": 4.372329159198943e-05, "epoch": 0.23054818139522154, "percentage": 23.06, "elapsed_time": "1 day, 14:55:33", "remaining_time": "5 days, 9:54:04", "throughput": 2713.46, "total_tokens": 380246720} {"current_steps": 2107, "total_steps": 9134, "loss": 0.7766, "learning_rate": 4.371759263129382e-05, "epoch": 0.23065765346615943, "percentage": 23.07, "elapsed_time": "1 day, 14:56:38", "remaining_time": "5 days, 9:52:51", "throughput": 2713.39, "total_tokens": 380412256} {"current_steps": 2108, "total_steps": 9134, "loss": 0.7225, "learning_rate": 4.371189145634279e-05, "epoch": 0.23076712553709736, "percentage": 23.08, "elapsed_time": "1 day, 14:57:47", "remaining_time": "5 days, 9:51:53", "throughput": 2713.38, "total_tokens": 380597952} {"current_steps": 2109, "total_steps": 9134, "loss": 0.6908, "learning_rate": 4.3706188067810766e-05, "epoch": 0.23087659760803525, "percentage": 23.09, "elapsed_time": "1 day, 14:58:51", "remaining_time": "5 days, 9:50:39", "throughput": 2713.27, "total_tokens": 380758336} {"current_steps": 2110, "total_steps": 9134, "loss": 0.6135, "learning_rate": 4.370048246637246e-05, "epoch": 0.23098606967897314, "percentage": 23.1, "elapsed_time": "1 day, 14:59:57", "remaining_time": "5 days, 9:49:30", "throughput": 2713.38, "total_tokens": 380951648} {"current_steps": 2111, "total_steps": 9134, "loss": 0.7887, "learning_rate": 4.369477465270282e-05, "epoch": 0.23109554174991107, "percentage": 23.11, "elapsed_time": "1 day, 15:01:02", "remaining_time": "5 days, 9:48:19", "throughput": 2713.53, "total_tokens": 381150112} {"current_steps": 2112, "total_steps": 9134, "loss": 0.7214, "learning_rate": 4.3689064627477084e-05, "epoch": 0.23120501382084896, "percentage": 23.12, "elapsed_time": "1 day, 15:02:10", "remaining_time": "5 days, 9:47:17", "throughput": 2713.71, "total_tokens": 381359104} {"current_steps": 2113, "total_steps": 9134, "loss": 0.658, "learning_rate": 4.368335239137073e-05, "epoch": 0.23131448589178685, "percentage": 23.13, "elapsed_time": "1 day, 15:03:16", "remaining_time": "5 days, 9:46:07", "throughput": 2713.72, "total_tokens": 381538080} {"current_steps": 2114, "total_steps": 9134, "loss": 0.6878, "learning_rate": 4.36776379450595e-05, "epoch": 0.23142395796272475, "percentage": 23.14, "elapsed_time": "1 day, 15:04:22", "remaining_time": "5 days, 9:45:01", "throughput": 2713.76, "total_tokens": 381725344} {"current_steps": 2115, "total_steps": 9134, "loss": 0.8352, "learning_rate": 4.3671921289219415e-05, "epoch": 0.23153343003366267, "percentage": 23.16, "elapsed_time": "1 day, 15:05:27", "remaining_time": "5 days, 9:43:48", "throughput": 2713.72, "total_tokens": 381894240} {"current_steps": 2116, "total_steps": 9134, "loss": 0.6355, "learning_rate": 4.3666202424526724e-05, "epoch": 0.23164290210460056, "percentage": 23.17, "elapsed_time": "1 day, 15:06:32", "remaining_time": "5 days, 9:42:38", "throughput": 2713.79, "total_tokens": 382082176} {"current_steps": 2117, "total_steps": 9134, "loss": 0.8084, "learning_rate": 4.366048135165798e-05, "epoch": 0.23175237417553846, "percentage": 23.18, "elapsed_time": "1 day, 15:07:37", "remaining_time": "5 days, 9:41:26", "throughput": 2713.83, "total_tokens": 382264736} {"current_steps": 2118, "total_steps": 9134, "loss": 0.727, "learning_rate": 4.365475807128996e-05, "epoch": 0.23186184624647638, "percentage": 23.19, "elapsed_time": "1 day, 15:08:43", "remaining_time": "5 days, 9:40:18", "throughput": 2713.83, "total_tokens": 382443264} {"current_steps": 2119, "total_steps": 9134, "loss": 0.7689, "learning_rate": 4.364903258409973e-05, "epoch": 0.23197131831741427, "percentage": 23.2, "elapsed_time": "1 day, 15:09:52", "remaining_time": "5 days, 9:39:17", "throughput": 2713.84, "total_tokens": 382629632} {"current_steps": 2120, "total_steps": 9134, "loss": 0.6362, "learning_rate": 4.364330489076458e-05, "epoch": 0.23208079038835217, "percentage": 23.21, "elapsed_time": "1 day, 15:10:53", "remaining_time": "5 days, 9:37:54", "throughput": 2713.83, "total_tokens": 382795840} {"current_steps": 2121, "total_steps": 9134, "loss": 0.7211, "learning_rate": 4.3637574991962113e-05, "epoch": 0.2321902624592901, "percentage": 23.22, "elapsed_time": "1 day, 15:11:55", "remaining_time": "5 days, 9:36:32", "throughput": 2713.77, "total_tokens": 382955104} {"current_steps": 2122, "total_steps": 9134, "loss": 0.8299, "learning_rate": 4.3631842888370154e-05, "epoch": 0.23229973453022798, "percentage": 23.23, "elapsed_time": "1 day, 15:13:02", "remaining_time": "5 days, 9:35:27", "throughput": 2713.89, "total_tokens": 383152896} {"current_steps": 2123, "total_steps": 9134, "loss": 0.6905, "learning_rate": 4.362610858066679e-05, "epoch": 0.23240920660116587, "percentage": 23.24, "elapsed_time": "1 day, 15:14:06", "remaining_time": "5 days, 9:34:13", "throughput": 2713.93, "total_tokens": 383333888} {"current_steps": 2124, "total_steps": 9134, "loss": 0.7238, "learning_rate": 4.3620372069530404e-05, "epoch": 0.23251867867210377, "percentage": 23.25, "elapsed_time": "1 day, 15:15:12", "remaining_time": "5 days, 9:33:04", "throughput": 2713.9, "total_tokens": 383508832} {"current_steps": 2125, "total_steps": 9134, "loss": 0.6629, "learning_rate": 4.361463335563959e-05, "epoch": 0.2326281507430417, "percentage": 23.26, "elapsed_time": "1 day, 15:16:18", "remaining_time": "5 days, 9:31:55", "throughput": 2713.81, "total_tokens": 383673472} {"current_steps": 2126, "total_steps": 9134, "loss": 0.5215, "learning_rate": 4.3608892439673234e-05, "epoch": 0.23273762281397958, "percentage": 23.28, "elapsed_time": "1 day, 15:17:26", "remaining_time": "5 days, 9:30:53", "throughput": 2713.93, "total_tokens": 383874624} {"current_steps": 2127, "total_steps": 9134, "loss": 0.5942, "learning_rate": 4.360314932231048e-05, "epoch": 0.23284709488491748, "percentage": 23.29, "elapsed_time": "1 day, 15:18:31", "remaining_time": "5 days, 9:29:43", "throughput": 2714.03, "total_tokens": 384067936} {"current_steps": 2128, "total_steps": 9134, "loss": 0.5175, "learning_rate": 4.3597404004230714e-05, "epoch": 0.2329565669558554, "percentage": 23.3, "elapsed_time": "1 day, 15:19:37", "remaining_time": "5 days, 9:28:36", "throughput": 2714.07, "total_tokens": 384252064} {"current_steps": 2129, "total_steps": 9134, "loss": 0.7117, "learning_rate": 4.3591656486113616e-05, "epoch": 0.2330660390267933, "percentage": 23.31, "elapsed_time": "1 day, 15:20:45", "remaining_time": "5 days, 9:27:32", "throughput": 2714.11, "total_tokens": 384441120} {"current_steps": 2130, "total_steps": 9134, "loss": 0.6636, "learning_rate": 4.3585906768639095e-05, "epoch": 0.2331755110977312, "percentage": 23.32, "elapsed_time": "1 day, 15:21:51", "remaining_time": "5 days, 9:26:23", "throughput": 2714.14, "total_tokens": 384623232} {"current_steps": 2131, "total_steps": 9134, "loss": 0.7299, "learning_rate": 4.358015485248733e-05, "epoch": 0.23328498316866908, "percentage": 23.33, "elapsed_time": "1 day, 15:22:58", "remaining_time": "5 days, 9:25:21", "throughput": 2714.15, "total_tokens": 384808928} {"current_steps": 2132, "total_steps": 9134, "loss": 0.6303, "learning_rate": 4.357440073833877e-05, "epoch": 0.233394455239607, "percentage": 23.34, "elapsed_time": "1 day, 15:24:00", "remaining_time": "5 days, 9:23:57", "throughput": 2713.97, "total_tokens": 384949376} {"current_steps": 2133, "total_steps": 9134, "loss": 0.8497, "learning_rate": 4.356864442687411e-05, "epoch": 0.2335039273105449, "percentage": 23.35, "elapsed_time": "1 day, 15:25:06", "remaining_time": "5 days, 9:22:49", "throughput": 2714.05, "total_tokens": 385141120} {"current_steps": 2134, "total_steps": 9134, "loss": 0.6641, "learning_rate": 4.356288591877431e-05, "epoch": 0.2336133993814828, "percentage": 23.36, "elapsed_time": "1 day, 15:26:14", "remaining_time": "5 days, 9:21:48", "throughput": 2714.27, "total_tokens": 385357280} {"current_steps": 2135, "total_steps": 9134, "loss": 0.6397, "learning_rate": 4.355712521472059e-05, "epoch": 0.2337228714524207, "percentage": 23.37, "elapsed_time": "1 day, 15:27:20", "remaining_time": "5 days, 9:20:40", "throughput": 2714.23, "total_tokens": 385529984} {"current_steps": 2136, "total_steps": 9134, "loss": 0.8616, "learning_rate": 4.355136231539443e-05, "epoch": 0.2338323435233586, "percentage": 23.39, "elapsed_time": "1 day, 15:28:24", "remaining_time": "5 days, 9:19:26", "throughput": 2714.31, "total_tokens": 385716352} {"current_steps": 2137, "total_steps": 9134, "loss": 0.7354, "learning_rate": 4.3545597221477585e-05, "epoch": 0.2339418155942965, "percentage": 23.4, "elapsed_time": "1 day, 15:29:27", "remaining_time": "5 days, 9:18:07", "throughput": 2714.28, "total_tokens": 385882112} {"current_steps": 2138, "total_steps": 9134, "loss": 0.6767, "learning_rate": 4.353982993365203e-05, "epoch": 0.23405128766523442, "percentage": 23.41, "elapsed_time": "1 day, 15:30:28", "remaining_time": "5 days, 9:16:41", "throughput": 2714.18, "total_tokens": 386033312} {"current_steps": 2139, "total_steps": 9134, "loss": 0.5562, "learning_rate": 4.3534060452600046e-05, "epoch": 0.2341607597361723, "percentage": 23.42, "elapsed_time": "1 day, 15:31:35", "remaining_time": "5 days, 9:15:37", "throughput": 2714.31, "total_tokens": 386233792} {"current_steps": 2140, "total_steps": 9134, "loss": 0.7539, "learning_rate": 4.3528288779004135e-05, "epoch": 0.2342702318071102, "percentage": 23.43, "elapsed_time": "1 day, 15:32:39", "remaining_time": "5 days, 9:14:21", "throughput": 2714.32, "total_tokens": 386407616} {"current_steps": 2141, "total_steps": 9134, "loss": 0.6199, "learning_rate": 4.352251491354708e-05, "epoch": 0.2343797038780481, "percentage": 23.44, "elapsed_time": "1 day, 15:33:41", "remaining_time": "5 days, 9:13:02", "throughput": 2714.25, "total_tokens": 386567776} {"current_steps": 2142, "total_steps": 9134, "loss": 0.6844, "learning_rate": 4.351673885691192e-05, "epoch": 0.23448917594898602, "percentage": 23.45, "elapsed_time": "1 day, 15:34:46", "remaining_time": "5 days, 9:11:50", "throughput": 2714.28, "total_tokens": 386748544} {"current_steps": 2143, "total_steps": 9134, "loss": 0.8967, "learning_rate": 4.3510960609781954e-05, "epoch": 0.23459864801992392, "percentage": 23.46, "elapsed_time": "1 day, 15:35:52", "remaining_time": "5 days, 9:10:42", "throughput": 2714.37, "total_tokens": 386940736} {"current_steps": 2144, "total_steps": 9134, "loss": 0.5102, "learning_rate": 4.350518017284073e-05, "epoch": 0.2347081200908618, "percentage": 23.47, "elapsed_time": "1 day, 15:36:56", "remaining_time": "5 days, 9:09:26", "throughput": 2714.28, "total_tokens": 387100896} {"current_steps": 2145, "total_steps": 9134, "loss": 0.6685, "learning_rate": 4.349939754677208e-05, "epoch": 0.23481759216179973, "percentage": 23.48, "elapsed_time": "1 day, 15:38:05", "remaining_time": "5 days, 9:08:28", "throughput": 2714.43, "total_tokens": 387310112} {"current_steps": 2146, "total_steps": 9134, "loss": 0.6578, "learning_rate": 4.349361273226005e-05, "epoch": 0.23492706423273763, "percentage": 23.49, "elapsed_time": "1 day, 15:39:06", "remaining_time": "5 days, 9:07:02", "throughput": 2714.24, "total_tokens": 387446528} {"current_steps": 2147, "total_steps": 9134, "loss": 0.9187, "learning_rate": 4.3487825729988995e-05, "epoch": 0.23503653630367552, "percentage": 23.51, "elapsed_time": "1 day, 15:40:14", "remaining_time": "5 days, 9:06:00", "throughput": 2714.38, "total_tokens": 387650816} {"current_steps": 2148, "total_steps": 9134, "loss": 0.6088, "learning_rate": 4.34820365406435e-05, "epoch": 0.2351460083746134, "percentage": 23.52, "elapsed_time": "1 day, 15:41:18", "remaining_time": "5 days, 9:04:46", "throughput": 2714.26, "total_tokens": 387808288} {"current_steps": 2149, "total_steps": 9134, "loss": 0.7736, "learning_rate": 4.347624516490841e-05, "epoch": 0.23525548044555133, "percentage": 23.53, "elapsed_time": "1 day, 15:42:26", "remaining_time": "5 days, 9:03:45", "throughput": 2714.42, "total_tokens": 388017056} {"current_steps": 2150, "total_steps": 9134, "loss": 0.7928, "learning_rate": 4.3470451603468836e-05, "epoch": 0.23536495251648923, "percentage": 23.54, "elapsed_time": "1 day, 15:43:35", "remaining_time": "5 days, 9:02:47", "throughput": 2714.52, "total_tokens": 388217760} {"current_steps": 2151, "total_steps": 9134, "loss": 0.7631, "learning_rate": 4.346465585701015e-05, "epoch": 0.23547442458742712, "percentage": 23.55, "elapsed_time": "1 day, 15:44:39", "remaining_time": "5 days, 9:01:31", "throughput": 2714.42, "total_tokens": 388377248} {"current_steps": 2152, "total_steps": 9134, "loss": 0.7203, "learning_rate": 4.345885792621798e-05, "epoch": 0.23558389665836504, "percentage": 23.56, "elapsed_time": "1 day, 15:45:46", "remaining_time": "5 days, 9:00:27", "throughput": 2714.56, "total_tokens": 388578848} {"current_steps": 2153, "total_steps": 9134, "loss": 0.7063, "learning_rate": 4.34530578117782e-05, "epoch": 0.23569336872930294, "percentage": 23.57, "elapsed_time": "1 day, 15:46:53", "remaining_time": "5 days, 8:59:23", "throughput": 2714.54, "total_tokens": 388758720} {"current_steps": 2154, "total_steps": 9134, "loss": 0.6471, "learning_rate": 4.344725551437695e-05, "epoch": 0.23580284080024083, "percentage": 23.58, "elapsed_time": "1 day, 15:47:58", "remaining_time": "5 days, 8:58:11", "throughput": 2714.52, "total_tokens": 388932544} {"current_steps": 2155, "total_steps": 9134, "loss": 0.699, "learning_rate": 4.344145103470065e-05, "epoch": 0.23591231287117875, "percentage": 23.59, "elapsed_time": "1 day, 15:49:06", "remaining_time": "5 days, 8:57:09", "throughput": 2714.53, "total_tokens": 389117792} {"current_steps": 2156, "total_steps": 9134, "loss": 0.8703, "learning_rate": 4.343564437343594e-05, "epoch": 0.23602178494211665, "percentage": 23.6, "elapsed_time": "1 day, 15:50:12", "remaining_time": "5 days, 8:56:01", "throughput": 2714.47, "total_tokens": 389288256} {"current_steps": 2157, "total_steps": 9134, "loss": 0.5769, "learning_rate": 4.342983553126974e-05, "epoch": 0.23613125701305454, "percentage": 23.62, "elapsed_time": "1 day, 15:51:15", "remaining_time": "5 days, 8:54:43", "throughput": 2714.5, "total_tokens": 389463200} {"current_steps": 2158, "total_steps": 9134, "loss": 0.8318, "learning_rate": 4.342402450888924e-05, "epoch": 0.23624072908399243, "percentage": 23.63, "elapsed_time": "1 day, 15:52:24", "remaining_time": "5 days, 8:53:43", "throughput": 2714.76, "total_tokens": 389688320} {"current_steps": 2159, "total_steps": 9134, "loss": 0.6685, "learning_rate": 4.341821130698185e-05, "epoch": 0.23635020115493036, "percentage": 23.64, "elapsed_time": "1 day, 15:53:30", "remaining_time": "5 days, 8:52:35", "throughput": 2714.89, "total_tokens": 389885664} {"current_steps": 2160, "total_steps": 9134, "loss": 1.1616, "learning_rate": 4.341239592623527e-05, "epoch": 0.23645967322586825, "percentage": 23.65, "elapsed_time": "1 day, 15:54:36", "remaining_time": "5 days, 8:51:28", "throughput": 2715.03, "total_tokens": 390085696} {"current_steps": 2161, "total_steps": 9134, "loss": 0.6276, "learning_rate": 4.3406578367337466e-05, "epoch": 0.23656914529680614, "percentage": 23.66, "elapsed_time": "1 day, 15:55:42", "remaining_time": "5 days, 8:50:19", "throughput": 2715.05, "total_tokens": 390266688} {"current_steps": 2162, "total_steps": 9134, "loss": 0.7528, "learning_rate": 4.340075863097662e-05, "epoch": 0.23667861736774407, "percentage": 23.67, "elapsed_time": "1 day, 15:56:51", "remaining_time": "5 days, 8:49:20", "throughput": 2715.26, "total_tokens": 390484640} {"current_steps": 2163, "total_steps": 9134, "loss": 0.7423, "learning_rate": 4.33949367178412e-05, "epoch": 0.23678808943868196, "percentage": 23.68, "elapsed_time": "1 day, 15:57:55", "remaining_time": "5 days, 8:48:08", "throughput": 2715.23, "total_tokens": 390656000} {"current_steps": 2164, "total_steps": 9134, "loss": 0.5792, "learning_rate": 4.338911262861993e-05, "epoch": 0.23689756150961985, "percentage": 23.69, "elapsed_time": "1 day, 15:58:58", "remaining_time": "5 days, 8:46:51", "throughput": 2715.21, "total_tokens": 390824000} {"current_steps": 2165, "total_steps": 9134, "loss": 0.5947, "learning_rate": 4.3383286364001794e-05, "epoch": 0.23700703358055775, "percentage": 23.7, "elapsed_time": "1 day, 16:00:06", "remaining_time": "5 days, 8:45:46", "throughput": 2715.16, "total_tokens": 391000064} {"current_steps": 2166, "total_steps": 9134, "loss": 0.677, "learning_rate": 4.337745792467604e-05, "epoch": 0.23711650565149567, "percentage": 23.71, "elapsed_time": "1 day, 16:01:09", "remaining_time": "5 days, 8:44:31", "throughput": 2715.16, "total_tokens": 391172544} {"current_steps": 2167, "total_steps": 9134, "loss": 0.6756, "learning_rate": 4.337162731133212e-05, "epoch": 0.23722597772243356, "percentage": 23.72, "elapsed_time": "1 day, 16:02:14", "remaining_time": "5 days, 8:43:19", "throughput": 2715.07, "total_tokens": 391335392} {"current_steps": 2168, "total_steps": 9134, "loss": 0.6934, "learning_rate": 4.336579452465982e-05, "epoch": 0.23733544979337146, "percentage": 23.74, "elapsed_time": "1 day, 16:03:18", "remaining_time": "5 days, 8:42:05", "throughput": 2714.88, "total_tokens": 391483232} {"current_steps": 2169, "total_steps": 9134, "loss": 0.6566, "learning_rate": 4.335995956534914e-05, "epoch": 0.23744492186430938, "percentage": 23.75, "elapsed_time": "1 day, 16:04:23", "remaining_time": "5 days, 8:40:52", "throughput": 2714.94, "total_tokens": 391667136} {"current_steps": 2170, "total_steps": 9134, "loss": 0.7516, "learning_rate": 4.335412243409034e-05, "epoch": 0.23755439393524727, "percentage": 23.76, "elapsed_time": "1 day, 16:05:25", "remaining_time": "5 days, 8:39:31", "throughput": 2714.83, "total_tokens": 391818784} {"current_steps": 2171, "total_steps": 9134, "loss": 0.5706, "learning_rate": 4.3348283131573944e-05, "epoch": 0.23766386600618516, "percentage": 23.77, "elapsed_time": "1 day, 16:06:26", "remaining_time": "5 days, 8:38:07", "throughput": 2714.77, "total_tokens": 391975360} {"current_steps": 2172, "total_steps": 9134, "loss": 0.7973, "learning_rate": 4.3342441658490724e-05, "epoch": 0.2377733380771231, "percentage": 23.78, "elapsed_time": "1 day, 16:07:32", "remaining_time": "5 days, 8:36:59", "throughput": 2714.7, "total_tokens": 392146048} {"current_steps": 2173, "total_steps": 9134, "loss": 0.7025, "learning_rate": 4.333659801553173e-05, "epoch": 0.23788281014806098, "percentage": 23.79, "elapsed_time": "1 day, 16:08:36", "remaining_time": "5 days, 8:35:44", "throughput": 2714.63, "total_tokens": 392308672} {"current_steps": 2174, "total_steps": 9134, "loss": 0.8281, "learning_rate": 4.3330752203388234e-05, "epoch": 0.23799228221899887, "percentage": 23.8, "elapsed_time": "1 day, 16:09:44", "remaining_time": "5 days, 8:34:41", "throughput": 2714.71, "total_tokens": 392503104} {"current_steps": 2175, "total_steps": 9134, "loss": 0.8117, "learning_rate": 4.3324904222751796e-05, "epoch": 0.23810175428993677, "percentage": 23.81, "elapsed_time": "1 day, 16:10:50", "remaining_time": "5 days, 8:33:34", "throughput": 2714.71, "total_tokens": 392684096} {"current_steps": 2176, "total_steps": 9134, "loss": 0.6373, "learning_rate": 4.331905407431422e-05, "epoch": 0.2382112263608747, "percentage": 23.82, "elapsed_time": "1 day, 16:11:57", "remaining_time": "5 days, 8:32:29", "throughput": 2714.75, "total_tokens": 392870912} {"current_steps": 2177, "total_steps": 9134, "loss": 0.6628, "learning_rate": 4.3313201758767574e-05, "epoch": 0.23832069843181258, "percentage": 23.83, "elapsed_time": "1 day, 16:13:03", "remaining_time": "5 days, 8:31:20", "throughput": 2714.81, "total_tokens": 393057952} {"current_steps": 2178, "total_steps": 9134, "loss": 0.8184, "learning_rate": 4.330734727680417e-05, "epoch": 0.23843017050275048, "percentage": 23.84, "elapsed_time": "1 day, 16:14:11", "remaining_time": "5 days, 8:30:21", "throughput": 2714.92, "total_tokens": 393260896} {"current_steps": 2179, "total_steps": 9134, "loss": 0.7815, "learning_rate": 4.330149062911657e-05, "epoch": 0.2385396425736884, "percentage": 23.86, "elapsed_time": "1 day, 16:15:16", "remaining_time": "5 days, 8:29:09", "throughput": 2714.92, "total_tokens": 393437408} {"current_steps": 2180, "total_steps": 9134, "loss": 0.8418, "learning_rate": 4.3295631816397626e-05, "epoch": 0.2386491146446263, "percentage": 23.87, "elapsed_time": "1 day, 16:16:25", "remaining_time": "5 days, 8:28:09", "throughput": 2714.97, "total_tokens": 393630272} {"current_steps": 2181, "total_steps": 9134, "loss": 0.743, "learning_rate": 4.32897708393404e-05, "epoch": 0.23875858671556419, "percentage": 23.88, "elapsed_time": "1 day, 16:17:33", "remaining_time": "5 days, 8:27:08", "throughput": 2715.08, "total_tokens": 393832320} {"current_steps": 2182, "total_steps": 9134, "loss": 0.6785, "learning_rate": 4.328390769863826e-05, "epoch": 0.23886805878650208, "percentage": 23.89, "elapsed_time": "1 day, 16:18:41", "remaining_time": "5 days, 8:26:08", "throughput": 2715.11, "total_tokens": 394022048} {"current_steps": 2183, "total_steps": 9134, "loss": 0.6435, "learning_rate": 4.327804239498479e-05, "epoch": 0.23897753085744, "percentage": 23.9, "elapsed_time": "1 day, 16:19:49", "remaining_time": "5 days, 8:25:04", "throughput": 2715.06, "total_tokens": 394197216} {"current_steps": 2184, "total_steps": 9134, "loss": 0.7714, "learning_rate": 4.3272174929073846e-05, "epoch": 0.2390870029283779, "percentage": 23.91, "elapsed_time": "1 day, 16:20:50", "remaining_time": "5 days, 8:23:42", "throughput": 2715.0, "total_tokens": 394355584} {"current_steps": 2185, "total_steps": 9134, "loss": 0.6722, "learning_rate": 4.326630530159954e-05, "epoch": 0.2391964749993158, "percentage": 23.92, "elapsed_time": "1 day, 16:21:54", "remaining_time": "5 days, 8:22:28", "throughput": 2715.06, "total_tokens": 394539488} {"current_steps": 2186, "total_steps": 9134, "loss": 0.8328, "learning_rate": 4.3260433513256227e-05, "epoch": 0.2393059470702537, "percentage": 23.93, "elapsed_time": "1 day, 16:23:03", "remaining_time": "5 days, 8:21:28", "throughput": 2715.11, "total_tokens": 394732800} {"current_steps": 2187, "total_steps": 9134, "loss": 0.6082, "learning_rate": 4.325455956473854e-05, "epoch": 0.2394154191411916, "percentage": 23.94, "elapsed_time": "1 day, 16:24:11", "remaining_time": "5 days, 8:20:25", "throughput": 2715.18, "total_tokens": 394925888} {"current_steps": 2188, "total_steps": 9134, "loss": 0.7465, "learning_rate": 4.324868345674136e-05, "epoch": 0.2395248912121295, "percentage": 23.95, "elapsed_time": "1 day, 16:25:19", "remaining_time": "5 days, 8:19:24", "throughput": 2715.01, "total_tokens": 395087168} {"current_steps": 2189, "total_steps": 9134, "loss": 0.6871, "learning_rate": 4.324280518995981e-05, "epoch": 0.23963436328306742, "percentage": 23.97, "elapsed_time": "1 day, 16:26:23", "remaining_time": "5 days, 8:18:09", "throughput": 2714.97, "total_tokens": 395254720} {"current_steps": 2190, "total_steps": 9134, "loss": 0.8124, "learning_rate": 4.3236924765089284e-05, "epoch": 0.2397438353540053, "percentage": 23.98, "elapsed_time": "1 day, 16:27:28", "remaining_time": "5 days, 8:16:59", "throughput": 2714.87, "total_tokens": 395418016} {"current_steps": 2191, "total_steps": 9134, "loss": 0.7596, "learning_rate": 4.323104218282542e-05, "epoch": 0.2398533074249432, "percentage": 23.99, "elapsed_time": "1 day, 16:28:32", "remaining_time": "5 days, 8:15:44", "throughput": 2714.88, "total_tokens": 395592064} {"current_steps": 2192, "total_steps": 9134, "loss": 0.8633, "learning_rate": 4.322515744386411e-05, "epoch": 0.2399627794958811, "percentage": 24.0, "elapsed_time": "1 day, 16:29:37", "remaining_time": "5 days, 8:14:32", "throughput": 2714.89, "total_tokens": 395768576} {"current_steps": 2193, "total_steps": 9134, "loss": 0.7009, "learning_rate": 4.321927054890153e-05, "epoch": 0.24007225156681902, "percentage": 24.01, "elapsed_time": "1 day, 16:30:46", "remaining_time": "5 days, 8:13:33", "throughput": 2714.93, "total_tokens": 395962336} {"current_steps": 2194, "total_steps": 9134, "loss": 0.871, "learning_rate": 4.3213381498634056e-05, "epoch": 0.24018172363775692, "percentage": 24.02, "elapsed_time": "1 day, 16:31:55", "remaining_time": "5 days, 8:12:35", "throughput": 2714.99, "total_tokens": 396158784} {"current_steps": 2195, "total_steps": 9134, "loss": 0.8203, "learning_rate": 4.3207490293758374e-05, "epoch": 0.2402911957086948, "percentage": 24.03, "elapsed_time": "1 day, 16:33:01", "remaining_time": "5 days, 8:11:28", "throughput": 2715.0, "total_tokens": 396340672} {"current_steps": 2196, "total_steps": 9134, "loss": 0.6214, "learning_rate": 4.32015969349714e-05, "epoch": 0.24040066777963273, "percentage": 24.04, "elapsed_time": "1 day, 16:34:07", "remaining_time": "5 days, 8:10:19", "throughput": 2714.99, "total_tokens": 396516736} {"current_steps": 2197, "total_steps": 9134, "loss": 0.6514, "learning_rate": 4.31957014229703e-05, "epoch": 0.24051013985057063, "percentage": 24.05, "elapsed_time": "1 day, 16:35:13", "remaining_time": "5 days, 8:09:11", "throughput": 2715.01, "total_tokens": 396698848} {"current_steps": 2198, "total_steps": 9134, "loss": 0.7347, "learning_rate": 4.3189803758452504e-05, "epoch": 0.24061961192150852, "percentage": 24.06, "elapsed_time": "1 day, 16:36:19", "remaining_time": "5 days, 8:08:02", "throughput": 2715.12, "total_tokens": 396894400} {"current_steps": 2199, "total_steps": 9134, "loss": 0.8095, "learning_rate": 4.318390394211571e-05, "epoch": 0.24072908399244644, "percentage": 24.07, "elapsed_time": "1 day, 16:37:24", "remaining_time": "5 days, 8:06:51", "throughput": 2715.12, "total_tokens": 397070912} {"current_steps": 2200, "total_steps": 9134, "loss": 0.6231, "learning_rate": 4.3178001974657836e-05, "epoch": 0.24083855606338433, "percentage": 24.09, "elapsed_time": "1 day, 16:38:29", "remaining_time": "5 days, 8:05:41", "throughput": 2714.96, "total_tokens": 397223904} {"current_steps": 2201, "total_steps": 9134, "loss": 0.8237, "learning_rate": 4.317209785677707e-05, "epoch": 0.24094802813432223, "percentage": 24.1, "elapsed_time": "1 day, 16:39:37", "remaining_time": "5 days, 8:04:38", "throughput": 2715.12, "total_tokens": 397432224} {"current_steps": 2202, "total_steps": 9134, "loss": 0.767, "learning_rate": 4.3166191589171875e-05, "epoch": 0.24105750020526012, "percentage": 24.11, "elapsed_time": "1 day, 16:40:45", "remaining_time": "5 days, 8:03:35", "throughput": 2715.25, "total_tokens": 397635616} {"current_steps": 2203, "total_steps": 9134, "loss": 0.7334, "learning_rate": 4.316028317254094e-05, "epoch": 0.24116697227619804, "percentage": 24.12, "elapsed_time": "1 day, 16:41:53", "remaining_time": "5 days, 8:02:36", "throughput": 2715.36, "total_tokens": 397838112} {"current_steps": 2204, "total_steps": 9134, "loss": 0.6005, "learning_rate": 4.315437260758322e-05, "epoch": 0.24127644434713594, "percentage": 24.13, "elapsed_time": "1 day, 16:42:59", "remaining_time": "5 days, 8:01:28", "throughput": 2715.37, "total_tokens": 398018432} {"current_steps": 2205, "total_steps": 9134, "loss": 1.0094, "learning_rate": 4.3148459894997926e-05, "epoch": 0.24138591641807383, "percentage": 24.14, "elapsed_time": "1 day, 16:44:07", "remaining_time": "5 days, 8:00:26", "throughput": 2715.36, "total_tokens": 398202112} {"current_steps": 2206, "total_steps": 9134, "loss": 0.9189, "learning_rate": 4.3142545035484526e-05, "epoch": 0.24149538848901175, "percentage": 24.15, "elapsed_time": "1 day, 16:45:12", "remaining_time": "5 days, 7:59:13", "throughput": 2715.35, "total_tokens": 398374592} {"current_steps": 2207, "total_steps": 9134, "loss": 0.9183, "learning_rate": 4.3136628029742735e-05, "epoch": 0.24160486055994965, "percentage": 24.16, "elapsed_time": "1 day, 16:46:20", "remaining_time": "5 days, 7:58:12", "throughput": 2715.45, "total_tokens": 398574848} {"current_steps": 2208, "total_steps": 9134, "loss": 0.6346, "learning_rate": 4.3130708878472505e-05, "epoch": 0.24171433263088754, "percentage": 24.17, "elapsed_time": "1 day, 16:47:24", "remaining_time": "5 days, 7:56:57", "throughput": 2715.38, "total_tokens": 398737472} {"current_steps": 2209, "total_steps": 9134, "loss": 0.6345, "learning_rate": 4.312478758237408e-05, "epoch": 0.24182380470182543, "percentage": 24.18, "elapsed_time": "1 day, 16:48:28", "remaining_time": "5 days, 7:55:42", "throughput": 2715.36, "total_tokens": 398908160} {"current_steps": 2210, "total_steps": 9134, "loss": 0.6804, "learning_rate": 4.3118864142147944e-05, "epoch": 0.24193327677276336, "percentage": 24.2, "elapsed_time": "1 day, 16:49:35", "remaining_time": "5 days, 7:54:40", "throughput": 2715.49, "total_tokens": 399111552} {"current_steps": 2211, "total_steps": 9134, "loss": 0.9816, "learning_rate": 4.31129385584948e-05, "epoch": 0.24204274884370125, "percentage": 24.21, "elapsed_time": "1 day, 16:50:39", "remaining_time": "5 days, 7:53:25", "throughput": 2715.45, "total_tokens": 399280000} {"current_steps": 2212, "total_steps": 9134, "loss": 0.7062, "learning_rate": 4.310701083211566e-05, "epoch": 0.24215222091463914, "percentage": 24.22, "elapsed_time": "1 day, 16:51:44", "remaining_time": "5 days, 7:52:13", "throughput": 2715.31, "total_tokens": 399433664} {"current_steps": 2213, "total_steps": 9134, "loss": 0.6091, "learning_rate": 4.310108096371175e-05, "epoch": 0.24226169298557707, "percentage": 24.23, "elapsed_time": "1 day, 16:52:47", "remaining_time": "5 days, 7:50:57", "throughput": 2715.37, "total_tokens": 399615328} {"current_steps": 2214, "total_steps": 9134, "loss": 0.803, "learning_rate": 4.309514895398456e-05, "epoch": 0.24237116505651496, "percentage": 24.24, "elapsed_time": "1 day, 16:53:49", "remaining_time": "5 days, 7:49:35", "throughput": 2715.33, "total_tokens": 399776160} {"current_steps": 2215, "total_steps": 9134, "loss": 0.7244, "learning_rate": 4.308921480363586e-05, "epoch": 0.24248063712745285, "percentage": 24.25, "elapsed_time": "1 day, 16:54:52", "remaining_time": "5 days, 7:48:17", "throughput": 2715.32, "total_tokens": 399945728} {"current_steps": 2216, "total_steps": 9134, "loss": 0.6973, "learning_rate": 4.308327851336762e-05, "epoch": 0.24259010919839077, "percentage": 24.26, "elapsed_time": "1 day, 16:55:55", "remaining_time": "5 days, 7:47:00", "throughput": 2715.27, "total_tokens": 400110368} {"current_steps": 2217, "total_steps": 9134, "loss": 0.8851, "learning_rate": 4.307734008388209e-05, "epoch": 0.24269958126932867, "percentage": 24.27, "elapsed_time": "1 day, 16:56:58", "remaining_time": "5 days, 7:45:42", "throughput": 2715.19, "total_tokens": 400268288} {"current_steps": 2218, "total_steps": 9134, "loss": 0.658, "learning_rate": 4.307139951588179e-05, "epoch": 0.24280905334026656, "percentage": 24.28, "elapsed_time": "1 day, 16:58:00", "remaining_time": "5 days, 7:44:23", "throughput": 2715.09, "total_tokens": 400423520} {"current_steps": 2219, "total_steps": 9134, "loss": 0.593, "learning_rate": 4.306545681006949e-05, "epoch": 0.24291852541120446, "percentage": 24.29, "elapsed_time": "1 day, 16:59:05", "remaining_time": "5 days, 7:43:09", "throughput": 2715.04, "total_tokens": 400591072} {"current_steps": 2220, "total_steps": 9134, "loss": 0.8656, "learning_rate": 4.305951196714817e-05, "epoch": 0.24302799748214238, "percentage": 24.3, "elapsed_time": "1 day, 17:00:11", "remaining_time": "5 days, 7:42:02", "throughput": 2715.09, "total_tokens": 400777440} {"current_steps": 2221, "total_steps": 9134, "loss": 0.6704, "learning_rate": 4.305356498782112e-05, "epoch": 0.24313746955308027, "percentage": 24.32, "elapsed_time": "1 day, 17:01:18", "remaining_time": "5 days, 7:40:58", "throughput": 2715.1, "total_tokens": 400961568} {"current_steps": 2222, "total_steps": 9134, "loss": 0.6563, "learning_rate": 4.304761587279183e-05, "epoch": 0.24324694162401816, "percentage": 24.33, "elapsed_time": "1 day, 17:02:22", "remaining_time": "5 days, 7:39:44", "throughput": 2714.93, "total_tokens": 401110976} {"current_steps": 2223, "total_steps": 9134, "loss": 0.6782, "learning_rate": 4.304166462276409e-05, "epoch": 0.2433564136949561, "percentage": 24.34, "elapsed_time": "1 day, 17:03:29", "remaining_time": "5 days, 7:38:39", "throughput": 2715.03, "total_tokens": 401308096} {"current_steps": 2224, "total_steps": 9134, "loss": 0.8364, "learning_rate": 4.303571123844191e-05, "epoch": 0.24346588576589398, "percentage": 24.35, "elapsed_time": "1 day, 17:04:33", "remaining_time": "5 days, 7:37:24", "throughput": 2715.01, "total_tokens": 401477664} {"current_steps": 2225, "total_steps": 9134, "loss": 0.5803, "learning_rate": 4.3029755720529576e-05, "epoch": 0.24357535783683187, "percentage": 24.36, "elapsed_time": "1 day, 17:05:33", "remaining_time": "5 days, 7:35:57", "throughput": 2714.83, "total_tokens": 401613632} {"current_steps": 2226, "total_steps": 9134, "loss": 0.692, "learning_rate": 4.30237980697316e-05, "epoch": 0.24368482990776977, "percentage": 24.37, "elapsed_time": "1 day, 17:06:41", "remaining_time": "5 days, 7:34:56", "throughput": 2714.87, "total_tokens": 401804704} {"current_steps": 2227, "total_steps": 9134, "loss": 0.8151, "learning_rate": 4.3017838286752776e-05, "epoch": 0.2437943019787077, "percentage": 24.38, "elapsed_time": "1 day, 17:07:44", "remaining_time": "5 days, 7:33:37", "throughput": 2714.73, "total_tokens": 401953216} {"current_steps": 2228, "total_steps": 9134, "loss": 0.5109, "learning_rate": 4.301187637229812e-05, "epoch": 0.24390377404964558, "percentage": 24.39, "elapsed_time": "1 day, 17:08:41", "remaining_time": "5 days, 7:32:03", "throughput": 2714.53, "total_tokens": 402080672} {"current_steps": 2229, "total_steps": 9134, "loss": 0.659, "learning_rate": 4.300591232707293e-05, "epoch": 0.24401324612058348, "percentage": 24.4, "elapsed_time": "1 day, 17:09:49", "remaining_time": "5 days, 7:31:01", "throughput": 2714.63, "total_tokens": 402278688} {"current_steps": 2230, "total_steps": 9134, "loss": 0.7858, "learning_rate": 4.2999946151782735e-05, "epoch": 0.2441227181915214, "percentage": 24.41, "elapsed_time": "1 day, 17:10:57", "remaining_time": "5 days, 7:30:00", "throughput": 2714.54, "total_tokens": 402450720} {"current_steps": 2231, "total_steps": 9134, "loss": 0.7344, "learning_rate": 4.29939778471333e-05, "epoch": 0.2442321902624593, "percentage": 24.43, "elapsed_time": "1 day, 17:12:05", "remaining_time": "5 days, 7:28:58", "throughput": 2714.45, "total_tokens": 402622976} {"current_steps": 2232, "total_steps": 9134, "loss": 0.6002, "learning_rate": 4.298800741383071e-05, "epoch": 0.24434166233339719, "percentage": 24.44, "elapsed_time": "1 day, 17:13:12", "remaining_time": "5 days, 7:27:52", "throughput": 2714.57, "total_tokens": 402821440} {"current_steps": 2233, "total_steps": 9134, "loss": 0.5028, "learning_rate": 4.298203485258122e-05, "epoch": 0.2444511344043351, "percentage": 24.45, "elapsed_time": "1 day, 17:14:17", "remaining_time": "5 days, 7:26:42", "throughput": 2714.64, "total_tokens": 403008480} {"current_steps": 2234, "total_steps": 9134, "loss": 0.7309, "learning_rate": 4.2976060164091384e-05, "epoch": 0.244560606475273, "percentage": 24.46, "elapsed_time": "1 day, 17:15:18", "remaining_time": "5 days, 7:25:19", "throughput": 2714.5, "total_tokens": 403154080} {"current_steps": 2235, "total_steps": 9134, "loss": 0.5743, "learning_rate": 4.297008334906798e-05, "epoch": 0.2446700785462109, "percentage": 24.47, "elapsed_time": "1 day, 17:16:26", "remaining_time": "5 days, 7:24:16", "throughput": 2714.48, "total_tokens": 403335296} {"current_steps": 2236, "total_steps": 9134, "loss": 0.76, "learning_rate": 4.2964104408218085e-05, "epoch": 0.2447795506171488, "percentage": 24.48, "elapsed_time": "1 day, 17:17:32", "remaining_time": "5 days, 7:23:08", "throughput": 2714.43, "total_tokens": 403505984} {"current_steps": 2237, "total_steps": 9134, "loss": 0.5893, "learning_rate": 4.295812334224898e-05, "epoch": 0.2448890226880867, "percentage": 24.49, "elapsed_time": "1 day, 17:18:41", "remaining_time": "5 days, 7:22:08", "throughput": 2714.45, "total_tokens": 403695712} {"current_steps": 2238, "total_steps": 9134, "loss": 0.6426, "learning_rate": 4.2952140151868204e-05, "epoch": 0.2449984947590246, "percentage": 24.5, "elapsed_time": "1 day, 17:19:49", "remaining_time": "5 days, 7:21:08", "throughput": 2714.52, "total_tokens": 403891264} {"current_steps": 2239, "total_steps": 9134, "loss": 0.5291, "learning_rate": 4.294615483778358e-05, "epoch": 0.2451079668299625, "percentage": 24.51, "elapsed_time": "1 day, 17:20:50", "remaining_time": "5 days, 7:19:45", "throughput": 2714.43, "total_tokens": 404044480} {"current_steps": 2240, "total_steps": 9134, "loss": 0.7297, "learning_rate": 4.2940167400703134e-05, "epoch": 0.24521743890090042, "percentage": 24.52, "elapsed_time": "1 day, 17:21:56", "remaining_time": "5 days, 7:18:38", "throughput": 2714.36, "total_tokens": 404213824} {"current_steps": 2241, "total_steps": 9134, "loss": 0.9402, "learning_rate": 4.293417784133519e-05, "epoch": 0.2453269109718383, "percentage": 24.53, "elapsed_time": "1 day, 17:23:00", "remaining_time": "5 days, 7:17:23", "throughput": 2714.34, "total_tokens": 404383840} {"current_steps": 2242, "total_steps": 9134, "loss": 0.6448, "learning_rate": 4.2928186160388286e-05, "epoch": 0.2454363830427762, "percentage": 24.55, "elapsed_time": "1 day, 17:24:05", "remaining_time": "5 days, 7:16:11", "throughput": 2714.28, "total_tokens": 404550720} {"current_steps": 2243, "total_steps": 9134, "loss": 0.5925, "learning_rate": 4.292219235857123e-05, "epoch": 0.2455458551137141, "percentage": 24.56, "elapsed_time": "1 day, 17:25:10", "remaining_time": "5 days, 7:15:02", "throughput": 2714.28, "total_tokens": 404729472} {"current_steps": 2244, "total_steps": 9134, "loss": 0.6788, "learning_rate": 4.291619643659308e-05, "epoch": 0.24565532718465202, "percentage": 24.57, "elapsed_time": "1 day, 17:26:15", "remaining_time": "5 days, 7:13:49", "throughput": 2714.29, "total_tokens": 404905760} {"current_steps": 2245, "total_steps": 9134, "loss": 0.5877, "learning_rate": 4.291019839516314e-05, "epoch": 0.24576479925558992, "percentage": 24.58, "elapsed_time": "1 day, 17:27:22", "remaining_time": "5 days, 7:12:44", "throughput": 2714.41, "total_tokens": 405104672} {"current_steps": 2246, "total_steps": 9134, "loss": 0.8504, "learning_rate": 4.290419823499098e-05, "epoch": 0.2458742713265278, "percentage": 24.59, "elapsed_time": "1 day, 17:28:30", "remaining_time": "5 days, 7:11:43", "throughput": 2714.35, "total_tokens": 405281184} {"current_steps": 2247, "total_steps": 9134, "loss": 0.8372, "learning_rate": 4.289819595678638e-05, "epoch": 0.24598374339746573, "percentage": 24.6, "elapsed_time": "1 day, 17:29:35", "remaining_time": "5 days, 7:10:32", "throughput": 2714.34, "total_tokens": 405455680} {"current_steps": 2248, "total_steps": 9134, "loss": 0.7548, "learning_rate": 4.289219156125942e-05, "epoch": 0.24609321546840363, "percentage": 24.61, "elapsed_time": "1 day, 17:30:41", "remaining_time": "5 days, 7:09:24", "throughput": 2714.35, "total_tokens": 405636672} {"current_steps": 2249, "total_steps": 9134, "loss": 0.7107, "learning_rate": 4.288618504912041e-05, "epoch": 0.24620268753934152, "percentage": 24.62, "elapsed_time": "1 day, 17:31:48", "remaining_time": "5 days, 7:08:19", "throughput": 2714.4, "total_tokens": 405825952} {"current_steps": 2250, "total_steps": 9134, "loss": 0.5628, "learning_rate": 4.2880176421079896e-05, "epoch": 0.24631215961027944, "percentage": 24.63, "elapsed_time": "1 day, 17:32:50", "remaining_time": "5 days, 7:06:59", "throughput": 2714.23, "total_tokens": 405968864} {"current_steps": 2251, "total_steps": 9134, "loss": 0.6264, "learning_rate": 4.287416567784869e-05, "epoch": 0.24642163168121733, "percentage": 24.64, "elapsed_time": "1 day, 17:33:56", "remaining_time": "5 days, 7:05:50", "throughput": 2714.31, "total_tokens": 406159264} {"current_steps": 2252, "total_steps": 9134, "loss": 0.7524, "learning_rate": 4.2868152820137855e-05, "epoch": 0.24653110375215523, "percentage": 24.66, "elapsed_time": "1 day, 17:35:00", "remaining_time": "5 days, 7:04:35", "throughput": 2714.33, "total_tokens": 406335328} {"current_steps": 2253, "total_steps": 9134, "loss": 0.6801, "learning_rate": 4.28621378486587e-05, "epoch": 0.24664057582309312, "percentage": 24.67, "elapsed_time": "1 day, 17:36:05", "remaining_time": "5 days, 7:03:26", "throughput": 2714.3, "total_tokens": 406509152} {"current_steps": 2254, "total_steps": 9134, "loss": 0.8152, "learning_rate": 4.285612076412279e-05, "epoch": 0.24675004789403104, "percentage": 24.68, "elapsed_time": "1 day, 17:37:09", "remaining_time": "5 days, 7:02:13", "throughput": 2714.38, "total_tokens": 406694176} {"current_steps": 2255, "total_steps": 9134, "loss": 0.5984, "learning_rate": 4.285010156724192e-05, "epoch": 0.24685951996496894, "percentage": 24.69, "elapsed_time": "1 day, 17:38:18", "remaining_time": "5 days, 7:01:12", "throughput": 2714.55, "total_tokens": 406907200} {"current_steps": 2256, "total_steps": 9134, "loss": 0.7221, "learning_rate": 4.2844080258728156e-05, "epoch": 0.24696899203590683, "percentage": 24.7, "elapsed_time": "1 day, 17:39:25", "remaining_time": "5 days, 7:00:08", "throughput": 2714.55, "total_tokens": 407088864} {"current_steps": 2257, "total_steps": 9134, "loss": 0.7122, "learning_rate": 4.2838056839293816e-05, "epoch": 0.24707846410684475, "percentage": 24.71, "elapsed_time": "1 day, 17:40:28", "remaining_time": "5 days, 6:58:52", "throughput": 2714.5, "total_tokens": 407253728} {"current_steps": 2258, "total_steps": 9134, "loss": 0.8215, "learning_rate": 4.283203130965145e-05, "epoch": 0.24718793617778265, "percentage": 24.72, "elapsed_time": "1 day, 17:41:30", "remaining_time": "5 days, 6:57:31", "throughput": 2714.51, "total_tokens": 407422624} {"current_steps": 2259, "total_steps": 9134, "loss": 0.7149, "learning_rate": 4.282600367051387e-05, "epoch": 0.24729740824872054, "percentage": 24.73, "elapsed_time": "1 day, 17:42:30", "remaining_time": "5 days, 6:56:04", "throughput": 2714.27, "total_tokens": 407548960} {"current_steps": 2260, "total_steps": 9134, "loss": 0.6445, "learning_rate": 4.2819973922594134e-05, "epoch": 0.24740688031965843, "percentage": 24.74, "elapsed_time": "1 day, 17:43:37", "remaining_time": "5 days, 6:54:59", "throughput": 2714.33, "total_tokens": 407739584} {"current_steps": 2261, "total_steps": 9134, "loss": 0.7869, "learning_rate": 4.281394206660555e-05, "epoch": 0.24751635239059636, "percentage": 24.75, "elapsed_time": "1 day, 17:44:43", "remaining_time": "5 days, 6:53:52", "throughput": 2714.42, "total_tokens": 407932448} {"current_steps": 2262, "total_steps": 9134, "loss": 0.6026, "learning_rate": 4.2807908103261674e-05, "epoch": 0.24762582446153425, "percentage": 24.76, "elapsed_time": "1 day, 17:45:48", "remaining_time": "5 days, 6:52:42", "throughput": 2714.31, "total_tokens": 408093056} {"current_steps": 2263, "total_steps": 9134, "loss": 0.8459, "learning_rate": 4.280187203327631e-05, "epoch": 0.24773529653247214, "percentage": 24.78, "elapsed_time": "1 day, 17:46:54", "remaining_time": "5 days, 6:51:35", "throughput": 2714.32, "total_tokens": 408274048} {"current_steps": 2264, "total_steps": 9134, "loss": 0.6728, "learning_rate": 4.2795833857363515e-05, "epoch": 0.24784476860341006, "percentage": 24.79, "elapsed_time": "1 day, 17:47:57", "remaining_time": "5 days, 6:50:17", "throughput": 2714.25, "total_tokens": 408434432} {"current_steps": 2265, "total_steps": 9134, "loss": 0.6107, "learning_rate": 4.2789793576237594e-05, "epoch": 0.24795424067434796, "percentage": 24.8, "elapsed_time": "1 day, 17:49:06", "remaining_time": "5 days, 6:49:17", "throughput": 2714.26, "total_tokens": 408621024} {"current_steps": 2266, "total_steps": 9134, "loss": 0.6844, "learning_rate": 4.278375119061311e-05, "epoch": 0.24806371274528585, "percentage": 24.81, "elapsed_time": "1 day, 17:50:09", "remaining_time": "5 days, 6:48:00", "throughput": 2714.31, "total_tokens": 408799776} {"current_steps": 2267, "total_steps": 9134, "loss": 0.7267, "learning_rate": 4.2777706701204846e-05, "epoch": 0.24817318481622377, "percentage": 24.82, "elapsed_time": "1 day, 17:51:15", "remaining_time": "5 days, 6:46:52", "throughput": 2714.44, "total_tokens": 408999360} {"current_steps": 2268, "total_steps": 9134, "loss": 0.7287, "learning_rate": 4.277166010872787e-05, "epoch": 0.24828265688716167, "percentage": 24.83, "elapsed_time": "1 day, 17:52:20", "remaining_time": "5 days, 6:45:42", "throughput": 2714.38, "total_tokens": 409167584} {"current_steps": 2269, "total_steps": 9134, "loss": 0.8652, "learning_rate": 4.276561141389748e-05, "epoch": 0.24839212895809956, "percentage": 24.84, "elapsed_time": "1 day, 17:53:29", "remaining_time": "5 days, 6:44:43", "throughput": 2714.48, "total_tokens": 409370080} {"current_steps": 2270, "total_steps": 9134, "loss": 0.5777, "learning_rate": 4.275956061742921e-05, "epoch": 0.24850160102903746, "percentage": 24.85, "elapsed_time": "1 day, 17:54:31", "remaining_time": "5 days, 6:43:23", "throughput": 2714.47, "total_tokens": 409536064} {"current_steps": 2271, "total_steps": 9134, "loss": 0.7637, "learning_rate": 4.275350772003888e-05, "epoch": 0.24861107309997538, "percentage": 24.86, "elapsed_time": "1 day, 17:55:34", "remaining_time": "5 days, 6:42:05", "throughput": 2714.36, "total_tokens": 409689952} {"current_steps": 2272, "total_steps": 9134, "loss": 0.9454, "learning_rate": 4.2747452722442524e-05, "epoch": 0.24872054517091327, "percentage": 24.87, "elapsed_time": "1 day, 17:56:37", "remaining_time": "5 days, 6:40:50", "throughput": 2714.33, "total_tokens": 409857728} {"current_steps": 2273, "total_steps": 9134, "loss": 0.6154, "learning_rate": 4.274139562535643e-05, "epoch": 0.24883001724185116, "percentage": 24.89, "elapsed_time": "1 day, 17:57:43", "remaining_time": "5 days, 6:39:42", "throughput": 2714.45, "total_tokens": 410054624} {"current_steps": 2274, "total_steps": 9134, "loss": 0.8847, "learning_rate": 4.2735336429497166e-05, "epoch": 0.2489394893127891, "percentage": 24.9, "elapsed_time": "1 day, 17:58:52", "remaining_time": "5 days, 6:38:44", "throughput": 2714.66, "total_tokens": 410273696} {"current_steps": 2275, "total_steps": 9134, "loss": 0.7859, "learning_rate": 4.272927513558149e-05, "epoch": 0.24904896138372698, "percentage": 24.91, "elapsed_time": "1 day, 18:00:00", "remaining_time": "5 days, 6:37:40", "throughput": 2714.79, "total_tokens": 410477760} {"current_steps": 2276, "total_steps": 9134, "loss": 0.8957, "learning_rate": 4.272321174432646e-05, "epoch": 0.24915843345466487, "percentage": 24.92, "elapsed_time": "1 day, 18:01:06", "remaining_time": "5 days, 6:36:32", "throughput": 2714.8, "total_tokens": 410657856} {"current_steps": 2277, "total_steps": 9134, "loss": 0.7914, "learning_rate": 4.271714625644937e-05, "epoch": 0.24926790552560277, "percentage": 24.93, "elapsed_time": "1 day, 18:02:12", "remaining_time": "5 days, 6:35:26", "throughput": 2714.88, "total_tokens": 410850720} {"current_steps": 2278, "total_steps": 9134, "loss": 0.8169, "learning_rate": 4.271107867266775e-05, "epoch": 0.2493773775965407, "percentage": 24.94, "elapsed_time": "1 day, 18:03:17", "remaining_time": "5 days, 6:34:13", "throughput": 2714.87, "total_tokens": 411024320} {"current_steps": 2279, "total_steps": 9134, "loss": 0.8569, "learning_rate": 4.270500899369937e-05, "epoch": 0.24948684966747858, "percentage": 24.95, "elapsed_time": "1 day, 18:04:22", "remaining_time": "5 days, 6:33:05", "throughput": 2714.97, "total_tokens": 411218080} {"current_steps": 2280, "total_steps": 9134, "loss": 0.6996, "learning_rate": 4.269893722026228e-05, "epoch": 0.24959632173841648, "percentage": 24.96, "elapsed_time": "1 day, 18:05:27", "remaining_time": "5 days, 6:31:52", "throughput": 2714.92, "total_tokens": 411384512} {"current_steps": 2281, "total_steps": 9134, "loss": 0.6996, "learning_rate": 4.2692863353074745e-05, "epoch": 0.2497057938093544, "percentage": 24.97, "elapsed_time": "1 day, 18:06:35", "remaining_time": "5 days, 6:30:50", "throughput": 2714.93, "total_tokens": 411570880} {"current_steps": 2282, "total_steps": 9134, "loss": 0.6311, "learning_rate": 4.26867873928553e-05, "epoch": 0.2498152658802923, "percentage": 24.98, "elapsed_time": "1 day, 18:07:35", "remaining_time": "5 days, 6:29:26", "throughput": 2714.77, "total_tokens": 411710208} {"current_steps": 2283, "total_steps": 9134, "loss": 0.6481, "learning_rate": 4.2680709340322725e-05, "epoch": 0.24992473795123019, "percentage": 24.99, "elapsed_time": "1 day, 18:08:37", "remaining_time": "5 days, 6:28:06", "throughput": 2714.67, "total_tokens": 411864096} {"current_steps": 2284, "total_steps": 9134, "loss": 0.9176, "learning_rate": 4.2674629196196025e-05, "epoch": 0.2500342100221681, "percentage": 25.01, "elapsed_time": "1 day, 18:09:47", "remaining_time": "5 days, 6:27:09", "throughput": 2714.81, "total_tokens": 412073312} {"current_steps": 2285, "total_steps": 9134, "loss": 0.5857, "learning_rate": 4.266854696119449e-05, "epoch": 0.250143682093106, "percentage": 25.02, "elapsed_time": "1 day, 18:10:55", "remaining_time": "5 days, 6:26:09", "throughput": 2714.96, "total_tokens": 412282528} {"current_steps": 2286, "total_steps": 9134, "loss": 0.9749, "learning_rate": 4.266246263603761e-05, "epoch": 0.2502531541640439, "percentage": 25.03, "elapsed_time": "1 day, 18:12:04", "remaining_time": "5 days, 6:25:10", "throughput": 2715.12, "total_tokens": 412494880} {"current_steps": 2287, "total_steps": 9134, "loss": 0.8228, "learning_rate": 4.2656376221445185e-05, "epoch": 0.2503626262349818, "percentage": 25.04, "elapsed_time": "1 day, 18:13:10", "remaining_time": "5 days, 6:24:01", "throughput": 2715.06, "total_tokens": 412664000} {"current_steps": 2288, "total_steps": 9134, "loss": 0.7435, "learning_rate": 4.265028771813719e-05, "epoch": 0.2504720983059197, "percentage": 25.05, "elapsed_time": "1 day, 18:14:17", "remaining_time": "5 days, 6:22:56", "throughput": 2715.09, "total_tokens": 412849920} {"current_steps": 2289, "total_steps": 9134, "loss": 0.7253, "learning_rate": 4.2644197126833906e-05, "epoch": 0.25058157037685763, "percentage": 25.06, "elapsed_time": "1 day, 18:15:19", "remaining_time": "5 days, 6:21:36", "throughput": 2714.99, "total_tokens": 413002912} {"current_steps": 2290, "total_steps": 9134, "loss": 0.8337, "learning_rate": 4.263810444825583e-05, "epoch": 0.2506910424477955, "percentage": 25.07, "elapsed_time": "1 day, 18:16:24", "remaining_time": "5 days, 6:20:26", "throughput": 2714.87, "total_tokens": 413161056} {"current_steps": 2291, "total_steps": 9134, "loss": 0.7558, "learning_rate": 4.2632009683123716e-05, "epoch": 0.2508005145187334, "percentage": 25.08, "elapsed_time": "1 day, 18:17:28", "remaining_time": "5 days, 6:19:11", "throughput": 2714.84, "total_tokens": 413329952} {"current_steps": 2292, "total_steps": 9134, "loss": 0.5995, "learning_rate": 4.262591283215857e-05, "epoch": 0.2509099865896713, "percentage": 25.09, "elapsed_time": "1 day, 18:18:36", "remaining_time": "5 days, 6:18:11", "throughput": 2714.86, "total_tokens": 413518560} {"current_steps": 2293, "total_steps": 9134, "loss": 0.6912, "learning_rate": 4.261981389608162e-05, "epoch": 0.2510194586606092, "percentage": 25.1, "elapsed_time": "1 day, 18:19:42", "remaining_time": "5 days, 6:17:02", "throughput": 2714.74, "total_tokens": 413678720} {"current_steps": 2294, "total_steps": 9134, "loss": 0.6114, "learning_rate": 4.2613712875614374e-05, "epoch": 0.25112893073154713, "percentage": 25.11, "elapsed_time": "1 day, 18:20:47", "remaining_time": "5 days, 6:15:51", "throughput": 2714.69, "total_tokens": 413848064} {"current_steps": 2295, "total_steps": 9134, "loss": 0.7621, "learning_rate": 4.260760977147858e-05, "epoch": 0.251238402802485, "percentage": 25.13, "elapsed_time": "1 day, 18:21:53", "remaining_time": "5 days, 6:14:43", "throughput": 2714.6, "total_tokens": 414013152} {"current_steps": 2296, "total_steps": 9134, "loss": 0.7083, "learning_rate": 4.260150458439619e-05, "epoch": 0.2513478748734229, "percentage": 25.14, "elapsed_time": "1 day, 18:22:57", "remaining_time": "5 days, 6:13:30", "throughput": 2714.5, "total_tokens": 414172640} {"current_steps": 2297, "total_steps": 9134, "loss": 0.7597, "learning_rate": 4.259539731508947e-05, "epoch": 0.25145734694436084, "percentage": 25.15, "elapsed_time": "1 day, 18:23:59", "remaining_time": "5 days, 6:12:11", "throughput": 2714.49, "total_tokens": 414339968} {"current_steps": 2298, "total_steps": 9134, "loss": 0.6881, "learning_rate": 4.2589287964280874e-05, "epoch": 0.2515668190152987, "percentage": 25.16, "elapsed_time": "1 day, 18:25:06", "remaining_time": "5 days, 6:11:05", "throughput": 2714.5, "total_tokens": 414521856} {"current_steps": 2299, "total_steps": 9134, "loss": 0.7224, "learning_rate": 4.2583176532693136e-05, "epoch": 0.2516762910862366, "percentage": 25.17, "elapsed_time": "1 day, 18:26:14", "remaining_time": "5 days, 6:10:03", "throughput": 2714.62, "total_tokens": 414725248} {"current_steps": 2300, "total_steps": 9134, "loss": 0.7737, "learning_rate": 4.257706302104924e-05, "epoch": 0.25178576315717455, "percentage": 25.18, "elapsed_time": "1 day, 18:27:21", "remaining_time": "5 days, 6:08:57", "throughput": 2714.72, "total_tokens": 414920800} {"current_steps": 2301, "total_steps": 9134, "loss": 0.6697, "learning_rate": 4.2570947430072384e-05, "epoch": 0.2518952352281124, "percentage": 25.19, "elapsed_time": "1 day, 18:28:24", "remaining_time": "5 days, 6:07:41", "throughput": 2714.78, "total_tokens": 415101792} {"current_steps": 2302, "total_steps": 9134, "loss": 0.6812, "learning_rate": 4.256482976048603e-05, "epoch": 0.25200470729905033, "percentage": 25.2, "elapsed_time": "1 day, 18:29:29", "remaining_time": "5 days, 6:06:30", "throughput": 2714.71, "total_tokens": 415268448} {"current_steps": 2303, "total_steps": 9134, "loss": 0.521, "learning_rate": 4.2558710013013906e-05, "epoch": 0.25211417936998826, "percentage": 25.21, "elapsed_time": "1 day, 18:30:33", "remaining_time": "5 days, 6:05:17", "throughput": 2714.57, "total_tokens": 415420320} {"current_steps": 2304, "total_steps": 9134, "loss": 0.9001, "learning_rate": 4.255258818837994e-05, "epoch": 0.2522236514409261, "percentage": 25.22, "elapsed_time": "1 day, 18:31:39", "remaining_time": "5 days, 6:04:10", "throughput": 2714.53, "total_tokens": 415593024} {"current_steps": 2305, "total_steps": 9134, "loss": 0.5922, "learning_rate": 4.254646428730835e-05, "epoch": 0.25233312351186404, "percentage": 25.24, "elapsed_time": "1 day, 18:32:48", "remaining_time": "5 days, 6:03:11", "throughput": 2714.69, "total_tokens": 415806272} {"current_steps": 2306, "total_steps": 9134, "loss": 0.5669, "learning_rate": 4.254033831052359e-05, "epoch": 0.25244259558280197, "percentage": 25.25, "elapsed_time": "1 day, 18:33:54", "remaining_time": "5 days, 6:02:03", "throughput": 2714.66, "total_tokens": 415979200} {"current_steps": 2307, "total_steps": 9134, "loss": 0.6982, "learning_rate": 4.253421025875033e-05, "epoch": 0.25255206765373983, "percentage": 25.26, "elapsed_time": "1 day, 18:35:02", "remaining_time": "5 days, 6:01:00", "throughput": 2714.8, "total_tokens": 416184384} {"current_steps": 2308, "total_steps": 9134, "loss": 0.71, "learning_rate": 4.252808013271351e-05, "epoch": 0.25266153972467775, "percentage": 25.27, "elapsed_time": "1 day, 18:36:05", "remaining_time": "5 days, 5:59:44", "throughput": 2714.72, "total_tokens": 416343648} {"current_steps": 2309, "total_steps": 9134, "loss": 0.8952, "learning_rate": 4.252194793313833e-05, "epoch": 0.2527710117956156, "percentage": 25.28, "elapsed_time": "1 day, 18:37:10", "remaining_time": "5 days, 5:58:35", "throughput": 2714.74, "total_tokens": 416525984} {"current_steps": 2310, "total_steps": 9134, "loss": 0.6391, "learning_rate": 4.25158136607502e-05, "epoch": 0.25288048386655354, "percentage": 25.29, "elapsed_time": "1 day, 18:38:12", "remaining_time": "5 days, 5:57:13", "throughput": 2714.67, "total_tokens": 416680544} {"current_steps": 2311, "total_steps": 9134, "loss": 0.609, "learning_rate": 4.25096773162748e-05, "epoch": 0.25298995593749146, "percentage": 25.3, "elapsed_time": "1 day, 18:39:19", "remaining_time": "5 days, 5:56:08", "throughput": 2714.69, "total_tokens": 416866240} {"current_steps": 2312, "total_steps": 9134, "loss": 0.7208, "learning_rate": 4.2503538900438044e-05, "epoch": 0.25309942800842933, "percentage": 25.31, "elapsed_time": "1 day, 18:40:23", "remaining_time": "5 days, 5:54:55", "throughput": 2714.76, "total_tokens": 417051712} {"current_steps": 2313, "total_steps": 9134, "loss": 0.5881, "learning_rate": 4.2497398413966094e-05, "epoch": 0.25320890007936725, "percentage": 25.32, "elapsed_time": "1 day, 18:41:28", "remaining_time": "5 days, 5:53:45", "throughput": 2714.78, "total_tokens": 417230688} {"current_steps": 2314, "total_steps": 9134, "loss": 0.6289, "learning_rate": 4.249125585758537e-05, "epoch": 0.25331837215030517, "percentage": 25.33, "elapsed_time": "1 day, 18:42:34", "remaining_time": "5 days, 5:52:37", "throughput": 2714.86, "total_tokens": 417422880} {"current_steps": 2315, "total_steps": 9134, "loss": 0.6618, "learning_rate": 4.248511123202251e-05, "epoch": 0.25342784422124304, "percentage": 25.34, "elapsed_time": "1 day, 18:43:41", "remaining_time": "5 days, 5:51:31", "throughput": 2714.86, "total_tokens": 417602976} {"current_steps": 2316, "total_steps": 9134, "loss": 0.7165, "learning_rate": 4.247896453800442e-05, "epoch": 0.25353731629218096, "percentage": 25.36, "elapsed_time": "1 day, 18:44:48", "remaining_time": "5 days, 5:50:28", "throughput": 2714.95, "total_tokens": 417800544} {"current_steps": 2317, "total_steps": 9134, "loss": 0.6589, "learning_rate": 4.247281577625824e-05, "epoch": 0.2536467883631189, "percentage": 25.37, "elapsed_time": "1 day, 18:45:55", "remaining_time": "5 days, 5:49:21", "throughput": 2715.0, "total_tokens": 417988256} {"current_steps": 2318, "total_steps": 9134, "loss": 0.8643, "learning_rate": 4.2466664947511356e-05, "epoch": 0.25375626043405675, "percentage": 25.38, "elapsed_time": "1 day, 18:46:58", "remaining_time": "5 days, 5:48:06", "throughput": 2714.87, "total_tokens": 418140800} {"current_steps": 2319, "total_steps": 9134, "loss": 0.764, "learning_rate": 4.246051205249139e-05, "epoch": 0.25386573250499467, "percentage": 25.39, "elapsed_time": "1 day, 18:48:07", "remaining_time": "5 days, 5:47:08", "throughput": 2715.04, "total_tokens": 418354720} {"current_steps": 2320, "total_steps": 9134, "loss": 0.676, "learning_rate": 4.2454357091926236e-05, "epoch": 0.2539752045759326, "percentage": 25.4, "elapsed_time": "1 day, 18:49:10", "remaining_time": "5 days, 5:45:51", "throughput": 2714.99, "total_tokens": 418517792} {"current_steps": 2321, "total_steps": 9134, "loss": 0.5762, "learning_rate": 4.244820006654401e-05, "epoch": 0.25408467664687046, "percentage": 25.41, "elapsed_time": "1 day, 18:50:17", "remaining_time": "5 days, 5:44:46", "throughput": 2714.93, "total_tokens": 418690944} {"current_steps": 2322, "total_steps": 9134, "loss": 0.7981, "learning_rate": 4.244204097707306e-05, "epoch": 0.2541941487178084, "percentage": 25.42, "elapsed_time": "1 day, 18:51:26", "remaining_time": "5 days, 5:43:47", "throughput": 2715.15, "total_tokens": 418912480} {"current_steps": 2323, "total_steps": 9134, "loss": 0.701, "learning_rate": 4.243587982424201e-05, "epoch": 0.2543036207887463, "percentage": 25.43, "elapsed_time": "1 day, 18:52:33", "remaining_time": "5 days, 5:42:42", "throughput": 2715.13, "total_tokens": 419089888} {"current_steps": 2324, "total_steps": 9134, "loss": 0.6268, "learning_rate": 4.242971660877971e-05, "epoch": 0.25441309285968416, "percentage": 25.44, "elapsed_time": "1 day, 18:53:36", "remaining_time": "5 days, 5:41:25", "throughput": 2715.03, "total_tokens": 419246240} {"current_steps": 2325, "total_steps": 9134, "loss": 0.6317, "learning_rate": 4.242355133141525e-05, "epoch": 0.2545225649306221, "percentage": 25.45, "elapsed_time": "1 day, 18:54:42", "remaining_time": "5 days, 5:40:19", "throughput": 2715.14, "total_tokens": 419442688} {"current_steps": 2326, "total_steps": 9134, "loss": 0.6422, "learning_rate": 4.241738399287798e-05, "epoch": 0.25463203700155995, "percentage": 25.47, "elapsed_time": "1 day, 18:55:48", "remaining_time": "5 days, 5:39:11", "throughput": 2715.15, "total_tokens": 419623680} {"current_steps": 2327, "total_steps": 9134, "loss": 0.7002, "learning_rate": 4.2411214593897486e-05, "epoch": 0.2547415090724979, "percentage": 25.48, "elapsed_time": "1 day, 18:56:55", "remaining_time": "5 days, 5:38:06", "throughput": 2715.24, "total_tokens": 419819008} {"current_steps": 2328, "total_steps": 9134, "loss": 0.9622, "learning_rate": 4.2405043135203584e-05, "epoch": 0.2548509811434358, "percentage": 25.49, "elapsed_time": "1 day, 18:58:04", "remaining_time": "5 days, 5:37:05", "throughput": 2715.32, "total_tokens": 420017696} {"current_steps": 2329, "total_steps": 9134, "loss": 0.7019, "learning_rate": 4.239886961752635e-05, "epoch": 0.25496045321437366, "percentage": 25.5, "elapsed_time": "1 day, 18:59:10", "remaining_time": "5 days, 5:35:58", "throughput": 2715.41, "total_tokens": 420210784} {"current_steps": 2330, "total_steps": 9134, "loss": 0.6885, "learning_rate": 4.23926940415961e-05, "epoch": 0.2550699252853116, "percentage": 25.51, "elapsed_time": "1 day, 19:00:16", "remaining_time": "5 days, 5:34:50", "throughput": 2715.53, "total_tokens": 420407904} {"current_steps": 2331, "total_steps": 9134, "loss": 0.5546, "learning_rate": 4.2386516408143404e-05, "epoch": 0.2551793973562495, "percentage": 25.52, "elapsed_time": "1 day, 19:01:23", "remaining_time": "5 days, 5:33:44", "throughput": 2715.53, "total_tokens": 420589120} {"current_steps": 2332, "total_steps": 9134, "loss": 0.6421, "learning_rate": 4.2380336717899044e-05, "epoch": 0.25528886942718737, "percentage": 25.53, "elapsed_time": "1 day, 19:02:25", "remaining_time": "5 days, 5:32:25", "throughput": 2715.44, "total_tokens": 420744352} {"current_steps": 2333, "total_steps": 9134, "loss": 0.6979, "learning_rate": 4.237415497159408e-05, "epoch": 0.2553983414981253, "percentage": 25.54, "elapsed_time": "1 day, 19:03:32", "remaining_time": "5 days, 5:31:22", "throughput": 2715.5, "total_tokens": 420938112} {"current_steps": 2334, "total_steps": 9134, "loss": 0.6976, "learning_rate": 4.2367971169959796e-05, "epoch": 0.2555078135690632, "percentage": 25.55, "elapsed_time": "1 day, 19:04:33", "remaining_time": "5 days, 5:29:59", "throughput": 2715.38, "total_tokens": 421084160} {"current_steps": 2335, "total_steps": 9134, "loss": 0.6831, "learning_rate": 4.2361785313727726e-05, "epoch": 0.2556172856400011, "percentage": 25.56, "elapsed_time": "1 day, 19:05:40", "remaining_time": "5 days, 5:28:54", "throughput": 2715.49, "total_tokens": 421281728} {"current_steps": 2336, "total_steps": 9134, "loss": 0.8004, "learning_rate": 4.235559740362964e-05, "epoch": 0.255726757710939, "percentage": 25.57, "elapsed_time": "1 day, 19:06:48", "remaining_time": "5 days, 5:27:54", "throughput": 2715.58, "total_tokens": 421481984} {"current_steps": 2337, "total_steps": 9134, "loss": 0.7721, "learning_rate": 4.2349407440397566e-05, "epoch": 0.2558362297818769, "percentage": 25.59, "elapsed_time": "1 day, 19:07:57", "remaining_time": "5 days, 5:26:54", "throughput": 2715.58, "total_tokens": 421669696} {"current_steps": 2338, "total_steps": 9134, "loss": 0.6656, "learning_rate": 4.234321542476375e-05, "epoch": 0.2559457018528148, "percentage": 25.6, "elapsed_time": "1 day, 19:09:05", "remaining_time": "5 days, 5:25:51", "throughput": 2715.71, "total_tokens": 421873312} {"current_steps": 2339, "total_steps": 9134, "loss": 0.6814, "learning_rate": 4.2337021357460706e-05, "epoch": 0.2560551739237527, "percentage": 25.61, "elapsed_time": "1 day, 19:10:14", "remaining_time": "5 days, 5:24:52", "throughput": 2715.74, "total_tokens": 422064832} {"current_steps": 2340, "total_steps": 9134, "loss": 0.8215, "learning_rate": 4.2330825239221186e-05, "epoch": 0.25616464599469063, "percentage": 25.62, "elapsed_time": "1 day, 19:11:17", "remaining_time": "5 days, 5:23:36", "throughput": 2715.7, "total_tokens": 422230144} {"current_steps": 2341, "total_steps": 9134, "loss": 0.8495, "learning_rate": 4.232462707077816e-05, "epoch": 0.2562741180656285, "percentage": 25.63, "elapsed_time": "1 day, 19:12:26", "remaining_time": "5 days, 5:22:37", "throughput": 2715.95, "total_tokens": 422457280} {"current_steps": 2342, "total_steps": 9134, "loss": 0.9702, "learning_rate": 4.231842685286488e-05, "epoch": 0.2563835901365664, "percentage": 25.64, "elapsed_time": "1 day, 19:13:34", "remaining_time": "5 days, 5:21:35", "throughput": 2716.13, "total_tokens": 422669856} {"current_steps": 2343, "total_steps": 9134, "loss": 0.5781, "learning_rate": 4.23122245862148e-05, "epoch": 0.2564930622075043, "percentage": 25.65, "elapsed_time": "1 day, 19:14:40", "remaining_time": "5 days, 5:20:26", "throughput": 2716.03, "total_tokens": 422831136} {"current_steps": 2344, "total_steps": 9134, "loss": 0.8055, "learning_rate": 4.2306020271561656e-05, "epoch": 0.2566025342784422, "percentage": 25.66, "elapsed_time": "1 day, 19:15:45", "remaining_time": "5 days, 5:19:16", "throughput": 2716.07, "total_tokens": 423015488} {"current_steps": 2345, "total_steps": 9134, "loss": 0.6582, "learning_rate": 4.2299813909639395e-05, "epoch": 0.25671200634938013, "percentage": 25.67, "elapsed_time": "1 day, 19:16:54", "remaining_time": "5 days, 5:18:17", "throughput": 2716.11, "total_tokens": 423209024} {"current_steps": 2346, "total_steps": 9134, "loss": 0.7001, "learning_rate": 4.229360550118222e-05, "epoch": 0.256821478420318, "percentage": 25.68, "elapsed_time": "1 day, 19:18:00", "remaining_time": "5 days, 5:17:10", "throughput": 2715.96, "total_tokens": 423365824} {"current_steps": 2347, "total_steps": 9134, "loss": 0.6909, "learning_rate": 4.228739504692457e-05, "epoch": 0.2569309504912559, "percentage": 25.7, "elapsed_time": "1 day, 19:19:06", "remaining_time": "5 days, 5:16:02", "throughput": 2716.03, "total_tokens": 423554880} {"current_steps": 2348, "total_steps": 9134, "loss": 0.5869, "learning_rate": 4.228118254760114e-05, "epoch": 0.25704042256219384, "percentage": 25.71, "elapsed_time": "1 day, 19:20:12", "remaining_time": "5 days, 5:14:55", "throughput": 2716.03, "total_tokens": 423735872} {"current_steps": 2349, "total_steps": 9134, "loss": 0.7899, "learning_rate": 4.2274968003946845e-05, "epoch": 0.2571498946331317, "percentage": 25.72, "elapsed_time": "1 day, 19:21:18", "remaining_time": "5 days, 5:13:46", "throughput": 2716.07, "total_tokens": 423918880} {"current_steps": 2350, "total_steps": 9134, "loss": 0.6313, "learning_rate": 4.226875141669686e-05, "epoch": 0.2572593667040696, "percentage": 25.73, "elapsed_time": "1 day, 19:22:23", "remaining_time": "5 days, 5:12:37", "throughput": 2716.0, "total_tokens": 424086656} {"current_steps": 2351, "total_steps": 9134, "loss": 0.6408, "learning_rate": 4.22625327865866e-05, "epoch": 0.25736883877500755, "percentage": 25.74, "elapsed_time": "1 day, 19:23:27", "remaining_time": "5 days, 5:11:23", "throughput": 2715.99, "total_tokens": 424259136} {"current_steps": 2352, "total_steps": 9134, "loss": 0.6255, "learning_rate": 4.22563121143517e-05, "epoch": 0.2574783108459454, "percentage": 25.75, "elapsed_time": "1 day, 19:24:31", "remaining_time": "5 days, 5:10:10", "throughput": 2715.96, "total_tokens": 424428704} {"current_steps": 2353, "total_steps": 9134, "loss": 0.8997, "learning_rate": 4.225008940072808e-05, "epoch": 0.25758778291688333, "percentage": 25.76, "elapsed_time": "1 day, 19:25:40", "remaining_time": "5 days, 5:09:09", "throughput": 2716.04, "total_tokens": 424625824} {"current_steps": 2354, "total_steps": 9134, "loss": 0.8799, "learning_rate": 4.224386464645186e-05, "epoch": 0.25769725498782126, "percentage": 25.77, "elapsed_time": "1 day, 19:26:49", "remaining_time": "5 days, 5:08:10", "throughput": 2716.12, "total_tokens": 424826304} {"current_steps": 2355, "total_steps": 9134, "loss": 0.6415, "learning_rate": 4.22376378522594e-05, "epoch": 0.2578067270587591, "percentage": 25.78, "elapsed_time": "1 day, 19:27:48", "remaining_time": "5 days, 5:06:44", "throughput": 2715.99, "total_tokens": 424968320} {"current_steps": 2356, "total_steps": 9134, "loss": 0.6528, "learning_rate": 4.223140901888736e-05, "epoch": 0.25791619912969704, "percentage": 25.79, "elapsed_time": "1 day, 19:28:55", "remaining_time": "5 days, 5:05:39", "throughput": 2716.03, "total_tokens": 425156480} {"current_steps": 2357, "total_steps": 9134, "loss": 0.959, "learning_rate": 4.222517814707255e-05, "epoch": 0.25802567120063497, "percentage": 25.8, "elapsed_time": "1 day, 19:30:03", "remaining_time": "5 days, 5:04:37", "throughput": 2716.2, "total_tokens": 425366368} {"current_steps": 2358, "total_steps": 9134, "loss": 0.6475, "learning_rate": 4.221894523755211e-05, "epoch": 0.25813514327157283, "percentage": 25.82, "elapsed_time": "1 day, 19:31:11", "remaining_time": "5 days, 5:03:34", "throughput": 2716.29, "total_tokens": 425564608} {"current_steps": 2359, "total_steps": 9134, "loss": 0.5597, "learning_rate": 4.2212710291063354e-05, "epoch": 0.25824461534251075, "percentage": 25.83, "elapsed_time": "1 day, 19:32:15", "remaining_time": "5 days, 5:02:21", "throughput": 2716.21, "total_tokens": 425725888} {"current_steps": 2360, "total_steps": 9134, "loss": 0.7329, "learning_rate": 4.220647330834389e-05, "epoch": 0.2583540874134486, "percentage": 25.84, "elapsed_time": "1 day, 19:33:20", "remaining_time": "5 days, 5:01:11", "throughput": 2716.08, "total_tokens": 425882688} {"current_steps": 2361, "total_steps": 9134, "loss": 0.679, "learning_rate": 4.2200234290131515e-05, "epoch": 0.25846355948438654, "percentage": 25.85, "elapsed_time": "1 day, 19:34:23", "remaining_time": "5 days, 4:59:55", "throughput": 2715.97, "total_tokens": 426037024} {"current_steps": 2362, "total_steps": 9134, "loss": 0.6232, "learning_rate": 4.219399323716431e-05, "epoch": 0.25857303155532446, "percentage": 25.86, "elapsed_time": "1 day, 19:35:27", "remaining_time": "5 days, 4:58:39", "throughput": 2715.88, "total_tokens": 426195392} {"current_steps": 2363, "total_steps": 9134, "loss": 0.7653, "learning_rate": 4.2187750150180574e-05, "epoch": 0.25868250362626233, "percentage": 25.87, "elapsed_time": "1 day, 19:36:30", "remaining_time": "5 days, 4:57:24", "throughput": 2715.76, "total_tokens": 426348160} {"current_steps": 2364, "total_steps": 9134, "loss": 0.797, "learning_rate": 4.2181505029918847e-05, "epoch": 0.25879197569720025, "percentage": 25.88, "elapsed_time": "1 day, 19:37:33", "remaining_time": "5 days, 4:56:08", "throughput": 2715.78, "total_tokens": 426523328} {"current_steps": 2365, "total_steps": 9134, "loss": 0.9774, "learning_rate": 4.217525787711792e-05, "epoch": 0.25890144776813817, "percentage": 25.89, "elapsed_time": "1 day, 19:38:39", "remaining_time": "5 days, 4:55:01", "throughput": 2715.78, "total_tokens": 426702304} {"current_steps": 2366, "total_steps": 9134, "loss": 0.7212, "learning_rate": 4.216900869251683e-05, "epoch": 0.25901091983907604, "percentage": 25.9, "elapsed_time": "1 day, 19:39:44", "remaining_time": "5 days, 4:53:51", "throughput": 2715.78, "total_tokens": 426879936} {"current_steps": 2367, "total_steps": 9134, "loss": 0.6235, "learning_rate": 4.216275747685482e-05, "epoch": 0.25912039191001396, "percentage": 25.91, "elapsed_time": "1 day, 19:40:53", "remaining_time": "5 days, 4:52:51", "throughput": 2715.88, "total_tokens": 427081760} {"current_steps": 2368, "total_steps": 9134, "loss": 0.6489, "learning_rate": 4.215650423087142e-05, "epoch": 0.2592298639809519, "percentage": 25.93, "elapsed_time": "1 day, 19:42:00", "remaining_time": "5 days, 4:51:47", "throughput": 2715.84, "total_tokens": 427258944} {"current_steps": 2369, "total_steps": 9134, "loss": 0.6584, "learning_rate": 4.215024895530636e-05, "epoch": 0.25933933605188975, "percentage": 25.94, "elapsed_time": "1 day, 19:43:07", "remaining_time": "5 days, 4:50:42", "throughput": 2715.84, "total_tokens": 427439488} {"current_steps": 2370, "total_steps": 9134, "loss": 0.6371, "learning_rate": 4.2143991650899646e-05, "epoch": 0.25944880812282767, "percentage": 25.95, "elapsed_time": "1 day, 19:44:12", "remaining_time": "5 days, 4:49:30", "throughput": 2715.85, "total_tokens": 427616896} {"current_steps": 2371, "total_steps": 9134, "loss": 0.6665, "learning_rate": 4.213773231839149e-05, "epoch": 0.2595582801937656, "percentage": 25.96, "elapsed_time": "1 day, 19:45:20", "remaining_time": "5 days, 4:48:28", "throughput": 2715.96, "total_tokens": 427818944} {"current_steps": 2372, "total_steps": 9134, "loss": 0.7532, "learning_rate": 4.213147095852235e-05, "epoch": 0.25966775226470346, "percentage": 25.97, "elapsed_time": "1 day, 19:46:25", "remaining_time": "5 days, 4:47:17", "throughput": 2716.01, "total_tokens": 428003520} {"current_steps": 2373, "total_steps": 9134, "loss": 0.7031, "learning_rate": 4.2125207572032954e-05, "epoch": 0.2597772243356414, "percentage": 25.98, "elapsed_time": "1 day, 19:47:32", "remaining_time": "5 days, 4:46:12", "throughput": 2716.1, "total_tokens": 428199296} {"current_steps": 2374, "total_steps": 9134, "loss": 0.6883, "learning_rate": 4.211894215966424e-05, "epoch": 0.2598866964065793, "percentage": 25.99, "elapsed_time": "1 day, 19:48:39", "remaining_time": "5 days, 4:45:09", "throughput": 2716.01, "total_tokens": 428368192} {"current_steps": 2375, "total_steps": 9134, "loss": 0.7356, "learning_rate": 4.21126747221574e-05, "epoch": 0.25999616847751716, "percentage": 26.0, "elapsed_time": "1 day, 19:49:44", "remaining_time": "5 days, 4:43:58", "throughput": 2716.04, "total_tokens": 428549408} {"current_steps": 2376, "total_steps": 9134, "loss": 0.6502, "learning_rate": 4.210640526025384e-05, "epoch": 0.2601056405484551, "percentage": 26.01, "elapsed_time": "1 day, 19:50:52", "remaining_time": "5 days, 4:42:56", "throughput": 2716.03, "total_tokens": 428732192} {"current_steps": 2377, "total_steps": 9134, "loss": 0.7482, "learning_rate": 4.210013377469525e-05, "epoch": 0.26021511261939295, "percentage": 26.02, "elapsed_time": "1 day, 19:52:01", "remaining_time": "5 days, 4:41:57", "throughput": 2715.99, "total_tokens": 428913184} {"current_steps": 2378, "total_steps": 9134, "loss": 0.584, "learning_rate": 4.209386026622353e-05, "epoch": 0.2603245846903309, "percentage": 26.03, "elapsed_time": "1 day, 19:53:07", "remaining_time": "5 days, 4:40:48", "throughput": 2716.03, "total_tokens": 429097984} {"current_steps": 2379, "total_steps": 9134, "loss": 0.5518, "learning_rate": 4.208758473558081e-05, "epoch": 0.2604340567612688, "percentage": 26.05, "elapsed_time": "1 day, 19:54:11", "remaining_time": "5 days, 4:39:36", "throughput": 2715.99, "total_tokens": 429265760} {"current_steps": 2380, "total_steps": 9134, "loss": 0.7819, "learning_rate": 4.208130718350948e-05, "epoch": 0.26054352883220666, "percentage": 26.06, "elapsed_time": "1 day, 19:55:17", "remaining_time": "5 days, 4:38:29", "throughput": 2716.01, "total_tokens": 429449888} {"current_steps": 2381, "total_steps": 9134, "loss": 0.7541, "learning_rate": 4.207502761075217e-05, "epoch": 0.2606530009031446, "percentage": 26.07, "elapsed_time": "1 day, 19:56:23", "remaining_time": "5 days, 4:37:21", "throughput": 2716.1, "total_tokens": 429643648} {"current_steps": 2382, "total_steps": 9134, "loss": 0.5879, "learning_rate": 4.206874601805173e-05, "epoch": 0.2607624729740825, "percentage": 26.08, "elapsed_time": "1 day, 19:57:32", "remaining_time": "5 days, 4:36:21", "throughput": 2716.13, "total_tokens": 429833824} {"current_steps": 2383, "total_steps": 9134, "loss": 0.8328, "learning_rate": 4.206246240615127e-05, "epoch": 0.26087194504502037, "percentage": 26.09, "elapsed_time": "1 day, 19:58:37", "remaining_time": "5 days, 4:35:11", "throughput": 2716.05, "total_tokens": 429999136} {"current_steps": 2384, "total_steps": 9134, "loss": 0.8094, "learning_rate": 4.205617677579413e-05, "epoch": 0.2609814171159583, "percentage": 26.1, "elapsed_time": "1 day, 19:59:46", "remaining_time": "5 days, 4:34:10", "throughput": 2716.17, "total_tokens": 430203200} {"current_steps": 2385, "total_steps": 9134, "loss": 0.6311, "learning_rate": 4.2049889127723876e-05, "epoch": 0.2610908891868962, "percentage": 26.11, "elapsed_time": "1 day, 20:00:52", "remaining_time": "5 days, 4:33:03", "throughput": 2716.21, "total_tokens": 430389792} {"current_steps": 2386, "total_steps": 9134, "loss": 0.5677, "learning_rate": 4.204359946268432e-05, "epoch": 0.2612003612578341, "percentage": 26.12, "elapsed_time": "1 day, 20:02:00", "remaining_time": "5 days, 4:32:02", "throughput": 2716.23, "total_tokens": 430579520} {"current_steps": 2387, "total_steps": 9134, "loss": 0.8018, "learning_rate": 4.203730778141955e-05, "epoch": 0.261309833328772, "percentage": 26.13, "elapsed_time": "1 day, 20:03:07", "remaining_time": "5 days, 4:30:58", "throughput": 2716.23, "total_tokens": 430761184} {"current_steps": 2388, "total_steps": 9134, "loss": 0.5371, "learning_rate": 4.203101408467383e-05, "epoch": 0.2614193053997099, "percentage": 26.14, "elapsed_time": "1 day, 20:04:12", "remaining_time": "5 days, 4:29:45", "throughput": 2716.22, "total_tokens": 430934112} {"current_steps": 2389, "total_steps": 9134, "loss": 0.9066, "learning_rate": 4.2024718373191705e-05, "epoch": 0.2615287774706478, "percentage": 26.16, "elapsed_time": "1 day, 20:05:21", "remaining_time": "5 days, 4:28:47", "throughput": 2716.25, "total_tokens": 431126304} {"current_steps": 2390, "total_steps": 9134, "loss": 0.7265, "learning_rate": 4.201842064771794e-05, "epoch": 0.2616382495415857, "percentage": 26.17, "elapsed_time": "1 day, 20:06:28", "remaining_time": "5 days, 4:27:43", "throughput": 2716.27, "total_tokens": 431313344} {"current_steps": 2391, "total_steps": 9134, "loss": 0.7215, "learning_rate": 4.2012120908997546e-05, "epoch": 0.26174772161252363, "percentage": 26.18, "elapsed_time": "1 day, 20:07:33", "remaining_time": "5 days, 4:26:33", "throughput": 2716.27, "total_tokens": 431490752} {"current_steps": 2392, "total_steps": 9134, "loss": 0.7194, "learning_rate": 4.200581915777577e-05, "epoch": 0.2618571936834615, "percentage": 26.19, "elapsed_time": "1 day, 20:08:41", "remaining_time": "5 days, 4:25:29", "throughput": 2716.31, "total_tokens": 431678688} {"current_steps": 2393, "total_steps": 9134, "loss": 0.5698, "learning_rate": 4.19995153947981e-05, "epoch": 0.2619666657543994, "percentage": 26.2, "elapsed_time": "1 day, 20:09:47", "remaining_time": "5 days, 4:24:23", "throughput": 2716.29, "total_tokens": 431856768} {"current_steps": 2394, "total_steps": 9134, "loss": 0.6913, "learning_rate": 4.1993209620810255e-05, "epoch": 0.2620761378253373, "percentage": 26.21, "elapsed_time": "1 day, 20:10:55", "remaining_time": "5 days, 4:23:21", "throughput": 2716.45, "total_tokens": 432067328} {"current_steps": 2395, "total_steps": 9134, "loss": 0.7507, "learning_rate": 4.19869018365582e-05, "epoch": 0.2621856098962752, "percentage": 26.22, "elapsed_time": "1 day, 20:12:03", "remaining_time": "5 days, 4:22:18", "throughput": 2716.51, "total_tokens": 432260640} {"current_steps": 2396, "total_steps": 9134, "loss": 0.5902, "learning_rate": 4.198059204278813e-05, "epoch": 0.26229508196721313, "percentage": 26.23, "elapsed_time": "1 day, 20:13:09", "remaining_time": "5 days, 4:21:09", "throughput": 2716.41, "total_tokens": 432423264} {"current_steps": 2397, "total_steps": 9134, "loss": 0.6058, "learning_rate": 4.1974280240246477e-05, "epoch": 0.262404554038151, "percentage": 26.24, "elapsed_time": "1 day, 20:14:16", "remaining_time": "5 days, 4:20:06", "throughput": 2716.49, "total_tokens": 432619264} {"current_steps": 2398, "total_steps": 9134, "loss": 0.6659, "learning_rate": 4.196796642967992e-05, "epoch": 0.2625140261090889, "percentage": 26.25, "elapsed_time": "1 day, 20:15:19", "remaining_time": "5 days, 4:18:51", "throughput": 2716.49, "total_tokens": 432791744} {"current_steps": 2399, "total_steps": 9134, "loss": 1.0284, "learning_rate": 4.1961650611835376e-05, "epoch": 0.26262349818002684, "percentage": 26.26, "elapsed_time": "1 day, 20:16:28", "remaining_time": "5 days, 4:17:49", "throughput": 2716.62, "total_tokens": 432996704} {"current_steps": 2400, "total_steps": 9134, "loss": 0.6089, "learning_rate": 4.195533278745999e-05, "epoch": 0.2627329702509647, "percentage": 26.28, "elapsed_time": "1 day, 20:17:33", "remaining_time": "5 days, 4:16:39", "throughput": 2716.62, "total_tokens": 433174336} {"current_steps": 2401, "total_steps": 9134, "loss": 0.6598, "learning_rate": 4.194901295730115e-05, "epoch": 0.2628424423219026, "percentage": 26.29, "elapsed_time": "1 day, 20:18:41", "remaining_time": "5 days, 4:15:37", "throughput": 2716.8, "total_tokens": 433387584} {"current_steps": 2402, "total_steps": 9134, "loss": 0.6033, "learning_rate": 4.1942691122106484e-05, "epoch": 0.26295191439284055, "percentage": 26.3, "elapsed_time": "1 day, 20:19:46", "remaining_time": "5 days, 4:14:26", "throughput": 2716.78, "total_tokens": 433560960} {"current_steps": 2403, "total_steps": 9134, "loss": 0.6755, "learning_rate": 4.1936367282623836e-05, "epoch": 0.2630613864637784, "percentage": 26.31, "elapsed_time": "1 day, 20:20:51", "remaining_time": "5 days, 4:13:16", "throughput": 2716.81, "total_tokens": 433741952} {"current_steps": 2404, "total_steps": 9134, "loss": 0.8841, "learning_rate": 4.1930041439601316e-05, "epoch": 0.26317085853471633, "percentage": 26.32, "elapsed_time": "1 day, 20:22:00", "remaining_time": "5 days, 4:12:16", "throughput": 2716.98, "total_tokens": 433956096} {"current_steps": 2405, "total_steps": 9134, "loss": 0.6934, "learning_rate": 4.192371359378726e-05, "epoch": 0.26328033060565426, "percentage": 26.33, "elapsed_time": "1 day, 20:23:03", "remaining_time": "5 days, 4:11:01", "throughput": 2717.04, "total_tokens": 434138208} {"current_steps": 2406, "total_steps": 9134, "loss": 0.6385, "learning_rate": 4.191738374593024e-05, "epoch": 0.2633898026765921, "percentage": 26.34, "elapsed_time": "1 day, 20:24:09", "remaining_time": "5 days, 4:09:54", "throughput": 2717.1, "total_tokens": 434327264} {"current_steps": 2407, "total_steps": 9134, "loss": 0.5218, "learning_rate": 4.191105189677906e-05, "epoch": 0.26349927474753004, "percentage": 26.35, "elapsed_time": "1 day, 20:25:11", "remaining_time": "5 days, 4:08:34", "throughput": 2716.99, "total_tokens": 434476224} {"current_steps": 2408, "total_steps": 9134, "loss": 0.861, "learning_rate": 4.190471804708278e-05, "epoch": 0.26360874681846796, "percentage": 26.36, "elapsed_time": "1 day, 20:26:15", "remaining_time": "5 days, 4:07:22", "throughput": 2717.04, "total_tokens": 434660800} {"current_steps": 2409, "total_steps": 9134, "loss": 0.5958, "learning_rate": 4.189838219759066e-05, "epoch": 0.26371821888940583, "percentage": 26.37, "elapsed_time": "1 day, 20:27:16", "remaining_time": "5 days, 4:05:59", "throughput": 2716.94, "total_tokens": 434808192} {"current_steps": 2410, "total_steps": 9134, "loss": 0.8483, "learning_rate": 4.1892044349052234e-05, "epoch": 0.26382769096034375, "percentage": 26.38, "elapsed_time": "1 day, 20:28:22", "remaining_time": "5 days, 4:04:53", "throughput": 2716.98, "total_tokens": 434996576} {"current_steps": 2411, "total_steps": 9134, "loss": 0.9089, "learning_rate": 4.1885704502217255e-05, "epoch": 0.2639371630312816, "percentage": 26.4, "elapsed_time": "1 day, 20:29:31", "remaining_time": "5 days, 4:03:53", "throughput": 2717.22, "total_tokens": 435221248} {"current_steps": 2412, "total_steps": 9134, "loss": 0.6613, "learning_rate": 4.187936265783571e-05, "epoch": 0.26404663510221954, "percentage": 26.41, "elapsed_time": "1 day, 20:30:34", "remaining_time": "5 days, 4:02:36", "throughput": 2717.18, "total_tokens": 435386112} {"current_steps": 2413, "total_steps": 9134, "loss": 0.7273, "learning_rate": 4.187301881665783e-05, "epoch": 0.26415610717315746, "percentage": 26.42, "elapsed_time": "1 day, 20:31:40", "remaining_time": "5 days, 4:01:31", "throughput": 2717.14, "total_tokens": 435560832} {"current_steps": 2414, "total_steps": 9134, "loss": 0.8307, "learning_rate": 4.1866672979434084e-05, "epoch": 0.2642655792440953, "percentage": 26.43, "elapsed_time": "1 day, 20:32:45", "remaining_time": "5 days, 4:00:19", "throughput": 2717.12, "total_tokens": 435733312} {"current_steps": 2415, "total_steps": 9134, "loss": 0.7134, "learning_rate": 4.1860325146915166e-05, "epoch": 0.26437505131503325, "percentage": 26.44, "elapsed_time": "1 day, 20:33:54", "remaining_time": "5 days, 3:59:18", "throughput": 2717.24, "total_tokens": 435938048} {"current_steps": 2416, "total_steps": 9134, "loss": 0.7758, "learning_rate": 4.1853975319852015e-05, "epoch": 0.26448452338597117, "percentage": 26.45, "elapsed_time": "1 day, 20:35:01", "remaining_time": "5 days, 3:58:16", "throughput": 2717.29, "total_tokens": 436129568} {"current_steps": 2417, "total_steps": 9134, "loss": 0.6861, "learning_rate": 4.18476234989958e-05, "epoch": 0.26459399545690904, "percentage": 26.46, "elapsed_time": "1 day, 20:36:10", "remaining_time": "5 days, 3:57:14", "throughput": 2717.3, "total_tokens": 436316608} {"current_steps": 2418, "total_steps": 9134, "loss": 0.6837, "learning_rate": 4.184126968509794e-05, "epoch": 0.26470346752784696, "percentage": 26.47, "elapsed_time": "1 day, 20:37:16", "remaining_time": "5 days, 3:56:09", "throughput": 2717.5, "total_tokens": 436530304} {"current_steps": 2419, "total_steps": 9134, "loss": 0.7014, "learning_rate": 4.183491387891007e-05, "epoch": 0.2648129395987849, "percentage": 26.48, "elapsed_time": "1 day, 20:38:24", "remaining_time": "5 days, 3:55:05", "throughput": 2717.54, "total_tokens": 436719808} {"current_steps": 2420, "total_steps": 9134, "loss": 0.8221, "learning_rate": 4.1828556081184064e-05, "epoch": 0.26492241166972275, "percentage": 26.49, "elapsed_time": "1 day, 20:39:33", "remaining_time": "5 days, 3:54:06", "throughput": 2717.57, "total_tokens": 436912672} {"current_steps": 2421, "total_steps": 9134, "loss": 0.5469, "learning_rate": 4.1822196292672045e-05, "epoch": 0.26503188374066067, "percentage": 26.51, "elapsed_time": "1 day, 20:40:38", "remaining_time": "5 days, 3:52:55", "throughput": 2717.61, "total_tokens": 437094336} {"current_steps": 2422, "total_steps": 9134, "loss": 0.5706, "learning_rate": 4.1815834514126366e-05, "epoch": 0.2651413558115986, "percentage": 26.52, "elapsed_time": "1 day, 20:41:41", "remaining_time": "5 days, 3:51:41", "throughput": 2717.55, "total_tokens": 437259200} {"current_steps": 2423, "total_steps": 9134, "loss": 0.8705, "learning_rate": 4.180947074629961e-05, "epoch": 0.26525082788253646, "percentage": 26.53, "elapsed_time": "1 day, 20:42:48", "remaining_time": "5 days, 3:50:34", "throughput": 2717.68, "total_tokens": 437459904} {"current_steps": 2424, "total_steps": 9134, "loss": 0.7482, "learning_rate": 4.1803104989944594e-05, "epoch": 0.2653602999534744, "percentage": 26.54, "elapsed_time": "1 day, 20:43:54", "remaining_time": "5 days, 3:49:26", "throughput": 2717.65, "total_tokens": 437634176} {"current_steps": 2425, "total_steps": 9134, "loss": 0.8687, "learning_rate": 4.1796737245814396e-05, "epoch": 0.2654697720244123, "percentage": 26.55, "elapsed_time": "1 day, 20:45:01", "remaining_time": "5 days, 3:48:23", "throughput": 2717.81, "total_tokens": 437843616} {"current_steps": 2426, "total_steps": 9134, "loss": 0.8499, "learning_rate": 4.1790367514662276e-05, "epoch": 0.26557924409535016, "percentage": 26.56, "elapsed_time": "1 day, 20:46:09", "remaining_time": "5 days, 3:47:21", "throughput": 2717.91, "total_tokens": 438044096} {"current_steps": 2427, "total_steps": 9134, "loss": 0.6385, "learning_rate": 4.178399579724178e-05, "epoch": 0.2656887161662881, "percentage": 26.57, "elapsed_time": "1 day, 20:47:12", "remaining_time": "5 days, 3:46:05", "throughput": 2717.77, "total_tokens": 438193280} {"current_steps": 2428, "total_steps": 9134, "loss": 0.6204, "learning_rate": 4.177762209430667e-05, "epoch": 0.26579818823722595, "percentage": 26.58, "elapsed_time": "1 day, 20:48:17", "remaining_time": "5 days, 3:44:55", "throughput": 2717.68, "total_tokens": 438355904} {"current_steps": 2429, "total_steps": 9134, "loss": 0.5386, "learning_rate": 4.177124640661094e-05, "epoch": 0.2659076603081639, "percentage": 26.59, "elapsed_time": "1 day, 20:49:25", "remaining_time": "5 days, 3:43:51", "throughput": 2717.74, "total_tokens": 438549440} {"current_steps": 2430, "total_steps": 9134, "loss": 0.7279, "learning_rate": 4.176486873490882e-05, "epoch": 0.2660171323791018, "percentage": 26.6, "elapsed_time": "1 day, 20:50:30", "remaining_time": "5 days, 3:42:41", "throughput": 2717.76, "total_tokens": 438728864} {"current_steps": 2431, "total_steps": 9134, "loss": 0.8481, "learning_rate": 4.1758489079954774e-05, "epoch": 0.26612660445003966, "percentage": 26.61, "elapsed_time": "1 day, 20:51:34", "remaining_time": "5 days, 3:41:28", "throughput": 2717.76, "total_tokens": 438902464} {"current_steps": 2432, "total_steps": 9134, "loss": 0.6231, "learning_rate": 4.1752107442503505e-05, "epoch": 0.2662360765209776, "percentage": 26.63, "elapsed_time": "1 day, 20:52:35", "remaining_time": "5 days, 3:40:06", "throughput": 2717.67, "total_tokens": 439053888} {"current_steps": 2433, "total_steps": 9134, "loss": 0.7068, "learning_rate": 4.174572382330996e-05, "epoch": 0.2663455485919155, "percentage": 26.64, "elapsed_time": "1 day, 20:53:40", "remaining_time": "5 days, 3:38:57", "throughput": 2717.69, "total_tokens": 439234432} {"current_steps": 2434, "total_steps": 9134, "loss": 0.7253, "learning_rate": 4.1739338223129294e-05, "epoch": 0.26645502066285337, "percentage": 26.65, "elapsed_time": "1 day, 20:54:48", "remaining_time": "5 days, 3:37:55", "throughput": 2717.77, "total_tokens": 439432896} {"current_steps": 2435, "total_steps": 9134, "loss": 0.7188, "learning_rate": 4.1732950642716916e-05, "epoch": 0.2665644927337913, "percentage": 26.66, "elapsed_time": "1 day, 20:55:49", "remaining_time": "5 days, 3:36:33", "throughput": 2717.73, "total_tokens": 439590816} {"current_steps": 2436, "total_steps": 9134, "loss": 0.9017, "learning_rate": 4.1726561082828466e-05, "epoch": 0.2666739648047292, "percentage": 26.67, "elapsed_time": "1 day, 20:56:57", "remaining_time": "5 days, 3:35:30", "throughput": 2717.83, "total_tokens": 439791072} {"current_steps": 2437, "total_steps": 9134, "loss": 0.7513, "learning_rate": 4.172016954421981e-05, "epoch": 0.2667834368756671, "percentage": 26.68, "elapsed_time": "1 day, 20:58:01", "remaining_time": "5 days, 3:34:19", "throughput": 2717.86, "total_tokens": 439971840} {"current_steps": 2438, "total_steps": 9134, "loss": 0.6477, "learning_rate": 4.171377602764707e-05, "epoch": 0.266892908946605, "percentage": 26.69, "elapsed_time": "1 day, 20:59:03", "remaining_time": "5 days, 3:32:59", "throughput": 2717.78, "total_tokens": 440125280} {"current_steps": 2439, "total_steps": 9134, "loss": 0.6648, "learning_rate": 4.170738053386657e-05, "epoch": 0.2670023810175429, "percentage": 26.7, "elapsed_time": "1 day, 21:00:09", "remaining_time": "5 days, 3:31:51", "throughput": 2717.72, "total_tokens": 440295296} {"current_steps": 2440, "total_steps": 9134, "loss": 0.7852, "learning_rate": 4.170098306363489e-05, "epoch": 0.2671118530884808, "percentage": 26.71, "elapsed_time": "1 day, 21:01:17", "remaining_time": "5 days, 3:30:49", "throughput": 2717.75, "total_tokens": 440485472} {"current_steps": 2441, "total_steps": 9134, "loss": 0.6549, "learning_rate": 4.169458361770885e-05, "epoch": 0.2672213251594187, "percentage": 26.72, "elapsed_time": "1 day, 21:02:22", "remaining_time": "5 days, 3:29:39", "throughput": 2717.63, "total_tokens": 440642944} {"current_steps": 2442, "total_steps": 9134, "loss": 0.6812, "learning_rate": 4.168818219684548e-05, "epoch": 0.26733079723035663, "percentage": 26.74, "elapsed_time": "1 day, 21:03:27", "remaining_time": "5 days, 3:28:30", "throughput": 2717.51, "total_tokens": 440801760} {"current_steps": 2443, "total_steps": 9134, "loss": 0.6429, "learning_rate": 4.168177880180205e-05, "epoch": 0.2674402693012945, "percentage": 26.75, "elapsed_time": "1 day, 21:04:31", "remaining_time": "5 days, 3:27:15", "throughput": 2717.59, "total_tokens": 440986336} {"current_steps": 2444, "total_steps": 9134, "loss": 0.7478, "learning_rate": 4.167537343333608e-05, "epoch": 0.2675497413722324, "percentage": 26.76, "elapsed_time": "1 day, 21:05:34", "remaining_time": "5 days, 3:26:01", "throughput": 2717.55, "total_tokens": 441152320} {"current_steps": 2445, "total_steps": 9134, "loss": 0.7742, "learning_rate": 4.166896609220532e-05, "epoch": 0.2676592134431703, "percentage": 26.77, "elapsed_time": "1 day, 21:06:42", "remaining_time": "5 days, 3:24:58", "throughput": 2717.54, "total_tokens": 441335328} {"current_steps": 2446, "total_steps": 9134, "loss": 0.5799, "learning_rate": 4.1662556779167735e-05, "epoch": 0.2677686855141082, "percentage": 26.78, "elapsed_time": "1 day, 21:07:44", "remaining_time": "5 days, 3:23:40", "throughput": 2717.48, "total_tokens": 441495488} {"current_steps": 2447, "total_steps": 9134, "loss": 0.6634, "learning_rate": 4.165614549498152e-05, "epoch": 0.26787815758504613, "percentage": 26.79, "elapsed_time": "1 day, 21:08:50", "remaining_time": "5 days, 3:22:32", "throughput": 2717.6, "total_tokens": 441693280} {"current_steps": 2448, "total_steps": 9134, "loss": 0.7197, "learning_rate": 4.164973224040516e-05, "epoch": 0.267987629655984, "percentage": 26.8, "elapsed_time": "1 day, 21:09:55", "remaining_time": "5 days, 3:21:21", "throughput": 2717.58, "total_tokens": 441866656} {"current_steps": 2449, "total_steps": 9134, "loss": 0.7235, "learning_rate": 4.164331701619729e-05, "epoch": 0.2680971017269219, "percentage": 26.81, "elapsed_time": "1 day, 21:11:04", "remaining_time": "5 days, 3:20:22", "throughput": 2717.55, "total_tokens": 442048768} {"current_steps": 2450, "total_steps": 9134, "loss": 0.6798, "learning_rate": 4.1636899823116835e-05, "epoch": 0.26820657379785984, "percentage": 26.82, "elapsed_time": "1 day, 21:12:08", "remaining_time": "5 days, 3:19:10", "throughput": 2717.49, "total_tokens": 442212960} {"current_steps": 2451, "total_steps": 9134, "loss": 0.7217, "learning_rate": 4.1630480661922935e-05, "epoch": 0.2683160458687977, "percentage": 26.83, "elapsed_time": "1 day, 21:13:12", "remaining_time": "5 days, 3:17:57", "throughput": 2717.36, "total_tokens": 442365728} {"current_steps": 2452, "total_steps": 9134, "loss": 0.7866, "learning_rate": 4.162405953337497e-05, "epoch": 0.2684255179397356, "percentage": 26.84, "elapsed_time": "1 day, 21:14:21", "remaining_time": "5 days, 3:16:57", "throughput": 2717.48, "total_tokens": 442572704} {"current_steps": 2453, "total_steps": 9134, "loss": 0.5574, "learning_rate": 4.161763643823253e-05, "epoch": 0.26853499001067355, "percentage": 26.86, "elapsed_time": "1 day, 21:15:24", "remaining_time": "5 days, 3:15:41", "throughput": 2717.4, "total_tokens": 442731072} {"current_steps": 2454, "total_steps": 9134, "loss": 0.6538, "learning_rate": 4.1611211377255473e-05, "epoch": 0.2686444620816114, "percentage": 26.87, "elapsed_time": "1 day, 21:16:32", "remaining_time": "5 days, 3:14:38", "throughput": 2717.46, "total_tokens": 442924160} {"current_steps": 2455, "total_steps": 9134, "loss": 0.7989, "learning_rate": 4.1604784351203876e-05, "epoch": 0.26875393415254933, "percentage": 26.88, "elapsed_time": "1 day, 21:17:40", "remaining_time": "5 days, 3:13:38", "throughput": 2717.57, "total_tokens": 443128896} {"current_steps": 2456, "total_steps": 9134, "loss": 0.6935, "learning_rate": 4.1598355360838016e-05, "epoch": 0.26886340622348726, "percentage": 26.89, "elapsed_time": "1 day, 21:18:44", "remaining_time": "5 days, 3:12:24", "throughput": 2717.5, "total_tokens": 443291296} {"current_steps": 2457, "total_steps": 9134, "loss": 1.0139, "learning_rate": 4.159192440691846e-05, "epoch": 0.2689728782944251, "percentage": 26.9, "elapsed_time": "1 day, 21:19:52", "remaining_time": "5 days, 3:11:22", "throughput": 2717.6, "total_tokens": 443492672} {"current_steps": 2458, "total_steps": 9134, "loss": 0.6998, "learning_rate": 4.1585491490205965e-05, "epoch": 0.26908235036536304, "percentage": 26.91, "elapsed_time": "1 day, 21:21:00", "remaining_time": "5 days, 3:10:19", "throughput": 2717.59, "total_tokens": 443674560} {"current_steps": 2459, "total_steps": 9134, "loss": 0.7053, "learning_rate": 4.157905661146152e-05, "epoch": 0.26919182243630096, "percentage": 26.92, "elapsed_time": "1 day, 21:22:04", "remaining_time": "5 days, 3:09:08", "throughput": 2717.62, "total_tokens": 443854432} {"current_steps": 2460, "total_steps": 9134, "loss": 0.7108, "learning_rate": 4.157261977144638e-05, "epoch": 0.26930129450723883, "percentage": 26.93, "elapsed_time": "1 day, 21:23:12", "remaining_time": "5 days, 3:08:05", "throughput": 2717.7, "total_tokens": 444051104} {"current_steps": 2461, "total_steps": 9134, "loss": 0.6096, "learning_rate": 4.1566180970922006e-05, "epoch": 0.26941076657817675, "percentage": 26.94, "elapsed_time": "1 day, 21:24:18", "remaining_time": "5 days, 3:06:57", "throughput": 2717.76, "total_tokens": 444240608} {"current_steps": 2462, "total_steps": 9134, "loss": 0.7337, "learning_rate": 4.155974021065009e-05, "epoch": 0.2695202386491146, "percentage": 26.95, "elapsed_time": "1 day, 21:25:24", "remaining_time": "5 days, 3:05:50", "throughput": 2717.8, "total_tokens": 444428096} {"current_steps": 2463, "total_steps": 9134, "loss": 0.71, "learning_rate": 4.1553297491392564e-05, "epoch": 0.26962971072005254, "percentage": 26.97, "elapsed_time": "1 day, 21:26:32", "remaining_time": "5 days, 3:04:48", "throughput": 2717.71, "total_tokens": 444596992} {"current_steps": 2464, "total_steps": 9134, "loss": 0.6077, "learning_rate": 4.154685281391158e-05, "epoch": 0.26973918279099046, "percentage": 26.98, "elapsed_time": "1 day, 21:27:40", "remaining_time": "5 days, 3:03:45", "throughput": 2717.83, "total_tokens": 444800608} {"current_steps": 2465, "total_steps": 9134, "loss": 0.8101, "learning_rate": 4.1540406178969553e-05, "epoch": 0.2698486548619283, "percentage": 26.99, "elapsed_time": "1 day, 21:28:44", "remaining_time": "5 days, 3:02:33", "throughput": 2717.75, "total_tokens": 444963456} {"current_steps": 2466, "total_steps": 9134, "loss": 0.5022, "learning_rate": 4.153395758732909e-05, "epoch": 0.26995812693286625, "percentage": 27.0, "elapsed_time": "1 day, 21:29:45", "remaining_time": "5 days, 3:01:10", "throughput": 2717.68, "total_tokens": 445115104} {"current_steps": 2467, "total_steps": 9134, "loss": 0.8127, "learning_rate": 4.152750703975305e-05, "epoch": 0.27006759900380417, "percentage": 27.01, "elapsed_time": "1 day, 21:30:52", "remaining_time": "5 days, 3:00:06", "throughput": 2717.79, "total_tokens": 445315136} {"current_steps": 2468, "total_steps": 9134, "loss": 0.8784, "learning_rate": 4.152105453700452e-05, "epoch": 0.27017707107474204, "percentage": 27.02, "elapsed_time": "1 day, 21:32:01", "remaining_time": "5 days, 2:59:06", "throughput": 2717.96, "total_tokens": 445531072} {"current_steps": 2469, "total_steps": 9134, "loss": 0.7166, "learning_rate": 4.151460007984683e-05, "epoch": 0.27028654314567996, "percentage": 27.03, "elapsed_time": "1 day, 21:33:08", "remaining_time": "5 days, 2:58:01", "throughput": 2717.9, "total_tokens": 445703104} {"current_steps": 2470, "total_steps": 9134, "loss": 0.7559, "learning_rate": 4.150814366904352e-05, "epoch": 0.2703960152166179, "percentage": 27.04, "elapsed_time": "1 day, 21:34:13", "remaining_time": "5 days, 2:56:53", "throughput": 2717.71, "total_tokens": 445850720} {"current_steps": 2471, "total_steps": 9134, "loss": 0.7502, "learning_rate": 4.150168530535837e-05, "epoch": 0.27050548728755575, "percentage": 27.05, "elapsed_time": "1 day, 21:35:18", "remaining_time": "5 days, 2:55:43", "throughput": 2717.76, "total_tokens": 446035744} {"current_steps": 2472, "total_steps": 9134, "loss": 0.6764, "learning_rate": 4.149522498955539e-05, "epoch": 0.27061495935849367, "percentage": 27.06, "elapsed_time": "1 day, 21:36:27", "remaining_time": "5 days, 2:54:41", "throughput": 2717.82, "total_tokens": 446230624} {"current_steps": 2473, "total_steps": 9134, "loss": 0.7967, "learning_rate": 4.148876272239883e-05, "epoch": 0.2707244314294316, "percentage": 27.07, "elapsed_time": "1 day, 21:37:31", "remaining_time": "5 days, 2:53:30", "throughput": 2717.86, "total_tokens": 446413856} {"current_steps": 2474, "total_steps": 9134, "loss": 0.6252, "learning_rate": 4.148229850465316e-05, "epoch": 0.27083390350036946, "percentage": 27.09, "elapsed_time": "1 day, 21:38:38", "remaining_time": "5 days, 2:52:24", "throughput": 2717.89, "total_tokens": 446599104} {"current_steps": 2475, "total_steps": 9134, "loss": 0.6244, "learning_rate": 4.1475832337083085e-05, "epoch": 0.2709433755713074, "percentage": 27.1, "elapsed_time": "1 day, 21:39:43", "remaining_time": "5 days, 2:51:14", "throughput": 2717.9, "total_tokens": 446778304} {"current_steps": 2476, "total_steps": 9134, "loss": 0.714, "learning_rate": 4.1469364220453546e-05, "epoch": 0.2710528476422453, "percentage": 27.11, "elapsed_time": "1 day, 21:40:48", "remaining_time": "5 days, 2:50:04", "throughput": 2717.96, "total_tokens": 446964224} {"current_steps": 2477, "total_steps": 9134, "loss": 0.9179, "learning_rate": 4.1462894155529706e-05, "epoch": 0.27116231971318316, "percentage": 27.12, "elapsed_time": "1 day, 21:41:52", "remaining_time": "5 days, 2:48:52", "throughput": 2717.91, "total_tokens": 447130880} {"current_steps": 2478, "total_steps": 9134, "loss": 0.6579, "learning_rate": 4.145642214307695e-05, "epoch": 0.2712717917841211, "percentage": 27.13, "elapsed_time": "1 day, 21:42:58", "remaining_time": "5 days, 2:47:44", "throughput": 2718.04, "total_tokens": 447331136} {"current_steps": 2479, "total_steps": 9134, "loss": 0.5765, "learning_rate": 4.144994818386092e-05, "epoch": 0.27138126385505895, "percentage": 27.14, "elapsed_time": "1 day, 21:44:05", "remaining_time": "5 days, 2:46:40", "throughput": 2718.03, "total_tokens": 447512576} {"current_steps": 2480, "total_steps": 9134, "loss": 0.6908, "learning_rate": 4.144347227864747e-05, "epoch": 0.2714907359259969, "percentage": 27.15, "elapsed_time": "1 day, 21:45:12", "remaining_time": "5 days, 2:45:35", "throughput": 2718.06, "total_tokens": 447699616} {"current_steps": 2481, "total_steps": 9134, "loss": 0.7807, "learning_rate": 4.1436994428202667e-05, "epoch": 0.2716002079969348, "percentage": 27.16, "elapsed_time": "1 day, 21:46:17", "remaining_time": "5 days, 2:44:23", "throughput": 2717.98, "total_tokens": 447861120} {"current_steps": 2482, "total_steps": 9134, "loss": 0.6498, "learning_rate": 4.143051463329286e-05, "epoch": 0.27170968006787266, "percentage": 27.17, "elapsed_time": "1 day, 21:47:21", "remaining_time": "5 days, 2:43:11", "throughput": 2717.87, "total_tokens": 448017696} {"current_steps": 2483, "total_steps": 9134, "loss": 0.6461, "learning_rate": 4.1424032894684584e-05, "epoch": 0.2718191521388106, "percentage": 27.18, "elapsed_time": "1 day, 21:48:26", "remaining_time": "5 days, 2:41:59", "throughput": 2717.69, "total_tokens": 448163520} {"current_steps": 2484, "total_steps": 9134, "loss": 0.5423, "learning_rate": 4.141754921314461e-05, "epoch": 0.2719286242097485, "percentage": 27.2, "elapsed_time": "1 day, 21:49:32", "remaining_time": "5 days, 2:40:53", "throughput": 2717.72, "total_tokens": 448348768} {"current_steps": 2485, "total_steps": 9134, "loss": 0.8305, "learning_rate": 4.141106358943995e-05, "epoch": 0.27203809628068637, "percentage": 27.21, "elapsed_time": "1 day, 21:50:40", "remaining_time": "5 days, 2:39:52", "throughput": 2717.86, "total_tokens": 448559104} {"current_steps": 2486, "total_steps": 9134, "loss": 0.7723, "learning_rate": 4.140457602433784e-05, "epoch": 0.2721475683516243, "percentage": 27.22, "elapsed_time": "1 day, 21:51:49", "remaining_time": "5 days, 2:38:52", "throughput": 2717.87, "total_tokens": 448746816} {"current_steps": 2487, "total_steps": 9134, "loss": 0.7453, "learning_rate": 4.139808651860574e-05, "epoch": 0.2722570404225622, "percentage": 27.23, "elapsed_time": "1 day, 21:52:52", "remaining_time": "5 days, 2:37:37", "throughput": 2717.83, "total_tokens": 448911232} {"current_steps": 2488, "total_steps": 9134, "loss": 0.5576, "learning_rate": 4.139159507301136e-05, "epoch": 0.2723665124935001, "percentage": 27.24, "elapsed_time": "1 day, 21:54:01", "remaining_time": "5 days, 2:36:37", "throughput": 2717.78, "total_tokens": 449090880} {"current_steps": 2489, "total_steps": 9134, "loss": 0.8987, "learning_rate": 4.138510168832261e-05, "epoch": 0.272475984564438, "percentage": 27.25, "elapsed_time": "1 day, 21:55:09", "remaining_time": "5 days, 2:35:33", "throughput": 2717.8, "total_tokens": 449277472} {"current_steps": 2490, "total_steps": 9134, "loss": 0.7678, "learning_rate": 4.137860636530766e-05, "epoch": 0.2725854566353759, "percentage": 27.26, "elapsed_time": "1 day, 21:56:16", "remaining_time": "5 days, 2:34:29", "throughput": 2717.89, "total_tokens": 449475936} {"current_steps": 2491, "total_steps": 9134, "loss": 0.7396, "learning_rate": 4.1372109104734886e-05, "epoch": 0.2726949287063138, "percentage": 27.27, "elapsed_time": "1 day, 21:57:25", "remaining_time": "5 days, 2:33:30", "throughput": 2718.02, "total_tokens": 449685152} {"current_steps": 2492, "total_steps": 9134, "loss": 0.6865, "learning_rate": 4.1365609907372905e-05, "epoch": 0.2728044007772517, "percentage": 27.28, "elapsed_time": "1 day, 21:58:27", "remaining_time": "5 days, 2:32:13", "throughput": 2717.9, "total_tokens": 449833664} {"current_steps": 2493, "total_steps": 9134, "loss": 0.6291, "learning_rate": 4.135910877399055e-05, "epoch": 0.27291387284818963, "percentage": 27.29, "elapsed_time": "1 day, 21:59:33", "remaining_time": "5 days, 2:31:04", "throughput": 2717.9, "total_tokens": 450011968} {"current_steps": 2494, "total_steps": 9134, "loss": 0.6542, "learning_rate": 4.13526057053569e-05, "epoch": 0.2730233449191275, "percentage": 27.3, "elapsed_time": "1 day, 22:00:40", "remaining_time": "5 days, 2:29:59", "throughput": 2717.91, "total_tokens": 450195424} {"current_steps": 2495, "total_steps": 9134, "loss": 0.7338, "learning_rate": 4.134610070224127e-05, "epoch": 0.2731328169900654, "percentage": 27.32, "elapsed_time": "1 day, 22:01:43", "remaining_time": "5 days, 2:28:43", "throughput": 2717.87, "total_tokens": 450359616} {"current_steps": 2496, "total_steps": 9134, "loss": 0.6666, "learning_rate": 4.133959376541317e-05, "epoch": 0.2732422890610033, "percentage": 27.33, "elapsed_time": "1 day, 22:02:45", "remaining_time": "5 days, 2:27:25", "throughput": 2717.92, "total_tokens": 450537248} {"current_steps": 2497, "total_steps": 9134, "loss": 0.6672, "learning_rate": 4.133308489564236e-05, "epoch": 0.2733517611319412, "percentage": 27.34, "elapsed_time": "1 day, 22:03:53", "remaining_time": "5 days, 2:26:23", "throughput": 2717.89, "total_tokens": 450717120} {"current_steps": 2498, "total_steps": 9134, "loss": 0.8104, "learning_rate": 4.132657409369883e-05, "epoch": 0.27346123320287913, "percentage": 27.35, "elapsed_time": "1 day, 22:05:02", "remaining_time": "5 days, 2:25:23", "throughput": 2717.72, "total_tokens": 450876832} {"current_steps": 2499, "total_steps": 9134, "loss": 0.8793, "learning_rate": 4.1320061360352804e-05, "epoch": 0.273570705273817, "percentage": 27.36, "elapsed_time": "1 day, 22:06:07", "remaining_time": "5 days, 2:24:14", "throughput": 2717.78, "total_tokens": 451063872} {"current_steps": 2500, "total_steps": 9134, "loss": 0.7204, "learning_rate": 4.13135466963747e-05, "epoch": 0.2736801773447549, "percentage": 27.37, "elapsed_time": "1 day, 22:07:14", "remaining_time": "5 days, 2:23:07", "throughput": 2717.7, "total_tokens": 451229856} {"current_steps": 2501, "total_steps": 9134, "loss": 0.6425, "learning_rate": 4.130703010253523e-05, "epoch": 0.27378964941569284, "percentage": 27.38, "elapsed_time": "1 day, 22:08:15", "remaining_time": "5 days, 2:21:49", "throughput": 2717.67, "total_tokens": 451394272} {"current_steps": 2502, "total_steps": 9134, "loss": 0.6298, "learning_rate": 4.130051157960526e-05, "epoch": 0.2738991214866307, "percentage": 27.39, "elapsed_time": "1 day, 22:09:22", "remaining_time": "5 days, 2:20:42", "throughput": 2717.7, "total_tokens": 451577952} {"current_steps": 2503, "total_steps": 9134, "loss": 0.5696, "learning_rate": 4.1293991128355934e-05, "epoch": 0.2740085935575686, "percentage": 27.4, "elapsed_time": "1 day, 22:10:26", "remaining_time": "5 days, 2:19:30", "throughput": 2717.74, "total_tokens": 451759392} {"current_steps": 2504, "total_steps": 9134, "loss": 0.6699, "learning_rate": 4.12874687495586e-05, "epoch": 0.27411806562850655, "percentage": 27.41, "elapsed_time": "1 day, 22:11:35", "remaining_time": "5 days, 2:18:32", "throughput": 2717.92, "total_tokens": 451978240} {"current_steps": 2505, "total_steps": 9134, "loss": 0.7837, "learning_rate": 4.128094444398486e-05, "epoch": 0.2742275376994444, "percentage": 27.43, "elapsed_time": "1 day, 22:12:44", "remaining_time": "5 days, 2:17:32", "throughput": 2718.15, "total_tokens": 452204480} {"current_steps": 2506, "total_steps": 9134, "loss": 0.7288, "learning_rate": 4.127441821240651e-05, "epoch": 0.27433700977038233, "percentage": 27.44, "elapsed_time": "1 day, 22:13:50", "remaining_time": "5 days, 2:16:23", "throughput": 2718.12, "total_tokens": 452376960} {"current_steps": 2507, "total_steps": 9134, "loss": 0.6966, "learning_rate": 4.12678900555956e-05, "epoch": 0.27444648184132026, "percentage": 27.45, "elapsed_time": "1 day, 22:14:55", "remaining_time": "5 days, 2:15:14", "throughput": 2718.18, "total_tokens": 452565344} {"current_steps": 2508, "total_steps": 9134, "loss": 0.5866, "learning_rate": 4.1261359974324387e-05, "epoch": 0.2745559539122581, "percentage": 27.46, "elapsed_time": "1 day, 22:16:04", "remaining_time": "5 days, 2:14:13", "throughput": 2718.22, "total_tokens": 452757984} {"current_steps": 2509, "total_steps": 9134, "loss": 0.913, "learning_rate": 4.1254827969365387e-05, "epoch": 0.27466542598319604, "percentage": 27.47, "elapsed_time": "1 day, 22:17:12", "remaining_time": "5 days, 2:13:12", "throughput": 2718.28, "total_tokens": 452954880} {"current_steps": 2510, "total_steps": 9134, "loss": 0.6852, "learning_rate": 4.1248294041491306e-05, "epoch": 0.27477489805413396, "percentage": 27.48, "elapsed_time": "1 day, 22:18:20", "remaining_time": "5 days, 2:12:10", "throughput": 2718.37, "total_tokens": 453153792} {"current_steps": 2511, "total_steps": 9134, "loss": 0.7437, "learning_rate": 4.12417581914751e-05, "epoch": 0.27488437012507183, "percentage": 27.49, "elapsed_time": "1 day, 22:19:24", "remaining_time": "5 days, 2:10:58", "throughput": 2718.32, "total_tokens": 453320224} {"current_steps": 2512, "total_steps": 9134, "loss": 0.7121, "learning_rate": 4.123522042008996e-05, "epoch": 0.27499384219600975, "percentage": 27.5, "elapsed_time": "1 day, 22:20:26", "remaining_time": "5 days, 2:09:39", "throughput": 2718.3, "total_tokens": 453485760} {"current_steps": 2513, "total_steps": 9134, "loss": 0.7123, "learning_rate": 4.122868072810927e-05, "epoch": 0.2751033142669476, "percentage": 27.51, "elapsed_time": "1 day, 22:21:33", "remaining_time": "5 days, 2:08:33", "throughput": 2718.41, "total_tokens": 453683776} {"current_steps": 2514, "total_steps": 9134, "loss": 0.644, "learning_rate": 4.122213911630667e-05, "epoch": 0.27521278633788554, "percentage": 27.52, "elapsed_time": "1 day, 22:22:39", "remaining_time": "5 days, 2:07:27", "throughput": 2718.43, "total_tokens": 453868576} {"current_steps": 2515, "total_steps": 9134, "loss": 0.7475, "learning_rate": 4.121559558545603e-05, "epoch": 0.27532225840882346, "percentage": 27.53, "elapsed_time": "1 day, 22:23:48", "remaining_time": "5 days, 2:06:27", "throughput": 2718.54, "total_tokens": 454073760} {"current_steps": 2516, "total_steps": 9134, "loss": 0.6714, "learning_rate": 4.120905013633143e-05, "epoch": 0.2754317304797613, "percentage": 27.55, "elapsed_time": "1 day, 22:24:54", "remaining_time": "5 days, 2:05:18", "throughput": 2718.51, "total_tokens": 454247136} {"current_steps": 2517, "total_steps": 9134, "loss": 0.7585, "learning_rate": 4.1202502769707184e-05, "epoch": 0.27554120255069925, "percentage": 27.56, "elapsed_time": "1 day, 22:25:57", "remaining_time": "5 days, 2:04:03", "throughput": 2718.44, "total_tokens": 454406400} {"current_steps": 2518, "total_steps": 9134, "loss": 0.6338, "learning_rate": 4.119595348635784e-05, "epoch": 0.27565067462163717, "percentage": 27.57, "elapsed_time": "1 day, 22:27:00", "remaining_time": "5 days, 2:02:49", "throughput": 2718.46, "total_tokens": 454582912} {"current_steps": 2519, "total_steps": 9134, "loss": 0.8511, "learning_rate": 4.118940228705815e-05, "epoch": 0.27576014669257504, "percentage": 27.58, "elapsed_time": "1 day, 22:28:07", "remaining_time": "5 days, 2:01:44", "throughput": 2718.47, "total_tokens": 454765472} {"current_steps": 2520, "total_steps": 9134, "loss": 0.9503, "learning_rate": 4.1182849172583135e-05, "epoch": 0.27586961876351296, "percentage": 27.59, "elapsed_time": "1 day, 22:29:16", "remaining_time": "5 days, 2:00:44", "throughput": 2718.61, "total_tokens": 454977152} {"current_steps": 2521, "total_steps": 9134, "loss": 0.6124, "learning_rate": 4.117629414370799e-05, "epoch": 0.2759790908344509, "percentage": 27.6, "elapsed_time": "1 day, 22:30:24", "remaining_time": "5 days, 1:59:42", "throughput": 2718.6, "total_tokens": 455160832} {"current_steps": 2522, "total_steps": 9134, "loss": 0.7638, "learning_rate": 4.116973720120817e-05, "epoch": 0.27608856290538875, "percentage": 27.61, "elapsed_time": "1 day, 22:31:30", "remaining_time": "5 days, 1:58:33", "throughput": 2718.66, "total_tokens": 455349440} {"current_steps": 2523, "total_steps": 9134, "loss": 0.5594, "learning_rate": 4.116317834585935e-05, "epoch": 0.27619803497632667, "percentage": 27.62, "elapsed_time": "1 day, 22:32:34", "remaining_time": "5 days, 1:57:22", "throughput": 2718.6, "total_tokens": 455513184} {"current_steps": 2524, "total_steps": 9134, "loss": 0.7322, "learning_rate": 4.115661757843743e-05, "epoch": 0.2763075070472646, "percentage": 27.63, "elapsed_time": "1 day, 22:33:40", "remaining_time": "5 days, 1:56:15", "throughput": 2718.67, "total_tokens": 455706272} {"current_steps": 2525, "total_steps": 9134, "loss": 0.7606, "learning_rate": 4.115005489971854e-05, "epoch": 0.27641697911820245, "percentage": 27.64, "elapsed_time": "1 day, 22:34:49", "remaining_time": "5 days, 1:55:14", "throughput": 2718.71, "total_tokens": 455899136} {"current_steps": 2526, "total_steps": 9134, "loss": 0.8265, "learning_rate": 4.114349031047903e-05, "epoch": 0.2765264511891404, "percentage": 27.65, "elapsed_time": "1 day, 22:35:56", "remaining_time": "5 days, 1:54:10", "throughput": 2718.7, "total_tokens": 456079680} {"current_steps": 2527, "total_steps": 9134, "loss": 0.7435, "learning_rate": 4.1136923811495475e-05, "epoch": 0.2766359232600783, "percentage": 27.67, "elapsed_time": "1 day, 22:37:04", "remaining_time": "5 days, 1:53:06", "throughput": 2718.78, "total_tokens": 456276128} {"current_steps": 2528, "total_steps": 9134, "loss": 0.5567, "learning_rate": 4.1130355403544675e-05, "epoch": 0.27674539533101616, "percentage": 27.68, "elapsed_time": "1 day, 22:38:09", "remaining_time": "5 days, 1:51:57", "throughput": 2718.86, "total_tokens": 456467872} {"current_steps": 2529, "total_steps": 9134, "loss": 0.6926, "learning_rate": 4.1123785087403676e-05, "epoch": 0.2768548674019541, "percentage": 27.69, "elapsed_time": "1 day, 22:39:17", "remaining_time": "5 days, 1:50:54", "throughput": 2718.97, "total_tokens": 456671264} {"current_steps": 2530, "total_steps": 9134, "loss": 0.6822, "learning_rate": 4.111721286384972e-05, "epoch": 0.27696433947289195, "percentage": 27.7, "elapsed_time": "1 day, 22:40:23", "remaining_time": "5 days, 1:49:47", "throughput": 2719.0, "total_tokens": 456855616} {"current_steps": 2531, "total_steps": 9134, "loss": 0.6777, "learning_rate": 4.1110638733660294e-05, "epoch": 0.2770738115438299, "percentage": 27.71, "elapsed_time": "1 day, 22:41:25", "remaining_time": "5 days, 1:48:29", "throughput": 2718.93, "total_tokens": 457012864} {"current_steps": 2532, "total_steps": 9134, "loss": 1.0981, "learning_rate": 4.110406269761311e-05, "epoch": 0.2771832836147678, "percentage": 27.72, "elapsed_time": "1 day, 22:42:34", "remaining_time": "5 days, 1:47:29", "throughput": 2719.15, "total_tokens": 457236416} {"current_steps": 2533, "total_steps": 9134, "loss": 0.6851, "learning_rate": 4.109748475648609e-05, "epoch": 0.27729275568570566, "percentage": 27.73, "elapsed_time": "1 day, 22:43:37", "remaining_time": "5 days, 1:46:14", "throughput": 2719.09, "total_tokens": 457399040} {"current_steps": 2534, "total_steps": 9134, "loss": 0.6021, "learning_rate": 4.109090491105739e-05, "epoch": 0.2774022277566436, "percentage": 27.74, "elapsed_time": "1 day, 22:44:39", "remaining_time": "5 days, 1:44:57", "throughput": 2719.09, "total_tokens": 457568160} {"current_steps": 2535, "total_steps": 9134, "loss": 0.6856, "learning_rate": 4.108432316210541e-05, "epoch": 0.2775116998275815, "percentage": 27.75, "elapsed_time": "1 day, 22:45:44", "remaining_time": "5 days, 1:43:48", "throughput": 2719.07, "total_tokens": 457742208} {"current_steps": 2536, "total_steps": 9134, "loss": 0.9781, "learning_rate": 4.107773951040874e-05, "epoch": 0.27762117189851937, "percentage": 27.76, "elapsed_time": "1 day, 22:46:52", "remaining_time": "5 days, 1:42:43", "throughput": 2719.14, "total_tokens": 457935744} {"current_steps": 2537, "total_steps": 9134, "loss": 0.9058, "learning_rate": 4.107115395674623e-05, "epoch": 0.2777306439694573, "percentage": 27.78, "elapsed_time": "1 day, 22:47:56", "remaining_time": "5 days, 1:41:32", "throughput": 2719.12, "total_tokens": 458108000} {"current_steps": 2538, "total_steps": 9134, "loss": 0.7031, "learning_rate": 4.1064566501896925e-05, "epoch": 0.2778401160403952, "percentage": 27.79, "elapsed_time": "1 day, 22:49:01", "remaining_time": "5 days, 1:40:22", "throughput": 2719.07, "total_tokens": 458277344} {"current_steps": 2539, "total_steps": 9134, "loss": 0.7866, "learning_rate": 4.1057977146640115e-05, "epoch": 0.2779495881113331, "percentage": 27.8, "elapsed_time": "1 day, 22:50:10", "remaining_time": "5 days, 1:39:22", "throughput": 2719.08, "total_tokens": 458465504} {"current_steps": 2540, "total_steps": 9134, "loss": 0.6235, "learning_rate": 4.10513858917553e-05, "epoch": 0.278059060182271, "percentage": 27.81, "elapsed_time": "1 day, 22:51:16", "remaining_time": "5 days, 1:38:14", "throughput": 2719.17, "total_tokens": 458659712} {"current_steps": 2541, "total_steps": 9134, "loss": 0.5307, "learning_rate": 4.104479273802222e-05, "epoch": 0.2781685322532089, "percentage": 27.82, "elapsed_time": "1 day, 22:52:23", "remaining_time": "5 days, 1:37:10", "throughput": 2719.18, "total_tokens": 458844288} {"current_steps": 2542, "total_steps": 9134, "loss": 0.6158, "learning_rate": 4.1038197686220837e-05, "epoch": 0.2782780043241468, "percentage": 27.83, "elapsed_time": "1 day, 22:53:30", "remaining_time": "5 days, 1:36:05", "throughput": 2719.25, "total_tokens": 459038272} {"current_steps": 2543, "total_steps": 9134, "loss": 0.8242, "learning_rate": 4.1031600737131326e-05, "epoch": 0.2783874763950847, "percentage": 27.84, "elapsed_time": "1 day, 22:54:37", "remaining_time": "5 days, 1:35:00", "throughput": 2719.4, "total_tokens": 459245696} {"current_steps": 2544, "total_steps": 9134, "loss": 0.7983, "learning_rate": 4.102500189153409e-05, "epoch": 0.27849694846602263, "percentage": 27.85, "elapsed_time": "1 day, 22:55:43", "remaining_time": "5 days, 1:33:53", "throughput": 2719.48, "total_tokens": 459439008} {"current_steps": 2545, "total_steps": 9134, "loss": 0.5546, "learning_rate": 4.1018401150209776e-05, "epoch": 0.2786064205369605, "percentage": 27.86, "elapsed_time": "1 day, 22:56:47", "remaining_time": "5 days, 1:32:40", "throughput": 2719.47, "total_tokens": 459610816} {"current_steps": 2546, "total_steps": 9134, "loss": 0.5729, "learning_rate": 4.101179851393921e-05, "epoch": 0.2787158926078984, "percentage": 27.87, "elapsed_time": "1 day, 22:57:53", "remaining_time": "5 days, 1:31:32", "throughput": 2719.43, "total_tokens": 459783072} {"current_steps": 2547, "total_steps": 9134, "loss": 0.5532, "learning_rate": 4.100519398350351e-05, "epoch": 0.2788253646788363, "percentage": 27.88, "elapsed_time": "1 day, 22:58:57", "remaining_time": "5 days, 1:30:19", "throughput": 2719.4, "total_tokens": 459951296} {"current_steps": 2548, "total_steps": 9134, "loss": 0.8026, "learning_rate": 4.099858755968394e-05, "epoch": 0.2789348367497742, "percentage": 27.9, "elapsed_time": "1 day, 23:00:04", "remaining_time": "5 days, 1:29:16", "throughput": 2719.32, "total_tokens": 460122880} {"current_steps": 2549, "total_steps": 9134, "loss": 0.7547, "learning_rate": 4.0991979243262054e-05, "epoch": 0.27904430882071213, "percentage": 27.91, "elapsed_time": "1 day, 23:01:10", "remaining_time": "5 days, 1:28:08", "throughput": 2719.26, "total_tokens": 460291552} {"current_steps": 2550, "total_steps": 9134, "loss": 0.8274, "learning_rate": 4.09853690350196e-05, "epoch": 0.27915378089165, "percentage": 27.92, "elapsed_time": "1 day, 23:02:19", "remaining_time": "5 days, 1:27:08", "throughput": 2719.22, "total_tokens": 460471648} {"current_steps": 2551, "total_steps": 9134, "loss": 0.659, "learning_rate": 4.097875693573854e-05, "epoch": 0.2792632529625879, "percentage": 27.93, "elapsed_time": "1 day, 23:03:24", "remaining_time": "5 days, 1:25:57", "throughput": 2719.24, "total_tokens": 460651520} {"current_steps": 2552, "total_steps": 9134, "loss": 0.6332, "learning_rate": 4.0972142946201086e-05, "epoch": 0.27937272503352584, "percentage": 27.94, "elapsed_time": "1 day, 23:04:29", "remaining_time": "5 days, 1:24:48", "throughput": 2719.26, "total_tokens": 460831392} {"current_steps": 2553, "total_steps": 9134, "loss": 0.6982, "learning_rate": 4.0965527067189655e-05, "epoch": 0.2794821971044637, "percentage": 27.95, "elapsed_time": "1 day, 23:05:37", "remaining_time": "5 days, 1:23:45", "throughput": 2719.32, "total_tokens": 461026272} {"current_steps": 2554, "total_steps": 9134, "loss": 0.8168, "learning_rate": 4.095890929948689e-05, "epoch": 0.2795916691754016, "percentage": 27.96, "elapsed_time": "1 day, 23:06:40", "remaining_time": "5 days, 1:22:31", "throughput": 2719.35, "total_tokens": 461203904} {"current_steps": 2555, "total_steps": 9134, "loss": 0.6863, "learning_rate": 4.095228964387566e-05, "epoch": 0.27970114124633955, "percentage": 27.97, "elapsed_time": "1 day, 23:07:45", "remaining_time": "5 days, 1:21:20", "throughput": 2719.34, "total_tokens": 461378624} {"current_steps": 2556, "total_steps": 9134, "loss": 0.822, "learning_rate": 4.094566810113907e-05, "epoch": 0.2798106133172774, "percentage": 27.98, "elapsed_time": "1 day, 23:08:52", "remaining_time": "5 days, 1:20:15", "throughput": 2719.31, "total_tokens": 461555360} {"current_steps": 2557, "total_steps": 9134, "loss": 0.7704, "learning_rate": 4.0939044672060426e-05, "epoch": 0.27992008538821533, "percentage": 27.99, "elapsed_time": "1 day, 23:09:58", "remaining_time": "5 days, 1:19:09", "throughput": 2719.34, "total_tokens": 461741056} {"current_steps": 2558, "total_steps": 9134, "loss": 0.647, "learning_rate": 4.093241935742326e-05, "epoch": 0.28002955745915326, "percentage": 28.01, "elapsed_time": "1 day, 23:11:05", "remaining_time": "5 days, 1:18:03", "throughput": 2719.42, "total_tokens": 461936832} {"current_steps": 2559, "total_steps": 9134, "loss": 0.6284, "learning_rate": 4.0925792158011345e-05, "epoch": 0.2801390295300911, "percentage": 28.02, "elapsed_time": "1 day, 23:12:07", "remaining_time": "5 days, 1:16:46", "throughput": 2719.38, "total_tokens": 462098112} {"current_steps": 2560, "total_steps": 9134, "loss": 0.679, "learning_rate": 4.091916307460866e-05, "epoch": 0.28024850160102904, "percentage": 28.03, "elapsed_time": "1 day, 23:13:14", "remaining_time": "5 days, 1:15:39", "throughput": 2719.32, "total_tokens": 462267680} {"current_steps": 2561, "total_steps": 9134, "loss": 0.7662, "learning_rate": 4.091253210799942e-05, "epoch": 0.28035797367196696, "percentage": 28.04, "elapsed_time": "1 day, 23:14:22", "remaining_time": "5 days, 1:14:37", "throughput": 2719.44, "total_tokens": 462473760} {"current_steps": 2562, "total_steps": 9134, "loss": 0.8217, "learning_rate": 4.0905899258968046e-05, "epoch": 0.28046744574290483, "percentage": 28.05, "elapsed_time": "1 day, 23:15:30", "remaining_time": "5 days, 1:13:36", "throughput": 2719.5, "total_tokens": 462670432} {"current_steps": 2563, "total_steps": 9134, "loss": 0.7336, "learning_rate": 4.08992645282992e-05, "epoch": 0.28057691781384275, "percentage": 28.06, "elapsed_time": "1 day, 23:16:38", "remaining_time": "5 days, 1:12:34", "throughput": 2719.62, "total_tokens": 462876736} {"current_steps": 2564, "total_steps": 9134, "loss": 0.7736, "learning_rate": 4.089262791677775e-05, "epoch": 0.2806863898847806, "percentage": 28.07, "elapsed_time": "1 day, 23:17:41", "remaining_time": "5 days, 1:11:18", "throughput": 2719.53, "total_tokens": 463031744} {"current_steps": 2565, "total_steps": 9134, "loss": 0.56, "learning_rate": 4.0885989425188806e-05, "epoch": 0.28079586195571854, "percentage": 28.08, "elapsed_time": "1 day, 23:18:47", "remaining_time": "5 days, 1:10:10", "throughput": 2719.59, "total_tokens": 463221024} {"current_steps": 2566, "total_steps": 9134, "loss": 0.7438, "learning_rate": 4.087934905431768e-05, "epoch": 0.28090533402665646, "percentage": 28.09, "elapsed_time": "1 day, 23:19:52", "remaining_time": "5 days, 1:09:00", "throughput": 2719.67, "total_tokens": 463410528} {"current_steps": 2567, "total_steps": 9134, "loss": 0.7131, "learning_rate": 4.087270680494992e-05, "epoch": 0.2810148060975943, "percentage": 28.1, "elapsed_time": "1 day, 23:20:58", "remaining_time": "5 days, 1:07:52", "throughput": 2719.79, "total_tokens": 463609440} {"current_steps": 2568, "total_steps": 9134, "loss": 0.8143, "learning_rate": 4.086606267787128e-05, "epoch": 0.28112427816853225, "percentage": 28.11, "elapsed_time": "1 day, 23:22:07", "remaining_time": "5 days, 1:06:52", "throughput": 2719.8, "total_tokens": 463799616} {"current_steps": 2569, "total_steps": 9134, "loss": 0.6703, "learning_rate": 4.0859416673867755e-05, "epoch": 0.28123375023947017, "percentage": 28.13, "elapsed_time": "1 day, 23:23:10", "remaining_time": "5 days, 1:05:39", "throughput": 2719.67, "total_tokens": 463951040} {"current_steps": 2570, "total_steps": 9134, "loss": 0.8107, "learning_rate": 4.085276879372557e-05, "epoch": 0.28134322231040804, "percentage": 28.14, "elapsed_time": "1 day, 23:24:15", "remaining_time": "5 days, 1:04:29", "throughput": 2719.76, "total_tokens": 464143008} {"current_steps": 2571, "total_steps": 9134, "loss": 0.842, "learning_rate": 4.084611903823113e-05, "epoch": 0.28145269438134596, "percentage": 28.15, "elapsed_time": "1 day, 23:25:19", "remaining_time": "5 days, 1:03:17", "throughput": 2719.61, "total_tokens": 464292192} {"current_steps": 2572, "total_steps": 9134, "loss": 0.7741, "learning_rate": 4.083946740817111e-05, "epoch": 0.2815621664522839, "percentage": 28.16, "elapsed_time": "1 day, 23:26:23", "remaining_time": "5 days, 1:02:04", "throughput": 2719.51, "total_tokens": 464448992} {"current_steps": 2573, "total_steps": 9134, "loss": 0.9608, "learning_rate": 4.083281390433236e-05, "epoch": 0.28167163852322175, "percentage": 28.17, "elapsed_time": "1 day, 23:27:31", "remaining_time": "5 days, 1:01:02", "throughput": 2719.65, "total_tokens": 464658208} {"current_steps": 2574, "total_steps": 9134, "loss": 0.7138, "learning_rate": 4.0826158527502e-05, "epoch": 0.28178111059415967, "percentage": 28.18, "elapsed_time": "1 day, 23:28:37", "remaining_time": "5 days, 0:59:54", "throughput": 2719.49, "total_tokens": 464808512} {"current_steps": 2575, "total_steps": 9134, "loss": 0.6454, "learning_rate": 4.081950127846735e-05, "epoch": 0.2818905826650976, "percentage": 28.19, "elapsed_time": "1 day, 23:29:42", "remaining_time": "5 days, 0:58:45", "throughput": 2719.43, "total_tokens": 464975392} {"current_steps": 2576, "total_steps": 9134, "loss": 0.679, "learning_rate": 4.081284215801593e-05, "epoch": 0.28200005473603545, "percentage": 28.2, "elapsed_time": "1 day, 23:30:44", "remaining_time": "5 days, 0:57:26", "throughput": 2719.3, "total_tokens": 465122560} {"current_steps": 2577, "total_steps": 9134, "loss": 0.8124, "learning_rate": 4.080618116693551e-05, "epoch": 0.2821095268069734, "percentage": 28.21, "elapsed_time": "1 day, 23:31:53", "remaining_time": "5 days, 0:56:26", "throughput": 2719.4, "total_tokens": 465326848} {"current_steps": 2578, "total_steps": 9134, "loss": 0.7779, "learning_rate": 4.079951830601408e-05, "epoch": 0.2822189988779113, "percentage": 28.22, "elapsed_time": "1 day, 23:33:00", "remaining_time": "5 days, 0:55:20", "throughput": 2719.41, "total_tokens": 465508736} {"current_steps": 2579, "total_steps": 9134, "loss": 0.8101, "learning_rate": 4.079285357603984e-05, "epoch": 0.28232847094884916, "percentage": 28.24, "elapsed_time": "1 day, 23:34:06", "remaining_time": "5 days, 0:54:15", "throughput": 2719.4, "total_tokens": 465688832} {"current_steps": 2580, "total_steps": 9134, "loss": 0.68, "learning_rate": 4.078618697780121e-05, "epoch": 0.2824379430197871, "percentage": 28.25, "elapsed_time": "1 day, 23:35:13", "remaining_time": "5 days, 0:53:08", "throughput": 2719.39, "total_tokens": 465867360} {"current_steps": 2581, "total_steps": 9134, "loss": 0.8635, "learning_rate": 4.0779518512086834e-05, "epoch": 0.28254741509072495, "percentage": 28.26, "elapsed_time": "1 day, 23:36:21", "remaining_time": "5 days, 0:52:07", "throughput": 2719.53, "total_tokens": 466077248} {"current_steps": 2582, "total_steps": 9134, "loss": 0.5325, "learning_rate": 4.077284817968559e-05, "epoch": 0.2826568871616629, "percentage": 28.27, "elapsed_time": "1 day, 23:37:29", "remaining_time": "5 days, 0:51:05", "throughput": 2719.57, "total_tokens": 466269216} {"current_steps": 2583, "total_steps": 9134, "loss": 0.6551, "learning_rate": 4.0766175981386556e-05, "epoch": 0.2827663592326008, "percentage": 28.28, "elapsed_time": "1 day, 23:38:30", "remaining_time": "5 days, 0:49:45", "throughput": 2719.39, "total_tokens": 466404736} {"current_steps": 2584, "total_steps": 9134, "loss": 0.8677, "learning_rate": 4.0759501917979035e-05, "epoch": 0.28287583130353866, "percentage": 28.29, "elapsed_time": "1 day, 23:39:34", "remaining_time": "5 days, 0:48:32", "throughput": 2719.23, "total_tokens": 466550336} {"current_steps": 2585, "total_steps": 9134, "loss": 0.8391, "learning_rate": 4.0752825990252574e-05, "epoch": 0.2829853033744766, "percentage": 28.3, "elapsed_time": "1 day, 23:40:39", "remaining_time": "5 days, 0:47:22", "throughput": 2719.25, "total_tokens": 466731328} {"current_steps": 2586, "total_steps": 9134, "loss": 0.6522, "learning_rate": 4.074614819899692e-05, "epoch": 0.2830947754454145, "percentage": 28.31, "elapsed_time": "1 day, 23:41:45", "remaining_time": "5 days, 0:46:15", "throughput": 2719.11, "total_tokens": 466886112} {"current_steps": 2587, "total_steps": 9134, "loss": 0.7409, "learning_rate": 4.073946854500202e-05, "epoch": 0.28320424751635237, "percentage": 28.32, "elapsed_time": "1 day, 23:42:49", "remaining_time": "5 days, 0:45:01", "throughput": 2719.11, "total_tokens": 467059488} {"current_steps": 2588, "total_steps": 9134, "loss": 0.6733, "learning_rate": 4.073278702905809e-05, "epoch": 0.2833137195872903, "percentage": 28.33, "elapsed_time": "1 day, 23:43:54", "remaining_time": "5 days, 0:43:53", "throughput": 2719.11, "total_tokens": 467238240} {"current_steps": 2589, "total_steps": 9134, "loss": 0.4938, "learning_rate": 4.0726103651955525e-05, "epoch": 0.2834231916582282, "percentage": 28.34, "elapsed_time": "1 day, 23:44:58", "remaining_time": "5 days, 0:42:39", "throughput": 2719.09, "total_tokens": 467406464} {"current_steps": 2590, "total_steps": 9134, "loss": 0.9921, "learning_rate": 4.071941841448496e-05, "epoch": 0.2835326637291661, "percentage": 28.36, "elapsed_time": "1 day, 23:46:07", "remaining_time": "5 days, 0:41:39", "throughput": 2719.25, "total_tokens": 467623072} {"current_steps": 2591, "total_steps": 9134, "loss": 0.4916, "learning_rate": 4.071273131743725e-05, "epoch": 0.283642135800104, "percentage": 28.37, "elapsed_time": "1 day, 23:47:08", "remaining_time": "5 days, 0:40:19", "throughput": 2719.22, "total_tokens": 467781664} {"current_steps": 2592, "total_steps": 9134, "loss": 0.7407, "learning_rate": 4.070604236160347e-05, "epoch": 0.2837516078710419, "percentage": 28.38, "elapsed_time": "1 day, 23:48:16", "remaining_time": "5 days, 0:39:18", "throughput": 2719.29, "total_tokens": 467980352} {"current_steps": 2593, "total_steps": 9134, "loss": 0.9193, "learning_rate": 4.06993515477749e-05, "epoch": 0.2838610799419798, "percentage": 28.39, "elapsed_time": "1 day, 23:49:25", "remaining_time": "5 days, 0:38:18", "throughput": 2719.42, "total_tokens": 468190464} {"current_steps": 2594, "total_steps": 9134, "loss": 0.6743, "learning_rate": 4.069265887674304e-05, "epoch": 0.2839705520129177, "percentage": 28.4, "elapsed_time": "1 day, 23:50:26", "remaining_time": "5 days, 0:36:58", "throughput": 2719.29, "total_tokens": 468334048} {"current_steps": 2595, "total_steps": 9134, "loss": 0.7248, "learning_rate": 4.068596434929965e-05, "epoch": 0.28408002408385563, "percentage": 28.41, "elapsed_time": "1 day, 23:51:31", "remaining_time": "5 days, 0:35:46", "throughput": 2719.35, "total_tokens": 468519968} {"current_steps": 2596, "total_steps": 9134, "loss": 0.7753, "learning_rate": 4.067926796623666e-05, "epoch": 0.2841894961547935, "percentage": 28.42, "elapsed_time": "1 day, 23:52:38", "remaining_time": "5 days, 0:34:43", "throughput": 2719.34, "total_tokens": 468702304} {"current_steps": 2597, "total_steps": 9134, "loss": 0.8119, "learning_rate": 4.067256972834623e-05, "epoch": 0.2842989682257314, "percentage": 28.43, "elapsed_time": "1 day, 23:53:40", "remaining_time": "5 days, 0:33:26", "throughput": 2719.32, "total_tokens": 468868064} {"current_steps": 2598, "total_steps": 9134, "loss": 0.692, "learning_rate": 4.066586963642078e-05, "epoch": 0.2844084402966693, "percentage": 28.44, "elapsed_time": "1 day, 23:54:45", "remaining_time": "5 days, 0:32:15", "throughput": 2719.34, "total_tokens": 469047264} {"current_steps": 2599, "total_steps": 9134, "loss": 0.6408, "learning_rate": 4.06591676912529e-05, "epoch": 0.2845179123676072, "percentage": 28.45, "elapsed_time": "1 day, 23:55:47", "remaining_time": "5 days, 0:30:57", "throughput": 2719.24, "total_tokens": 469197120} {"current_steps": 2600, "total_steps": 9134, "loss": 0.8267, "learning_rate": 4.065246389363541e-05, "epoch": 0.28462738443854513, "percentage": 28.47, "elapsed_time": "1 day, 23:56:55", "remaining_time": "5 days, 0:29:55", "throughput": 2719.28, "total_tokens": 469388864} {"current_steps": 2601, "total_steps": 9134, "loss": 0.4828, "learning_rate": 4.064575824436136e-05, "epoch": 0.284736856509483, "percentage": 28.48, "elapsed_time": "1 day, 23:57:57", "remaining_time": "5 days, 0:28:39", "throughput": 2719.23, "total_tokens": 469549920} {"current_steps": 2602, "total_steps": 9134, "loss": 0.6579, "learning_rate": 4.063905074422403e-05, "epoch": 0.2848463285804209, "percentage": 28.49, "elapsed_time": "1 day, 23:59:02", "remaining_time": "5 days, 0:27:29", "throughput": 2719.1, "total_tokens": 469704928} {"current_steps": 2603, "total_steps": 9134, "loss": 0.7735, "learning_rate": 4.0632341394016884e-05, "epoch": 0.28495580065135884, "percentage": 28.5, "elapsed_time": "2 days, 0:00:10", "remaining_time": "5 days, 0:26:26", "throughput": 2719.19, "total_tokens": 469904288} {"current_steps": 2604, "total_steps": 9134, "loss": 0.7966, "learning_rate": 4.062563019453364e-05, "epoch": 0.2850652727222967, "percentage": 28.51, "elapsed_time": "2 days, 0:01:17", "remaining_time": "5 days, 0:25:20", "throughput": 2719.3, "total_tokens": 470104768} {"current_steps": 2605, "total_steps": 9134, "loss": 0.6812, "learning_rate": 4.0618917146568214e-05, "epoch": 0.2851747447932346, "percentage": 28.52, "elapsed_time": "2 days, 0:02:21", "remaining_time": "5 days, 0:24:09", "throughput": 2719.17, "total_tokens": 470258432} {"current_steps": 2606, "total_steps": 9134, "loss": 0.6137, "learning_rate": 4.061220225091474e-05, "epoch": 0.28528421686417255, "percentage": 28.53, "elapsed_time": "2 days, 0:03:26", "remaining_time": "5 days, 0:22:59", "throughput": 2719.09, "total_tokens": 470419712} {"current_steps": 2607, "total_steps": 9134, "loss": 0.6157, "learning_rate": 4.06054855083676e-05, "epoch": 0.2853936889351104, "percentage": 28.54, "elapsed_time": "2 days, 0:04:34", "remaining_time": "5 days, 0:21:56", "throughput": 2718.98, "total_tokens": 470585024} {"current_steps": 2608, "total_steps": 9134, "loss": 0.572, "learning_rate": 4.059876691972135e-05, "epoch": 0.28550316100604833, "percentage": 28.55, "elapsed_time": "2 days, 0:05:40", "remaining_time": "5 days, 0:20:49", "throughput": 2719.0, "total_tokens": 470768256} {"current_steps": 2609, "total_steps": 9134, "loss": 0.7178, "learning_rate": 4.05920464857708e-05, "epoch": 0.28561263307698626, "percentage": 28.56, "elapsed_time": "2 days, 0:06:44", "remaining_time": "5 days, 0:19:37", "throughput": 2719.03, "total_tokens": 470948576} {"current_steps": 2610, "total_steps": 9134, "loss": 0.7708, "learning_rate": 4.0585324207310946e-05, "epoch": 0.2857221051479241, "percentage": 28.57, "elapsed_time": "2 days, 0:07:51", "remaining_time": "5 days, 0:18:33", "throughput": 2719.09, "total_tokens": 471140992} {"current_steps": 2611, "total_steps": 9134, "loss": 0.6023, "learning_rate": 4.057860008513703e-05, "epoch": 0.28583157721886204, "percentage": 28.59, "elapsed_time": "2 days, 0:08:51", "remaining_time": "5 days, 0:17:10", "throughput": 2718.97, "total_tokens": 471283456} {"current_steps": 2612, "total_steps": 9134, "loss": 0.7144, "learning_rate": 4.057187412004452e-05, "epoch": 0.28594104928979996, "percentage": 28.6, "elapsed_time": "2 days, 0:10:00", "remaining_time": "5 days, 0:16:09", "throughput": 2719.08, "total_tokens": 471489088} {"current_steps": 2613, "total_steps": 9134, "loss": 0.5612, "learning_rate": 4.056514631282906e-05, "epoch": 0.28605052136073783, "percentage": 28.61, "elapsed_time": "2 days, 0:11:08", "remaining_time": "5 days, 0:15:07", "throughput": 2719.15, "total_tokens": 471686432} {"current_steps": 2614, "total_steps": 9134, "loss": 0.8474, "learning_rate": 4.055841666428655e-05, "epoch": 0.28615999343167575, "percentage": 28.62, "elapsed_time": "2 days, 0:12:17", "remaining_time": "5 days, 0:14:08", "throughput": 2719.26, "total_tokens": 471893856} {"current_steps": 2615, "total_steps": 9134, "loss": 0.5951, "learning_rate": 4.0551685175213094e-05, "epoch": 0.2862694655026136, "percentage": 28.63, "elapsed_time": "2 days, 0:13:17", "remaining_time": "5 days, 0:12:46", "throughput": 2719.21, "total_tokens": 472048864} {"current_steps": 2616, "total_steps": 9134, "loss": 0.6453, "learning_rate": 4.0544951846405e-05, "epoch": 0.28637893757355154, "percentage": 28.64, "elapsed_time": "2 days, 0:14:23", "remaining_time": "5 days, 0:11:37", "throughput": 2719.11, "total_tokens": 472209920} {"current_steps": 2617, "total_steps": 9134, "loss": 0.6488, "learning_rate": 4.053821667865883e-05, "epoch": 0.28648840964448946, "percentage": 28.65, "elapsed_time": "2 days, 0:15:26", "remaining_time": "5 days, 0:10:23", "throughput": 2719.05, "total_tokens": 472371648} {"current_steps": 2618, "total_steps": 9134, "loss": 0.7562, "learning_rate": 4.053147967277133e-05, "epoch": 0.2865978817154273, "percentage": 28.66, "elapsed_time": "2 days, 0:16:31", "remaining_time": "5 days, 0:09:14", "throughput": 2718.97, "total_tokens": 472534944} {"current_steps": 2619, "total_steps": 9134, "loss": 0.6095, "learning_rate": 4.052474082953948e-05, "epoch": 0.28670735378636525, "percentage": 28.67, "elapsed_time": "2 days, 0:17:36", "remaining_time": "5 days, 0:08:02", "throughput": 2718.87, "total_tokens": 472691520} {"current_steps": 2620, "total_steps": 9134, "loss": 0.6513, "learning_rate": 4.051800014976046e-05, "epoch": 0.28681682585730317, "percentage": 28.68, "elapsed_time": "2 days, 0:18:40", "remaining_time": "5 days, 0:06:52", "throughput": 2718.81, "total_tokens": 472858400} {"current_steps": 2621, "total_steps": 9134, "loss": 0.6595, "learning_rate": 4.051125763423169e-05, "epoch": 0.28692629792824104, "percentage": 28.69, "elapsed_time": "2 days, 0:19:45", "remaining_time": "5 days, 0:05:42", "throughput": 2718.68, "total_tokens": 473011616} {"current_steps": 2622, "total_steps": 9134, "loss": 0.6963, "learning_rate": 4.050451328375079e-05, "epoch": 0.28703576999917896, "percentage": 28.71, "elapsed_time": "2 days, 0:20:54", "remaining_time": "5 days, 0:04:42", "throughput": 2718.73, "total_tokens": 473207616} {"current_steps": 2623, "total_steps": 9134, "loss": 0.8038, "learning_rate": 4.0497767099115615e-05, "epoch": 0.2871452420701169, "percentage": 28.72, "elapsed_time": "2 days, 0:22:03", "remaining_time": "5 days, 0:03:42", "throughput": 2718.82, "total_tokens": 473411904} {"current_steps": 2624, "total_steps": 9134, "loss": 0.6942, "learning_rate": 4.0491019081124216e-05, "epoch": 0.28725471414105475, "percentage": 28.73, "elapsed_time": "2 days, 0:23:12", "remaining_time": "5 days, 0:02:41", "throughput": 2718.84, "total_tokens": 473600288} {"current_steps": 2625, "total_steps": 9134, "loss": 0.886, "learning_rate": 4.048426923057488e-05, "epoch": 0.28736418621199267, "percentage": 28.74, "elapsed_time": "2 days, 0:24:19", "remaining_time": "5 days, 0:01:37", "throughput": 2718.91, "total_tokens": 473797408} {"current_steps": 2626, "total_steps": 9134, "loss": 0.6483, "learning_rate": 4.047751754826608e-05, "epoch": 0.2874736582829306, "percentage": 28.75, "elapsed_time": "2 days, 0:25:23", "remaining_time": "5 days, 0:00:25", "throughput": 2718.95, "total_tokens": 473976608} {"current_steps": 2627, "total_steps": 9134, "loss": 0.6745, "learning_rate": 4.0470764034996556e-05, "epoch": 0.28758313035386845, "percentage": 28.76, "elapsed_time": "2 days, 0:26:30", "remaining_time": "4 days, 23:59:20", "throughput": 2718.98, "total_tokens": 474164992} {"current_steps": 2628, "total_steps": 9134, "loss": 0.7982, "learning_rate": 4.046400869156521e-05, "epoch": 0.2876926024248064, "percentage": 28.77, "elapsed_time": "2 days, 0:27:38", "remaining_time": "4 days, 23:58:17", "throughput": 2718.99, "total_tokens": 474351584} {"current_steps": 2629, "total_steps": 9134, "loss": 0.7603, "learning_rate": 4.045725151877121e-05, "epoch": 0.2878020744957443, "percentage": 28.78, "elapsed_time": "2 days, 0:28:44", "remaining_time": "4 days, 23:57:10", "throughput": 2719.01, "total_tokens": 474533696} {"current_steps": 2630, "total_steps": 9134, "loss": 0.9596, "learning_rate": 4.04504925174139e-05, "epoch": 0.28791154656668216, "percentage": 28.79, "elapsed_time": "2 days, 0:29:49", "remaining_time": "4 days, 23:56:00", "throughput": 2719.02, "total_tokens": 474712896} {"current_steps": 2631, "total_steps": 9134, "loss": 0.8781, "learning_rate": 4.0443731688292866e-05, "epoch": 0.2880210186376201, "percentage": 28.8, "elapsed_time": "2 days, 0:30:57", "remaining_time": "4 days, 23:54:58", "throughput": 2719.16, "total_tokens": 474922560} {"current_steps": 2632, "total_steps": 9134, "loss": 0.5924, "learning_rate": 4.043696903220788e-05, "epoch": 0.28813049070855795, "percentage": 28.82, "elapsed_time": "2 days, 0:32:01", "remaining_time": "4 days, 23:53:46", "throughput": 2719.06, "total_tokens": 475078912} {"current_steps": 2633, "total_steps": 9134, "loss": 0.551, "learning_rate": 4.0430204549958986e-05, "epoch": 0.2882399627794959, "percentage": 28.83, "elapsed_time": "2 days, 0:33:04", "remaining_time": "4 days, 23:52:30", "throughput": 2719.08, "total_tokens": 475252288} {"current_steps": 2634, "total_steps": 9134, "loss": 0.783, "learning_rate": 4.0423438242346386e-05, "epoch": 0.2883494348504338, "percentage": 28.84, "elapsed_time": "2 days, 0:34:13", "remaining_time": "4 days, 23:51:30", "throughput": 2719.2, "total_tokens": 475461056} {"current_steps": 2635, "total_steps": 9134, "loss": 0.7863, "learning_rate": 4.0416670110170526e-05, "epoch": 0.28845890692137166, "percentage": 28.85, "elapsed_time": "2 days, 0:35:17", "remaining_time": "4 days, 23:50:19", "throughput": 2719.31, "total_tokens": 475655488} {"current_steps": 2636, "total_steps": 9134, "loss": 0.7313, "learning_rate": 4.040990015423206e-05, "epoch": 0.2885683789923096, "percentage": 28.86, "elapsed_time": "2 days, 0:36:22", "remaining_time": "4 days, 23:49:10", "throughput": 2719.21, "total_tokens": 475814528} {"current_steps": 2637, "total_steps": 9134, "loss": 0.7351, "learning_rate": 4.040312837533187e-05, "epoch": 0.2886778510632475, "percentage": 28.87, "elapsed_time": "2 days, 0:37:26", "remaining_time": "4 days, 23:47:57", "throughput": 2719.23, "total_tokens": 475992608} {"current_steps": 2638, "total_steps": 9134, "loss": 1.0363, "learning_rate": 4.039635477427103e-05, "epoch": 0.28878732313418537, "percentage": 28.88, "elapsed_time": "2 days, 0:38:34", "remaining_time": "4 days, 23:46:53", "throughput": 2719.41, "total_tokens": 476207648} {"current_steps": 2639, "total_steps": 9134, "loss": 0.7408, "learning_rate": 4.038957935185086e-05, "epoch": 0.2888967952051233, "percentage": 28.89, "elapsed_time": "2 days, 0:39:39", "remaining_time": "4 days, 23:45:44", "throughput": 2719.43, "total_tokens": 476387520} {"current_steps": 2640, "total_steps": 9134, "loss": 0.8477, "learning_rate": 4.038280210887287e-05, "epoch": 0.2890062672760612, "percentage": 28.9, "elapsed_time": "2 days, 0:40:48", "remaining_time": "4 days, 23:44:44", "throughput": 2719.52, "total_tokens": 476592256} {"current_steps": 2641, "total_steps": 9134, "loss": 0.5161, "learning_rate": 4.0376023046138803e-05, "epoch": 0.2891157393469991, "percentage": 28.91, "elapsed_time": "2 days, 0:41:53", "remaining_time": "4 days, 23:43:35", "throughput": 2719.55, "total_tokens": 476774144} {"current_steps": 2642, "total_steps": 9134, "loss": 0.7096, "learning_rate": 4.036924216445061e-05, "epoch": 0.289225211417937, "percentage": 28.92, "elapsed_time": "2 days, 0:43:00", "remaining_time": "4 days, 23:42:30", "throughput": 2719.58, "total_tokens": 476962304} {"current_steps": 2643, "total_steps": 9134, "loss": 0.7925, "learning_rate": 4.036245946461043e-05, "epoch": 0.2893346834888749, "percentage": 28.94, "elapsed_time": "2 days, 0:44:06", "remaining_time": "4 days, 23:41:23", "throughput": 2719.51, "total_tokens": 477129632} {"current_steps": 2644, "total_steps": 9134, "loss": 0.6097, "learning_rate": 4.0355674947420676e-05, "epoch": 0.2894441555598128, "percentage": 28.95, "elapsed_time": "2 days, 0:45:11", "remaining_time": "4 days, 23:40:13", "throughput": 2719.55, "total_tokens": 477313984} {"current_steps": 2645, "total_steps": 9134, "loss": 0.9934, "learning_rate": 4.0348888613683925e-05, "epoch": 0.2895536276307507, "percentage": 28.96, "elapsed_time": "2 days, 0:46:17", "remaining_time": "4 days, 23:39:06", "throughput": 2719.51, "total_tokens": 477486688} {"current_steps": 2646, "total_steps": 9134, "loss": 0.7809, "learning_rate": 4.0342100464203e-05, "epoch": 0.28966309970168863, "percentage": 28.97, "elapsed_time": "2 days, 0:47:23", "remaining_time": "4 days, 23:37:59", "throughput": 2719.46, "total_tokens": 477656480} {"current_steps": 2647, "total_steps": 9134, "loss": 0.7938, "learning_rate": 4.033531049978091e-05, "epoch": 0.2897725717726265, "percentage": 28.98, "elapsed_time": "2 days, 0:48:31", "remaining_time": "4 days, 23:36:56", "throughput": 2719.48, "total_tokens": 477843744} {"current_steps": 2648, "total_steps": 9134, "loss": 0.6259, "learning_rate": 4.032851872122091e-05, "epoch": 0.2898820438435644, "percentage": 28.99, "elapsed_time": "2 days, 0:49:34", "remaining_time": "4 days, 23:35:41", "throughput": 2719.39, "total_tokens": 477998528} {"current_steps": 2649, "total_steps": 9134, "loss": 0.6605, "learning_rate": 4.0321725129326446e-05, "epoch": 0.28999151591450234, "percentage": 29.0, "elapsed_time": "2 days, 0:50:38", "remaining_time": "4 days, 23:34:28", "throughput": 2719.41, "total_tokens": 478177056} {"current_steps": 2650, "total_steps": 9134, "loss": 0.5733, "learning_rate": 4.031492972490119e-05, "epoch": 0.2901009879854402, "percentage": 29.01, "elapsed_time": "2 days, 0:51:46", "remaining_time": "4 days, 23:33:26", "throughput": 2719.36, "total_tokens": 478352224} {"current_steps": 2651, "total_steps": 9134, "loss": 0.6928, "learning_rate": 4.030813250874903e-05, "epoch": 0.29021046005637813, "percentage": 29.02, "elapsed_time": "2 days, 0:52:51", "remaining_time": "4 days, 23:32:16", "throughput": 2719.29, "total_tokens": 478516640} {"current_steps": 2652, "total_steps": 9134, "loss": 0.7149, "learning_rate": 4.030133348167405e-05, "epoch": 0.290319932127316, "percentage": 29.03, "elapsed_time": "2 days, 0:53:54", "remaining_time": "4 days, 23:31:03", "throughput": 2719.36, "total_tokens": 478701440} {"current_steps": 2653, "total_steps": 9134, "loss": 0.6239, "learning_rate": 4.0294532644480576e-05, "epoch": 0.2904294041982539, "percentage": 29.05, "elapsed_time": "2 days, 0:55:01", "remaining_time": "4 days, 23:29:58", "throughput": 2719.43, "total_tokens": 478897440} {"current_steps": 2654, "total_steps": 9134, "loss": 0.8451, "learning_rate": 4.028772999797313e-05, "epoch": 0.29053887626919184, "percentage": 29.06, "elapsed_time": "2 days, 0:56:08", "remaining_time": "4 days, 23:28:51", "throughput": 2719.39, "total_tokens": 479069920} {"current_steps": 2655, "total_steps": 9134, "loss": 0.8026, "learning_rate": 4.028092554295645e-05, "epoch": 0.2906483483401297, "percentage": 29.07, "elapsed_time": "2 days, 0:57:12", "remaining_time": "4 days, 23:27:40", "throughput": 2719.44, "total_tokens": 479253824} {"current_steps": 2656, "total_steps": 9134, "loss": 0.7605, "learning_rate": 4.027411928023549e-05, "epoch": 0.2907578204110676, "percentage": 29.08, "elapsed_time": "2 days, 0:58:19", "remaining_time": "4 days, 23:26:34", "throughput": 2719.49, "total_tokens": 479444448} {"current_steps": 2657, "total_steps": 9134, "loss": 0.7468, "learning_rate": 4.026731121061541e-05, "epoch": 0.29086729248200555, "percentage": 29.09, "elapsed_time": "2 days, 0:59:25", "remaining_time": "4 days, 23:25:28", "throughput": 2719.51, "total_tokens": 479627680} {"current_steps": 2658, "total_steps": 9134, "loss": 0.8872, "learning_rate": 4.026050133490161e-05, "epoch": 0.2909767645529434, "percentage": 29.1, "elapsed_time": "2 days, 1:00:33", "remaining_time": "4 days, 23:24:26", "throughput": 2719.65, "total_tokens": 479837344} {"current_steps": 2659, "total_steps": 9134, "loss": 1.1086, "learning_rate": 4.025368965389967e-05, "epoch": 0.29108623662388133, "percentage": 29.11, "elapsed_time": "2 days, 1:01:40", "remaining_time": "4 days, 23:23:19", "throughput": 2719.71, "total_tokens": 480029312} {"current_steps": 2660, "total_steps": 9134, "loss": 0.5807, "learning_rate": 4.02468761684154e-05, "epoch": 0.29119570869481926, "percentage": 29.12, "elapsed_time": "2 days, 1:02:42", "remaining_time": "4 days, 23:22:04", "throughput": 2719.63, "total_tokens": 480184768} {"current_steps": 2661, "total_steps": 9134, "loss": 0.8739, "learning_rate": 4.024006087925484e-05, "epoch": 0.2913051807657571, "percentage": 29.13, "elapsed_time": "2 days, 1:03:50", "remaining_time": "4 days, 23:21:01", "throughput": 2719.67, "total_tokens": 480375840} {"current_steps": 2662, "total_steps": 9134, "loss": 0.7637, "learning_rate": 4.02332437872242e-05, "epoch": 0.29141465283669504, "percentage": 29.14, "elapsed_time": "2 days, 1:04:57", "remaining_time": "4 days, 23:19:57", "throughput": 2719.8, "total_tokens": 480583040} {"current_steps": 2663, "total_steps": 9134, "loss": 0.8802, "learning_rate": 4.022642489312994e-05, "epoch": 0.29152412490763296, "percentage": 29.15, "elapsed_time": "2 days, 1:06:04", "remaining_time": "4 days, 23:18:52", "throughput": 2719.88, "total_tokens": 480779936} {"current_steps": 2664, "total_steps": 9134, "loss": 0.8596, "learning_rate": 4.0219604197778725e-05, "epoch": 0.29163359697857083, "percentage": 29.17, "elapsed_time": "2 days, 1:07:13", "remaining_time": "4 days, 23:17:52", "throughput": 2719.89, "total_tokens": 480967200} {"current_steps": 2665, "total_steps": 9134, "loss": 0.6464, "learning_rate": 4.0212781701977434e-05, "epoch": 0.29174306904950875, "percentage": 29.18, "elapsed_time": "2 days, 1:08:19", "remaining_time": "4 days, 23:16:43", "throughput": 2719.94, "total_tokens": 481154912} {"current_steps": 2666, "total_steps": 9134, "loss": 0.803, "learning_rate": 4.020595740653315e-05, "epoch": 0.2918525411204467, "percentage": 29.19, "elapsed_time": "2 days, 1:09:25", "remaining_time": "4 days, 23:15:37", "throughput": 2719.89, "total_tokens": 481326496} {"current_steps": 2667, "total_steps": 9134, "loss": 0.7658, "learning_rate": 4.019913131225318e-05, "epoch": 0.29196201319138454, "percentage": 29.2, "elapsed_time": "2 days, 1:10:31", "remaining_time": "4 days, 23:14:28", "throughput": 2719.77, "total_tokens": 481483296} {"current_steps": 2668, "total_steps": 9134, "loss": 0.6103, "learning_rate": 4.019230341994501e-05, "epoch": 0.29207148526232246, "percentage": 29.21, "elapsed_time": "2 days, 1:11:32", "remaining_time": "4 days, 23:13:09", "throughput": 2719.64, "total_tokens": 481626432} {"current_steps": 2669, "total_steps": 9134, "loss": 0.7102, "learning_rate": 4.018547373041641e-05, "epoch": 0.2921809573332603, "percentage": 29.22, "elapsed_time": "2 days, 1:12:37", "remaining_time": "4 days, 23:12:01", "throughput": 2719.56, "total_tokens": 481790176} {"current_steps": 2670, "total_steps": 9134, "loss": 0.6012, "learning_rate": 4.017864224447528e-05, "epoch": 0.29229042940419825, "percentage": 29.23, "elapsed_time": "2 days, 1:13:44", "remaining_time": "4 days, 23:10:55", "throughput": 2719.49, "total_tokens": 481959968} {"current_steps": 2671, "total_steps": 9134, "loss": 0.9035, "learning_rate": 4.01718089629298e-05, "epoch": 0.29239990147513617, "percentage": 29.24, "elapsed_time": "2 days, 1:14:53", "remaining_time": "4 days, 23:09:55", "throughput": 2719.6, "total_tokens": 482166272} {"current_steps": 2672, "total_steps": 9134, "loss": 0.6891, "learning_rate": 4.016497388658832e-05, "epoch": 0.29250937354607404, "percentage": 29.25, "elapsed_time": "2 days, 1:15:58", "remaining_time": "4 days, 23:08:45", "throughput": 2719.6, "total_tokens": 482344128} {"current_steps": 2673, "total_steps": 9134, "loss": 0.569, "learning_rate": 4.015813701625942e-05, "epoch": 0.29261884561701196, "percentage": 29.26, "elapsed_time": "2 days, 1:17:07", "remaining_time": "4 days, 23:07:45", "throughput": 2719.66, "total_tokens": 482541696} {"current_steps": 2674, "total_steps": 9134, "loss": 0.7128, "learning_rate": 4.015129835275189e-05, "epoch": 0.2927283176879499, "percentage": 29.28, "elapsed_time": "2 days, 1:18:15", "remaining_time": "4 days, 23:06:43", "throughput": 2719.78, "total_tokens": 482749120} {"current_steps": 2675, "total_steps": 9134, "loss": 0.7743, "learning_rate": 4.014445789687472e-05, "epoch": 0.29283778975888775, "percentage": 29.29, "elapsed_time": "2 days, 1:19:20", "remaining_time": "4 days, 23:05:33", "throughput": 2719.87, "total_tokens": 482941312} {"current_steps": 2676, "total_steps": 9134, "loss": 0.5479, "learning_rate": 4.013761564943714e-05, "epoch": 0.29294726182982567, "percentage": 29.3, "elapsed_time": "2 days, 1:20:28", "remaining_time": "4 days, 23:04:32", "throughput": 2720.02, "total_tokens": 483154560} {"current_steps": 2677, "total_steps": 9134, "loss": 0.6463, "learning_rate": 4.013077161124857e-05, "epoch": 0.2930567339007636, "percentage": 29.31, "elapsed_time": "2 days, 1:21:36", "remaining_time": "4 days, 23:03:29", "throughput": 2720.08, "total_tokens": 483349664} {"current_steps": 2678, "total_steps": 9134, "loss": 0.7593, "learning_rate": 4.012392578311864e-05, "epoch": 0.29316620597170145, "percentage": 29.32, "elapsed_time": "2 days, 1:22:42", "remaining_time": "4 days, 23:02:21", "throughput": 2720.06, "total_tokens": 483523488} {"current_steps": 2679, "total_steps": 9134, "loss": 0.5259, "learning_rate": 4.0117078165857205e-05, "epoch": 0.2932756780426394, "percentage": 29.33, "elapsed_time": "2 days, 1:23:45", "remaining_time": "4 days, 23:01:08", "throughput": 2719.97, "total_tokens": 483681632} {"current_steps": 2680, "total_steps": 9134, "loss": 0.7735, "learning_rate": 4.0110228760274314e-05, "epoch": 0.2933851501135773, "percentage": 29.34, "elapsed_time": "2 days, 1:24:51", "remaining_time": "4 days, 23:00:01", "throughput": 2719.94, "total_tokens": 483855008} {"current_steps": 2681, "total_steps": 9134, "loss": 0.629, "learning_rate": 4.010337756718026e-05, "epoch": 0.29349462218451516, "percentage": 29.35, "elapsed_time": "2 days, 1:25:57", "remaining_time": "4 days, 22:58:51", "throughput": 2719.98, "total_tokens": 484040256} {"current_steps": 2682, "total_steps": 9134, "loss": 0.905, "learning_rate": 4.00965245873855e-05, "epoch": 0.2936040942554531, "percentage": 29.36, "elapsed_time": "2 days, 1:27:02", "remaining_time": "4 days, 22:57:43", "throughput": 2719.97, "total_tokens": 484216320} {"current_steps": 2683, "total_steps": 9134, "loss": 0.7703, "learning_rate": 4.008966982170074e-05, "epoch": 0.293713566326391, "percentage": 29.37, "elapsed_time": "2 days, 1:28:08", "remaining_time": "4 days, 22:56:35", "throughput": 2719.88, "total_tokens": 484379616} {"current_steps": 2684, "total_steps": 9134, "loss": 0.875, "learning_rate": 4.008281327093689e-05, "epoch": 0.2938230383973289, "percentage": 29.38, "elapsed_time": "2 days, 1:29:14", "remaining_time": "4 days, 22:55:27", "throughput": 2720.01, "total_tokens": 484580096} {"current_steps": 2685, "total_steps": 9134, "loss": 0.6374, "learning_rate": 4.007595493590506e-05, "epoch": 0.2939325104682668, "percentage": 29.4, "elapsed_time": "2 days, 1:30:20", "remaining_time": "4 days, 22:54:20", "throughput": 2720.14, "total_tokens": 484784160} {"current_steps": 2686, "total_steps": 9134, "loss": 0.7606, "learning_rate": 4.006909481741659e-05, "epoch": 0.29404198253920466, "percentage": 29.41, "elapsed_time": "2 days, 1:31:28", "remaining_time": "4 days, 22:53:19", "throughput": 2720.3, "total_tokens": 485000096} {"current_steps": 2687, "total_steps": 9134, "loss": 0.6953, "learning_rate": 4.006223291628301e-05, "epoch": 0.2941514546101426, "percentage": 29.42, "elapsed_time": "2 days, 1:32:35", "remaining_time": "4 days, 22:52:12", "throughput": 2720.32, "total_tokens": 485183776} {"current_steps": 2688, "total_steps": 9134, "loss": 0.6848, "learning_rate": 4.0055369233316063e-05, "epoch": 0.2942609266810805, "percentage": 29.43, "elapsed_time": "2 days, 1:33:43", "remaining_time": "4 days, 22:51:12", "throughput": 2720.3, "total_tokens": 485366560} {"current_steps": 2689, "total_steps": 9134, "loss": 0.605, "learning_rate": 4.004850376932772e-05, "epoch": 0.29437039875201837, "percentage": 29.44, "elapsed_time": "2 days, 1:34:50", "remaining_time": "4 days, 22:50:05", "throughput": 2720.24, "total_tokens": 485536800} {"current_steps": 2690, "total_steps": 9134, "loss": 0.7007, "learning_rate": 4.0041636525130156e-05, "epoch": 0.2944798708229563, "percentage": 29.45, "elapsed_time": "2 days, 1:35:54", "remaining_time": "4 days, 22:48:53", "throughput": 2720.06, "total_tokens": 485678144} {"current_steps": 2691, "total_steps": 9134, "loss": 0.8169, "learning_rate": 4.003476750153573e-05, "epoch": 0.2945893428938942, "percentage": 29.46, "elapsed_time": "2 days, 1:36:57", "remaining_time": "4 days, 22:47:38", "throughput": 2720.0, "total_tokens": 485838304} {"current_steps": 2692, "total_steps": 9134, "loss": 0.6483, "learning_rate": 4.002789669935706e-05, "epoch": 0.2946988149648321, "percentage": 29.47, "elapsed_time": "2 days, 1:37:59", "remaining_time": "4 days, 22:46:23", "throughput": 2720.03, "total_tokens": 486014144} {"current_steps": 2693, "total_steps": 9134, "loss": 0.7284, "learning_rate": 4.002102411940694e-05, "epoch": 0.29480828703577, "percentage": 29.48, "elapsed_time": "2 days, 1:39:06", "remaining_time": "4 days, 22:45:17", "throughput": 2720.07, "total_tokens": 486202304} {"current_steps": 2694, "total_steps": 9134, "loss": 0.8499, "learning_rate": 4.001414976249839e-05, "epoch": 0.2949177591067079, "percentage": 29.49, "elapsed_time": "2 days, 1:40:14", "remaining_time": "4 days, 22:44:14", "throughput": 2720.07, "total_tokens": 486386656} {"current_steps": 2695, "total_steps": 9134, "loss": 0.7277, "learning_rate": 4.000727362944461e-05, "epoch": 0.2950272311776458, "percentage": 29.51, "elapsed_time": "2 days, 1:41:21", "remaining_time": "4 days, 22:43:11", "throughput": 2720.12, "total_tokens": 486580192} {"current_steps": 2696, "total_steps": 9134, "loss": 0.8296, "learning_rate": 4.0000395721059053e-05, "epoch": 0.2951367032485837, "percentage": 29.52, "elapsed_time": "2 days, 1:42:26", "remaining_time": "4 days, 22:42:01", "throughput": 2720.07, "total_tokens": 486748416} {"current_steps": 2697, "total_steps": 9134, "loss": 0.6923, "learning_rate": 3.999351603815536e-05, "epoch": 0.29524617531952163, "percentage": 29.53, "elapsed_time": "2 days, 1:43:32", "remaining_time": "4 days, 22:40:53", "throughput": 2720.04, "total_tokens": 486920224} {"current_steps": 2698, "total_steps": 9134, "loss": 0.6927, "learning_rate": 3.998663458154738e-05, "epoch": 0.2953556473904595, "percentage": 29.54, "elapsed_time": "2 days, 1:44:36", "remaining_time": "4 days, 22:39:41", "throughput": 2720.08, "total_tokens": 487101664} {"current_steps": 2699, "total_steps": 9134, "loss": 0.6878, "learning_rate": 3.997975135204918e-05, "epoch": 0.2954651194613974, "percentage": 29.55, "elapsed_time": "2 days, 1:45:42", "remaining_time": "4 days, 22:38:33", "throughput": 2720.08, "total_tokens": 487281088} {"current_steps": 2700, "total_steps": 9134, "loss": 0.7752, "learning_rate": 3.997286635047503e-05, "epoch": 0.29557459153233534, "percentage": 29.56, "elapsed_time": "2 days, 1:46:47", "remaining_time": "4 days, 22:37:24", "throughput": 2720.15, "total_tokens": 487471040} {"current_steps": 2701, "total_steps": 9134, "loss": 0.808, "learning_rate": 3.9965979577639416e-05, "epoch": 0.2956840636032732, "percentage": 29.57, "elapsed_time": "2 days, 1:47:53", "remaining_time": "4 days, 22:36:16", "throughput": 2720.21, "total_tokens": 487660992} {"current_steps": 2702, "total_steps": 9134, "loss": 0.6672, "learning_rate": 3.9959091034357036e-05, "epoch": 0.2957935356742111, "percentage": 29.58, "elapsed_time": "2 days, 1:49:00", "remaining_time": "4 days, 22:35:12", "throughput": 2720.17, "total_tokens": 487835264} {"current_steps": 2703, "total_steps": 9134, "loss": 0.8301, "learning_rate": 3.995220072144277e-05, "epoch": 0.295903007745149, "percentage": 29.59, "elapsed_time": "2 days, 1:50:09", "remaining_time": "4 days, 22:34:11", "throughput": 2720.25, "total_tokens": 488037984} {"current_steps": 2704, "total_steps": 9134, "loss": 0.701, "learning_rate": 3.994530863971175e-05, "epoch": 0.2960124798160869, "percentage": 29.6, "elapsed_time": "2 days, 1:51:18", "remaining_time": "4 days, 22:33:11", "throughput": 2720.32, "total_tokens": 488238688} {"current_steps": 2705, "total_steps": 9134, "loss": 0.6376, "learning_rate": 3.993841478997928e-05, "epoch": 0.29612195188702484, "percentage": 29.61, "elapsed_time": "2 days, 1:52:26", "remaining_time": "4 days, 22:32:09", "throughput": 2720.4, "total_tokens": 488438048} {"current_steps": 2706, "total_steps": 9134, "loss": 0.6891, "learning_rate": 3.993151917306091e-05, "epoch": 0.2962314239579627, "percentage": 29.63, "elapsed_time": "2 days, 1:53:31", "remaining_time": "4 days, 22:31:00", "throughput": 2720.39, "total_tokens": 488614560} {"current_steps": 2707, "total_steps": 9134, "loss": 0.5963, "learning_rate": 3.992462178977235e-05, "epoch": 0.2963408960289006, "percentage": 29.64, "elapsed_time": "2 days, 1:54:40", "remaining_time": "4 days, 22:30:00", "throughput": 2720.49, "total_tokens": 488818624} {"current_steps": 2708, "total_steps": 9134, "loss": 0.6143, "learning_rate": 3.9917722640929576e-05, "epoch": 0.29645036809983855, "percentage": 29.65, "elapsed_time": "2 days, 1:55:44", "remaining_time": "4 days, 22:28:48", "throughput": 2720.53, "total_tokens": 489001408} {"current_steps": 2709, "total_steps": 9134, "loss": 0.6866, "learning_rate": 3.991082172734874e-05, "epoch": 0.2965598401707764, "percentage": 29.66, "elapsed_time": "2 days, 1:56:53", "remaining_time": "4 days, 22:27:48", "throughput": 2720.56, "total_tokens": 489194272} {"current_steps": 2710, "total_steps": 9134, "loss": 0.828, "learning_rate": 3.990391904984618e-05, "epoch": 0.29666931224171433, "percentage": 29.67, "elapsed_time": "2 days, 1:57:59", "remaining_time": "4 days, 22:26:41", "throughput": 2720.56, "total_tokens": 489374592} {"current_steps": 2711, "total_steps": 9134, "loss": 0.6197, "learning_rate": 3.9897014609238496e-05, "epoch": 0.29677878431265226, "percentage": 29.68, "elapsed_time": "2 days, 1:59:00", "remaining_time": "4 days, 22:25:21", "throughput": 2720.55, "total_tokens": 489537664} {"current_steps": 2712, "total_steps": 9134, "loss": 0.7954, "learning_rate": 3.9890108406342455e-05, "epoch": 0.2968882563835901, "percentage": 29.69, "elapsed_time": "2 days, 2:00:03", "remaining_time": "4 days, 22:24:07", "throughput": 2720.46, "total_tokens": 489692224} {"current_steps": 2713, "total_steps": 9134, "loss": 0.5368, "learning_rate": 3.988320044197507e-05, "epoch": 0.29699772845452804, "percentage": 29.7, "elapsed_time": "2 days, 2:01:06", "remaining_time": "4 days, 22:22:53", "throughput": 2720.4, "total_tokens": 489853728} {"current_steps": 2714, "total_steps": 9134, "loss": 0.4457, "learning_rate": 3.987629071695351e-05, "epoch": 0.29710720052546596, "percentage": 29.71, "elapsed_time": "2 days, 2:02:10", "remaining_time": "4 days, 22:21:39", "throughput": 2720.38, "total_tokens": 490021952} {"current_steps": 2715, "total_steps": 9134, "loss": 0.6428, "learning_rate": 3.9869379232095204e-05, "epoch": 0.29721667259640383, "percentage": 29.72, "elapsed_time": "2 days, 2:03:19", "remaining_time": "4 days, 22:20:40", "throughput": 2720.42, "total_tokens": 490218400} {"current_steps": 2716, "total_steps": 9134, "loss": 0.778, "learning_rate": 3.986246598821776e-05, "epoch": 0.29732614466734175, "percentage": 29.74, "elapsed_time": "2 days, 2:04:28", "remaining_time": "4 days, 22:19:39", "throughput": 2720.42, "total_tokens": 490405664} {"current_steps": 2717, "total_steps": 9134, "loss": 0.8182, "learning_rate": 3.9855550986139e-05, "epoch": 0.2974356167382797, "percentage": 29.75, "elapsed_time": "2 days, 2:05:37", "remaining_time": "4 days, 22:18:40", "throughput": 2720.47, "total_tokens": 490602336} {"current_steps": 2718, "total_steps": 9134, "loss": 0.6533, "learning_rate": 3.984863422667695e-05, "epoch": 0.29754508880921754, "percentage": 29.76, "elapsed_time": "2 days, 2:06:40", "remaining_time": "4 days, 22:17:26", "throughput": 2720.48, "total_tokens": 490776384} {"current_steps": 2719, "total_steps": 9134, "loss": 0.7878, "learning_rate": 3.9841715710649865e-05, "epoch": 0.29765456088015546, "percentage": 29.77, "elapsed_time": "2 days, 2:07:43", "remaining_time": "4 days, 22:16:11", "throughput": 2720.42, "total_tokens": 490936768} {"current_steps": 2720, "total_steps": 9134, "loss": 0.698, "learning_rate": 3.983479543887618e-05, "epoch": 0.2977640329510933, "percentage": 29.78, "elapsed_time": "2 days, 2:08:46", "remaining_time": "4 days, 22:14:57", "throughput": 2720.31, "total_tokens": 491087520} {"current_steps": 2721, "total_steps": 9134, "loss": 0.6897, "learning_rate": 3.9827873412174565e-05, "epoch": 0.29787350502203125, "percentage": 29.79, "elapsed_time": "2 days, 2:09:53", "remaining_time": "4 days, 22:13:53", "throughput": 2720.41, "total_tokens": 491289120} {"current_steps": 2722, "total_steps": 9134, "loss": 0.6004, "learning_rate": 3.9820949631363855e-05, "epoch": 0.29798297709296917, "percentage": 29.8, "elapsed_time": "2 days, 2:11:02", "remaining_time": "4 days, 22:12:52", "throughput": 2720.5, "total_tokens": 491491616} {"current_steps": 2723, "total_steps": 9134, "loss": 0.6376, "learning_rate": 3.9814024097263154e-05, "epoch": 0.29809244916390704, "percentage": 29.81, "elapsed_time": "2 days, 2:12:05", "remaining_time": "4 days, 22:11:37", "throughput": 2720.4, "total_tokens": 491645056} {"current_steps": 2724, "total_steps": 9134, "loss": 0.7212, "learning_rate": 3.980709681069171e-05, "epoch": 0.29820192123484496, "percentage": 29.82, "elapsed_time": "2 days, 2:13:11", "remaining_time": "4 days, 22:10:30", "throughput": 2720.38, "total_tokens": 491822016} {"current_steps": 2725, "total_steps": 9134, "loss": 0.763, "learning_rate": 3.980016777246902e-05, "epoch": 0.2983113933057829, "percentage": 29.83, "elapsed_time": "2 days, 2:14:20", "remaining_time": "4 days, 22:09:30", "throughput": 2720.42, "total_tokens": 492016000} {"current_steps": 2726, "total_steps": 9134, "loss": 0.6382, "learning_rate": 3.979323698341478e-05, "epoch": 0.29842086537672075, "percentage": 29.84, "elapsed_time": "2 days, 2:15:25", "remaining_time": "4 days, 22:08:21", "throughput": 2720.45, "total_tokens": 492198784} {"current_steps": 2727, "total_steps": 9134, "loss": 0.8562, "learning_rate": 3.978630444434888e-05, "epoch": 0.29853033744765867, "percentage": 29.86, "elapsed_time": "2 days, 2:16:32", "remaining_time": "4 days, 22:07:16", "throughput": 2720.4, "total_tokens": 492373056} {"current_steps": 2728, "total_steps": 9134, "loss": 0.6055, "learning_rate": 3.977937015609143e-05, "epoch": 0.2986398095185966, "percentage": 29.87, "elapsed_time": "2 days, 2:17:38", "remaining_time": "4 days, 22:06:09", "throughput": 2720.39, "total_tokens": 492550464} {"current_steps": 2729, "total_steps": 9134, "loss": 0.8492, "learning_rate": 3.9772434119462754e-05, "epoch": 0.29874928158953445, "percentage": 29.88, "elapsed_time": "2 days, 2:18:47", "remaining_time": "4 days, 22:05:08", "throughput": 2720.5, "total_tokens": 492757888} {"current_steps": 2730, "total_steps": 9134, "loss": 0.7463, "learning_rate": 3.976549633528336e-05, "epoch": 0.2988587536604724, "percentage": 29.89, "elapsed_time": "2 days, 2:19:52", "remaining_time": "4 days, 22:03:59", "throughput": 2720.43, "total_tokens": 492923200} {"current_steps": 2731, "total_steps": 9134, "loss": 0.6969, "learning_rate": 3.975855680437397e-05, "epoch": 0.2989682257314103, "percentage": 29.9, "elapsed_time": "2 days, 2:20:55", "remaining_time": "4 days, 22:02:44", "throughput": 2720.4, "total_tokens": 493085824} {"current_steps": 2732, "total_steps": 9134, "loss": 0.8239, "learning_rate": 3.975161552755552e-05, "epoch": 0.29907769780234816, "percentage": 29.91, "elapsed_time": "2 days, 2:22:03", "remaining_time": "4 days, 22:01:42", "throughput": 2720.4, "total_tokens": 493272864} {"current_steps": 2733, "total_steps": 9134, "loss": 0.575, "learning_rate": 3.974467250564916e-05, "epoch": 0.2991871698732861, "percentage": 29.92, "elapsed_time": "2 days, 2:23:06", "remaining_time": "4 days, 22:00:27", "throughput": 2720.36, "total_tokens": 493435936} {"current_steps": 2734, "total_steps": 9134, "loss": 0.7081, "learning_rate": 3.973772773947623e-05, "epoch": 0.299296641944224, "percentage": 29.93, "elapsed_time": "2 days, 2:24:10", "remaining_time": "4 days, 21:59:15", "throughput": 2720.39, "total_tokens": 493616032} {"current_steps": 2735, "total_steps": 9134, "loss": 0.732, "learning_rate": 3.9730781229858284e-05, "epoch": 0.2994061140151619, "percentage": 29.94, "elapsed_time": "2 days, 2:25:11", "remaining_time": "4 days, 21:57:57", "throughput": 2720.24, "total_tokens": 493755136} {"current_steps": 2736, "total_steps": 9134, "loss": 0.5326, "learning_rate": 3.972383297761707e-05, "epoch": 0.2995155860860998, "percentage": 29.95, "elapsed_time": "2 days, 2:26:11", "remaining_time": "4 days, 21:56:35", "throughput": 2720.12, "total_tokens": 493895360} {"current_steps": 2737, "total_steps": 9134, "loss": 0.6188, "learning_rate": 3.971688298357457e-05, "epoch": 0.29962505815703766, "percentage": 29.96, "elapsed_time": "2 days, 2:27:11", "remaining_time": "4 days, 21:55:15", "throughput": 2720.05, "total_tokens": 494047008} {"current_steps": 2738, "total_steps": 9134, "loss": 0.5434, "learning_rate": 3.9709931248552944e-05, "epoch": 0.2997345302279756, "percentage": 29.98, "elapsed_time": "2 days, 2:28:16", "remaining_time": "4 days, 21:54:05", "throughput": 2720.01, "total_tokens": 494216352} {"current_steps": 2739, "total_steps": 9134, "loss": 0.9036, "learning_rate": 3.9702977773374576e-05, "epoch": 0.2998440022989135, "percentage": 29.99, "elapsed_time": "2 days, 2:29:25", "remaining_time": "4 days, 21:53:05", "throughput": 2720.01, "total_tokens": 494405408} {"current_steps": 2740, "total_steps": 9134, "loss": 0.8111, "learning_rate": 3.969602255886203e-05, "epoch": 0.29995347436985137, "percentage": 30.0, "elapsed_time": "2 days, 2:30:32", "remaining_time": "4 days, 21:52:00", "throughput": 2720.07, "total_tokens": 494597600} {"current_steps": 2741, "total_steps": 9134, "loss": 0.8526, "learning_rate": 3.968906560583813e-05, "epoch": 0.3000629464407893, "percentage": 30.01, "elapsed_time": "2 days, 2:31:41", "remaining_time": "4 days, 21:50:59", "throughput": 2720.07, "total_tokens": 494785536} {"current_steps": 2742, "total_steps": 9134, "loss": 0.6901, "learning_rate": 3.968210691512584e-05, "epoch": 0.3001724185117272, "percentage": 30.02, "elapsed_time": "2 days, 2:32:49", "remaining_time": "4 days, 21:49:57", "throughput": 2720.21, "total_tokens": 494995872} {"current_steps": 2743, "total_steps": 9134, "loss": 0.8486, "learning_rate": 3.9675146487548364e-05, "epoch": 0.3002818905826651, "percentage": 30.03, "elapsed_time": "2 days, 2:33:58", "remaining_time": "4 days, 21:48:57", "throughput": 2720.26, "total_tokens": 495192096} {"current_steps": 2744, "total_steps": 9134, "loss": 0.7542, "learning_rate": 3.966818432392912e-05, "epoch": 0.300391362653603, "percentage": 30.04, "elapsed_time": "2 days, 2:35:04", "remaining_time": "4 days, 21:47:49", "throughput": 2720.23, "total_tokens": 495364352} {"current_steps": 2745, "total_steps": 9134, "loss": 0.7337, "learning_rate": 3.9661220425091705e-05, "epoch": 0.3005008347245409, "percentage": 30.05, "elapsed_time": "2 days, 2:36:09", "remaining_time": "4 days, 21:46:39", "throughput": 2720.2, "total_tokens": 495536608} {"current_steps": 2746, "total_steps": 9134, "loss": 0.6002, "learning_rate": 3.9654254791859943e-05, "epoch": 0.3006103067954788, "percentage": 30.06, "elapsed_time": "2 days, 2:37:10", "remaining_time": "4 days, 21:45:20", "throughput": 2720.07, "total_tokens": 495678176} {"current_steps": 2747, "total_steps": 9134, "loss": 0.5132, "learning_rate": 3.9647287425057864e-05, "epoch": 0.3007197788664167, "percentage": 30.07, "elapsed_time": "2 days, 2:38:12", "remaining_time": "4 days, 21:44:05", "throughput": 2720.06, "total_tokens": 495846400} {"current_steps": 2748, "total_steps": 9134, "loss": 0.6548, "learning_rate": 3.9640318325509676e-05, "epoch": 0.30082925093735463, "percentage": 30.09, "elapsed_time": "2 days, 2:39:20", "remaining_time": "4 days, 21:43:02", "throughput": 2720.05, "total_tokens": 496030304} {"current_steps": 2749, "total_steps": 9134, "loss": 0.6137, "learning_rate": 3.9633347494039814e-05, "epoch": 0.3009387230082925, "percentage": 30.1, "elapsed_time": "2 days, 2:40:29", "remaining_time": "4 days, 21:42:02", "throughput": 2720.15, "total_tokens": 496235040} {"current_steps": 2750, "total_steps": 9134, "loss": 0.461, "learning_rate": 3.962637493147292e-05, "epoch": 0.3010481950792304, "percentage": 30.11, "elapsed_time": "2 days, 2:41:34", "remaining_time": "4 days, 21:40:51", "throughput": 2720.1, "total_tokens": 496402816} {"current_steps": 2751, "total_steps": 9134, "loss": 0.7966, "learning_rate": 3.961940063863383e-05, "epoch": 0.30115766715016834, "percentage": 30.12, "elapsed_time": "2 days, 2:42:39", "remaining_time": "4 days, 21:39:42", "throughput": 2720.02, "total_tokens": 496564768} {"current_steps": 2752, "total_steps": 9134, "loss": 0.6718, "learning_rate": 3.9612424616347596e-05, "epoch": 0.3012671392211062, "percentage": 30.13, "elapsed_time": "2 days, 2:43:43", "remaining_time": "4 days, 21:38:30", "throughput": 2720.04, "total_tokens": 496741504} {"current_steps": 2753, "total_steps": 9134, "loss": 0.5075, "learning_rate": 3.9605446865439466e-05, "epoch": 0.3013766112920441, "percentage": 30.14, "elapsed_time": "2 days, 2:44:51", "remaining_time": "4 days, 21:37:28", "throughput": 2720.06, "total_tokens": 496932128} {"current_steps": 2754, "total_steps": 9134, "loss": 0.7756, "learning_rate": 3.959846738673488e-05, "epoch": 0.301486083362982, "percentage": 30.15, "elapsed_time": "2 days, 2:46:00", "remaining_time": "4 days, 21:36:28", "throughput": 2720.19, "total_tokens": 497142688} {"current_steps": 2755, "total_steps": 9134, "loss": 0.7264, "learning_rate": 3.9591486181059524e-05, "epoch": 0.3015955554339199, "percentage": 30.16, "elapsed_time": "2 days, 2:47:04", "remaining_time": "4 days, 21:35:15", "throughput": 2720.21, "total_tokens": 497320320} {"current_steps": 2756, "total_steps": 9134, "loss": 0.8953, "learning_rate": 3.958450324923924e-05, "epoch": 0.30170502750485784, "percentage": 30.17, "elapsed_time": "2 days, 2:48:11", "remaining_time": "4 days, 21:34:12", "throughput": 2720.36, "total_tokens": 497532224} {"current_steps": 2757, "total_steps": 9134, "loss": 0.7377, "learning_rate": 3.9577518592100114e-05, "epoch": 0.3018144995757957, "percentage": 30.18, "elapsed_time": "2 days, 2:49:17", "remaining_time": "4 days, 21:33:05", "throughput": 2720.4, "total_tokens": 497718592} {"current_steps": 2758, "total_steps": 9134, "loss": 0.5535, "learning_rate": 3.957053221046839e-05, "epoch": 0.3019239716467336, "percentage": 30.19, "elapsed_time": "2 days, 2:50:20", "remaining_time": "4 days, 21:31:49", "throughput": 2720.29, "total_tokens": 497867776} {"current_steps": 2759, "total_steps": 9134, "loss": 0.6142, "learning_rate": 3.956354410517057e-05, "epoch": 0.30203344371767155, "percentage": 30.21, "elapsed_time": "2 days, 2:51:25", "remaining_time": "4 days, 21:30:41", "throughput": 2720.26, "total_tokens": 498040928} {"current_steps": 2760, "total_steps": 9134, "loss": 0.7489, "learning_rate": 3.955655427703332e-05, "epoch": 0.3021429157886094, "percentage": 30.22, "elapsed_time": "2 days, 2:52:32", "remaining_time": "4 days, 21:29:37", "throughput": 2720.3, "total_tokens": 498231104} {"current_steps": 2761, "total_steps": 9134, "loss": 0.5415, "learning_rate": 3.954956272688353e-05, "epoch": 0.30225238785954733, "percentage": 30.23, "elapsed_time": "2 days, 2:53:36", "remaining_time": "4 days, 21:28:24", "throughput": 2720.36, "total_tokens": 498414560} {"current_steps": 2762, "total_steps": 9134, "loss": 0.6429, "learning_rate": 3.954256945554827e-05, "epoch": 0.30236185993048525, "percentage": 30.24, "elapsed_time": "2 days, 2:54:44", "remaining_time": "4 days, 21:27:21", "throughput": 2720.45, "total_tokens": 498616832} {"current_steps": 2763, "total_steps": 9134, "loss": 0.6342, "learning_rate": 3.9535574463854856e-05, "epoch": 0.3024713320014231, "percentage": 30.25, "elapsed_time": "2 days, 2:55:50", "remaining_time": "4 days, 21:26:13", "throughput": 2720.5, "total_tokens": 498804544} {"current_steps": 2764, "total_steps": 9134, "loss": 0.5288, "learning_rate": 3.952857775263077e-05, "epoch": 0.30258080407236104, "percentage": 30.26, "elapsed_time": "2 days, 2:56:54", "remaining_time": "4 days, 21:25:03", "throughput": 2720.53, "total_tokens": 498985088} {"current_steps": 2765, "total_steps": 9134, "loss": 0.6922, "learning_rate": 3.9521579322703704e-05, "epoch": 0.30269027614329896, "percentage": 30.27, "elapsed_time": "2 days, 2:58:01", "remaining_time": "4 days, 21:23:57", "throughput": 2720.54, "total_tokens": 499167200} {"current_steps": 2766, "total_steps": 9134, "loss": 0.7798, "learning_rate": 3.951457917490157e-05, "epoch": 0.30279974821423683, "percentage": 30.28, "elapsed_time": "2 days, 2:59:04", "remaining_time": "4 days, 21:22:43", "throughput": 2720.48, "total_tokens": 499329824} {"current_steps": 2767, "total_steps": 9134, "loss": 0.7547, "learning_rate": 3.950757731005247e-05, "epoch": 0.30290922028517475, "percentage": 30.29, "elapsed_time": "2 days, 3:00:06", "remaining_time": "4 days, 21:21:26", "throughput": 2720.4, "total_tokens": 499481696} {"current_steps": 2768, "total_steps": 9134, "loss": 0.686, "learning_rate": 3.95005737289847e-05, "epoch": 0.3030186923561127, "percentage": 30.3, "elapsed_time": "2 days, 3:01:14", "remaining_time": "4 days, 21:20:25", "throughput": 2720.52, "total_tokens": 499690912} {"current_steps": 2769, "total_steps": 9134, "loss": 0.7246, "learning_rate": 3.9493568432526787e-05, "epoch": 0.30312816442705054, "percentage": 30.32, "elapsed_time": "2 days, 3:02:23", "remaining_time": "4 days, 21:19:24", "throughput": 2720.65, "total_tokens": 499900576} {"current_steps": 2770, "total_steps": 9134, "loss": 0.8593, "learning_rate": 3.948656142150742e-05, "epoch": 0.30323763649798846, "percentage": 30.33, "elapsed_time": "2 days, 3:03:29", "remaining_time": "4 days, 21:18:18", "throughput": 2720.68, "total_tokens": 500088288} {"current_steps": 2771, "total_steps": 9134, "loss": 0.6, "learning_rate": 3.947955269675554e-05, "epoch": 0.3033471085689263, "percentage": 30.34, "elapsed_time": "2 days, 3:04:30", "remaining_time": "4 days, 21:16:58", "throughput": 2720.61, "total_tokens": 500239712} {"current_steps": 2772, "total_steps": 9134, "loss": 0.7396, "learning_rate": 3.9472542259100264e-05, "epoch": 0.30345658063986425, "percentage": 30.35, "elapsed_time": "2 days, 3:05:36", "remaining_time": "4 days, 21:15:51", "throughput": 2720.57, "total_tokens": 500411744} {"current_steps": 2773, "total_steps": 9134, "loss": 0.7097, "learning_rate": 3.94655301093709e-05, "epoch": 0.30356605271080217, "percentage": 30.36, "elapsed_time": "2 days, 3:06:45", "remaining_time": "4 days, 21:14:50", "throughput": 2720.61, "total_tokens": 500605280} {"current_steps": 2774, "total_steps": 9134, "loss": 0.6901, "learning_rate": 3.945851624839697e-05, "epoch": 0.30367552478174004, "percentage": 30.37, "elapsed_time": "2 days, 3:07:53", "remaining_time": "4 days, 21:13:49", "throughput": 2720.61, "total_tokens": 500793440} {"current_steps": 2775, "total_steps": 9134, "loss": 0.6398, "learning_rate": 3.9451500677008213e-05, "epoch": 0.30378499685267796, "percentage": 30.38, "elapsed_time": "2 days, 3:08:57", "remaining_time": "4 days, 21:12:37", "throughput": 2720.62, "total_tokens": 500969280} {"current_steps": 2776, "total_steps": 9134, "loss": 0.7351, "learning_rate": 3.944448339603455e-05, "epoch": 0.3038944689236159, "percentage": 30.39, "elapsed_time": "2 days, 3:10:01", "remaining_time": "4 days, 21:11:24", "throughput": 2720.53, "total_tokens": 501124064} {"current_steps": 2777, "total_steps": 9134, "loss": 0.9323, "learning_rate": 3.9437464406306124e-05, "epoch": 0.30400394099455375, "percentage": 30.4, "elapsed_time": "2 days, 3:11:09", "remaining_time": "4 days, 21:10:22", "throughput": 2720.53, "total_tokens": 501310880} {"current_steps": 2778, "total_steps": 9134, "loss": 0.7429, "learning_rate": 3.9430443708653255e-05, "epoch": 0.30411341306549167, "percentage": 30.41, "elapsed_time": "2 days, 3:12:14", "remaining_time": "4 days, 21:09:13", "throughput": 2720.45, "total_tokens": 501473280} {"current_steps": 2779, "total_steps": 9134, "loss": 0.7402, "learning_rate": 3.9423421303906474e-05, "epoch": 0.3042228851364296, "percentage": 30.42, "elapsed_time": "2 days, 3:13:21", "remaining_time": "4 days, 21:08:08", "throughput": 2720.48, "total_tokens": 501661664} {"current_steps": 2780, "total_steps": 9134, "loss": 0.7956, "learning_rate": 3.9416397192896523e-05, "epoch": 0.30433235720736745, "percentage": 30.44, "elapsed_time": "2 days, 3:14:26", "remaining_time": "4 days, 21:06:59", "throughput": 2720.44, "total_tokens": 501830784} {"current_steps": 2781, "total_steps": 9134, "loss": 0.881, "learning_rate": 3.940937137645435e-05, "epoch": 0.3044418292783054, "percentage": 30.45, "elapsed_time": "2 days, 3:15:32", "remaining_time": "4 days, 21:05:51", "throughput": 2720.41, "total_tokens": 502003712} {"current_steps": 2782, "total_steps": 9134, "loss": 0.8933, "learning_rate": 3.94023438554111e-05, "epoch": 0.3045513013492433, "percentage": 30.46, "elapsed_time": "2 days, 3:16:40", "remaining_time": "4 days, 21:04:49", "throughput": 2720.49, "total_tokens": 502203296} {"current_steps": 2783, "total_steps": 9134, "loss": 0.8568, "learning_rate": 3.939531463059809e-05, "epoch": 0.30466077342018116, "percentage": 30.47, "elapsed_time": "2 days, 3:17:50", "remaining_time": "4 days, 21:03:49", "throughput": 2720.66, "total_tokens": 502424384} {"current_steps": 2784, "total_steps": 9134, "loss": 0.9976, "learning_rate": 3.9388283702846876e-05, "epoch": 0.3047702454911191, "percentage": 30.48, "elapsed_time": "2 days, 3:18:56", "remaining_time": "4 days, 21:02:43", "throughput": 2720.79, "total_tokens": 502628672} {"current_steps": 2785, "total_steps": 9134, "loss": 0.6313, "learning_rate": 3.9381251072989216e-05, "epoch": 0.304879717562057, "percentage": 30.49, "elapsed_time": "2 days, 3:20:03", "remaining_time": "4 days, 21:01:39", "throughput": 2720.88, "total_tokens": 502828480} {"current_steps": 2786, "total_steps": 9134, "loss": 0.7279, "learning_rate": 3.937421674185704e-05, "epoch": 0.3049891896329949, "percentage": 30.5, "elapsed_time": "2 days, 3:21:12", "remaining_time": "4 days, 21:00:38", "throughput": 2720.96, "total_tokens": 503030752} {"current_steps": 2787, "total_steps": 9134, "loss": 0.7397, "learning_rate": 3.9367180710282504e-05, "epoch": 0.3050986617039328, "percentage": 30.51, "elapsed_time": "2 days, 3:22:20", "remaining_time": "4 days, 20:59:36", "throughput": 2720.9, "total_tokens": 503205472} {"current_steps": 2788, "total_steps": 9134, "loss": 0.839, "learning_rate": 3.936014297909796e-05, "epoch": 0.30520813377487066, "percentage": 30.52, "elapsed_time": "2 days, 3:23:27", "remaining_time": "4 days, 20:58:31", "throughput": 2720.9, "total_tokens": 503388032} {"current_steps": 2789, "total_steps": 9134, "loss": 0.6767, "learning_rate": 3.935310354913595e-05, "epoch": 0.3053176058458086, "percentage": 30.53, "elapsed_time": "2 days, 3:24:33", "remaining_time": "4 days, 20:57:23", "throughput": 2720.91, "total_tokens": 503568352} {"current_steps": 2790, "total_steps": 9134, "loss": 0.6014, "learning_rate": 3.934606242122922e-05, "epoch": 0.3054270779167465, "percentage": 30.55, "elapsed_time": "2 days, 3:25:37", "remaining_time": "4 days, 20:56:11", "throughput": 2720.88, "total_tokens": 503736576} {"current_steps": 2791, "total_steps": 9134, "loss": 0.6478, "learning_rate": 3.9339019596210746e-05, "epoch": 0.30553654998768437, "percentage": 30.56, "elapsed_time": "2 days, 3:26:43", "remaining_time": "4 days, 20:55:04", "throughput": 2720.98, "total_tokens": 503934592} {"current_steps": 2792, "total_steps": 9134, "loss": 0.5422, "learning_rate": 3.933197507491366e-05, "epoch": 0.3056460220586223, "percentage": 30.57, "elapsed_time": "2 days, 3:27:50", "remaining_time": "4 days, 20:54:00", "throughput": 2720.91, "total_tokens": 504105280} {"current_steps": 2793, "total_steps": 9134, "loss": 0.7855, "learning_rate": 3.932492885817132e-05, "epoch": 0.3057554941295602, "percentage": 30.58, "elapsed_time": "2 days, 3:28:58", "remaining_time": "4 days, 20:52:57", "throughput": 2720.95, "total_tokens": 504296800} {"current_steps": 2794, "total_steps": 9134, "loss": 0.7483, "learning_rate": 3.9317880946817274e-05, "epoch": 0.3058649662004981, "percentage": 30.59, "elapsed_time": "2 days, 3:30:07", "remaining_time": "4 days, 20:51:56", "throughput": 2721.0, "total_tokens": 504493696} {"current_steps": 2795, "total_steps": 9134, "loss": 0.7795, "learning_rate": 3.931083134168529e-05, "epoch": 0.305974438271436, "percentage": 30.6, "elapsed_time": "2 days, 3:31:15", "remaining_time": "4 days, 20:50:53", "throughput": 2721.12, "total_tokens": 504699552} {"current_steps": 2796, "total_steps": 9134, "loss": 0.596, "learning_rate": 3.9303780043609315e-05, "epoch": 0.3060839103423739, "percentage": 30.61, "elapsed_time": "2 days, 3:32:22", "remaining_time": "4 days, 20:49:48", "throughput": 2721.13, "total_tokens": 504885024} {"current_steps": 2797, "total_steps": 9134, "loss": 0.7177, "learning_rate": 3.9296727053423506e-05, "epoch": 0.3061933824133118, "percentage": 30.62, "elapsed_time": "2 days, 3:33:27", "remaining_time": "4 days, 20:48:39", "throughput": 2721.23, "total_tokens": 505080128} {"current_steps": 2798, "total_steps": 9134, "loss": 0.6644, "learning_rate": 3.9289672371962214e-05, "epoch": 0.3063028544842497, "percentage": 30.63, "elapsed_time": "2 days, 3:34:35", "remaining_time": "4 days, 20:47:36", "throughput": 2721.25, "total_tokens": 505268288} {"current_steps": 2799, "total_steps": 9134, "loss": 0.6082, "learning_rate": 3.928261600006e-05, "epoch": 0.30641232655518763, "percentage": 30.64, "elapsed_time": "2 days, 3:35:40", "remaining_time": "4 days, 20:46:28", "throughput": 2721.21, "total_tokens": 505439200} {"current_steps": 2800, "total_steps": 9134, "loss": 0.8565, "learning_rate": 3.9275557938551614e-05, "epoch": 0.3065217986261255, "percentage": 30.65, "elapsed_time": "2 days, 3:36:47", "remaining_time": "4 days, 20:45:22", "throughput": 2721.24, "total_tokens": 505626016} {"current_steps": 2801, "total_steps": 9134, "loss": 0.5678, "learning_rate": 3.926849818827202e-05, "epoch": 0.3066312706970634, "percentage": 30.67, "elapsed_time": "2 days, 3:37:53", "remaining_time": "4 days, 20:44:15", "throughput": 2721.18, "total_tokens": 505794688} {"current_steps": 2802, "total_steps": 9134, "loss": 0.5778, "learning_rate": 3.9261436750056364e-05, "epoch": 0.30674074276800134, "percentage": 30.68, "elapsed_time": "2 days, 3:38:59", "remaining_time": "4 days, 20:43:08", "throughput": 2721.15, "total_tokens": 505969408} {"current_steps": 2803, "total_steps": 9134, "loss": 0.7556, "learning_rate": 3.925437362474001e-05, "epoch": 0.3068502148389392, "percentage": 30.69, "elapsed_time": "2 days, 3:40:03", "remaining_time": "4 days, 20:41:57", "throughput": 2721.21, "total_tokens": 506154880} {"current_steps": 2804, "total_steps": 9134, "loss": 0.7718, "learning_rate": 3.924730881315849e-05, "epoch": 0.3069596869098771, "percentage": 30.7, "elapsed_time": "2 days, 3:41:07", "remaining_time": "4 days, 20:40:45", "throughput": 2721.15, "total_tokens": 506317280} {"current_steps": 2805, "total_steps": 9134, "loss": 0.6171, "learning_rate": 3.9240242316147586e-05, "epoch": 0.307069158980815, "percentage": 30.71, "elapsed_time": "2 days, 3:42:12", "remaining_time": "4 days, 20:39:37", "throughput": 2721.21, "total_tokens": 506506112} {"current_steps": 2806, "total_steps": 9134, "loss": 0.7287, "learning_rate": 3.923317413454324e-05, "epoch": 0.3071786310517529, "percentage": 30.72, "elapsed_time": "2 days, 3:43:21", "remaining_time": "4 days, 20:38:34", "throughput": 2721.3, "total_tokens": 506709504} {"current_steps": 2807, "total_steps": 9134, "loss": 0.7014, "learning_rate": 3.922610426918159e-05, "epoch": 0.30728810312269084, "percentage": 30.73, "elapsed_time": "2 days, 3:44:27", "remaining_time": "4 days, 20:37:27", "throughput": 2721.37, "total_tokens": 506902816} {"current_steps": 2808, "total_steps": 9134, "loss": 0.6937, "learning_rate": 3.921903272089901e-05, "epoch": 0.3073975751936287, "percentage": 30.74, "elapsed_time": "2 days, 3:45:30", "remaining_time": "4 days, 20:36:15", "throughput": 2721.24, "total_tokens": 507052000} {"current_steps": 2809, "total_steps": 9134, "loss": 0.8297, "learning_rate": 3.9211959490532044e-05, "epoch": 0.3075070472645666, "percentage": 30.75, "elapsed_time": "2 days, 3:46:35", "remaining_time": "4 days, 20:35:05", "throughput": 2721.29, "total_tokens": 507236800} {"current_steps": 2810, "total_steps": 9134, "loss": 0.4767, "learning_rate": 3.920488457891743e-05, "epoch": 0.30761651933550455, "percentage": 30.76, "elapsed_time": "2 days, 3:47:38", "remaining_time": "4 days, 20:33:52", "throughput": 2721.21, "total_tokens": 507393824} {"current_steps": 2811, "total_steps": 9134, "loss": 0.8102, "learning_rate": 3.919780798689213e-05, "epoch": 0.3077259914064424, "percentage": 30.78, "elapsed_time": "2 days, 3:48:45", "remaining_time": "4 days, 20:32:46", "throughput": 2721.19, "total_tokens": 507573024} {"current_steps": 2812, "total_steps": 9134, "loss": 0.7186, "learning_rate": 3.919072971529329e-05, "epoch": 0.30783546347738033, "percentage": 30.79, "elapsed_time": "2 days, 3:49:51", "remaining_time": "4 days, 20:31:39", "throughput": 2721.26, "total_tokens": 507764320} {"current_steps": 2813, "total_steps": 9134, "loss": 0.6168, "learning_rate": 3.918364976495825e-05, "epoch": 0.30794493554831825, "percentage": 30.8, "elapsed_time": "2 days, 3:50:53", "remaining_time": "4 days, 20:30:23", "throughput": 2721.19, "total_tokens": 507919552} {"current_steps": 2814, "total_steps": 9134, "loss": 0.7816, "learning_rate": 3.917656813672456e-05, "epoch": 0.3080544076192561, "percentage": 30.81, "elapsed_time": "2 days, 3:51:58", "remaining_time": "4 days, 20:29:13", "throughput": 2721.17, "total_tokens": 508092256} {"current_steps": 2815, "total_steps": 9134, "loss": 0.6203, "learning_rate": 3.916948483142996e-05, "epoch": 0.30816387969019404, "percentage": 30.82, "elapsed_time": "2 days, 3:53:02", "remaining_time": "4 days, 20:28:01", "throughput": 2721.13, "total_tokens": 508259360} {"current_steps": 2816, "total_steps": 9134, "loss": 0.8996, "learning_rate": 3.916239984991239e-05, "epoch": 0.30827335176113196, "percentage": 30.83, "elapsed_time": "2 days, 3:54:08", "remaining_time": "4 days, 20:26:55", "throughput": 2721.06, "total_tokens": 508426912} {"current_steps": 2817, "total_steps": 9134, "loss": 0.7073, "learning_rate": 3.915531319300999e-05, "epoch": 0.30838282383206983, "percentage": 30.84, "elapsed_time": "2 days, 3:55:13", "remaining_time": "4 days, 20:25:44", "throughput": 2721.08, "total_tokens": 508605888} {"current_steps": 2818, "total_steps": 9134, "loss": 0.6224, "learning_rate": 3.9148224861561105e-05, "epoch": 0.30849229590300775, "percentage": 30.85, "elapsed_time": "2 days, 3:56:18", "remaining_time": "4 days, 20:24:36", "throughput": 2721.07, "total_tokens": 508782176} {"current_steps": 2819, "total_steps": 9134, "loss": 0.6324, "learning_rate": 3.914113485640426e-05, "epoch": 0.3086017679739457, "percentage": 30.86, "elapsed_time": "2 days, 3:57:23", "remaining_time": "4 days, 20:23:26", "throughput": 2721.16, "total_tokens": 508975040} {"current_steps": 2820, "total_steps": 9134, "loss": 0.7823, "learning_rate": 3.91340431783782e-05, "epoch": 0.30871124004488354, "percentage": 30.87, "elapsed_time": "2 days, 3:58:31", "remaining_time": "4 days, 20:22:24", "throughput": 2721.29, "total_tokens": 509184928} {"current_steps": 2821, "total_steps": 9134, "loss": 0.7183, "learning_rate": 3.912694982832185e-05, "epoch": 0.30882071211582146, "percentage": 30.88, "elapsed_time": "2 days, 3:59:35", "remaining_time": "4 days, 20:21:12", "throughput": 2721.25, "total_tokens": 509351360} {"current_steps": 2822, "total_steps": 9134, "loss": 0.7218, "learning_rate": 3.9119854807074336e-05, "epoch": 0.3089301841867593, "percentage": 30.9, "elapsed_time": "2 days, 4:00:42", "remaining_time": "4 days, 20:20:06", "throughput": 2721.33, "total_tokens": 509547584} {"current_steps": 2823, "total_steps": 9134, "loss": 0.4951, "learning_rate": 3.911275811547499e-05, "epoch": 0.30903965625769725, "percentage": 30.91, "elapsed_time": "2 days, 4:01:43", "remaining_time": "4 days, 20:18:48", "throughput": 2721.25, "total_tokens": 509699680} {"current_steps": 2824, "total_steps": 9134, "loss": 0.8541, "learning_rate": 3.910565975436335e-05, "epoch": 0.30914912832863517, "percentage": 30.92, "elapsed_time": "2 days, 4:02:51", "remaining_time": "4 days, 20:17:46", "throughput": 2721.29, "total_tokens": 509892992} {"current_steps": 2825, "total_steps": 9134, "loss": 0.8201, "learning_rate": 3.909855972457912e-05, "epoch": 0.30925860039957304, "percentage": 30.93, "elapsed_time": "2 days, 4:03:57", "remaining_time": "4 days, 20:16:39", "throughput": 2721.3, "total_tokens": 510073984} {"current_steps": 2826, "total_steps": 9134, "loss": 0.6367, "learning_rate": 3.9091458026962226e-05, "epoch": 0.30936807247051096, "percentage": 30.94, "elapsed_time": "2 days, 4:05:01", "remaining_time": "4 days, 20:15:28", "throughput": 2721.29, "total_tokens": 510246464} {"current_steps": 2827, "total_steps": 9134, "loss": 0.7428, "learning_rate": 3.9084354662352784e-05, "epoch": 0.3094775445414489, "percentage": 30.95, "elapsed_time": "2 days, 4:06:07", "remaining_time": "4 days, 20:14:20", "throughput": 2721.26, "total_tokens": 510419616} {"current_steps": 2828, "total_steps": 9134, "loss": 0.6168, "learning_rate": 3.9077249631591106e-05, "epoch": 0.30958701661238675, "percentage": 30.96, "elapsed_time": "2 days, 4:07:08", "remaining_time": "4 days, 20:13:01", "throughput": 2721.22, "total_tokens": 510577984} {"current_steps": 2829, "total_steps": 9134, "loss": 0.9965, "learning_rate": 3.9070142935517714e-05, "epoch": 0.30969648868332467, "percentage": 30.97, "elapsed_time": "2 days, 4:08:17", "remaining_time": "4 days, 20:12:01", "throughput": 2721.24, "total_tokens": 510769056} {"current_steps": 2830, "total_steps": 9134, "loss": 0.7856, "learning_rate": 3.906303457497331e-05, "epoch": 0.3098059607542626, "percentage": 30.98, "elapsed_time": "2 days, 4:09:26", "remaining_time": "4 days, 20:11:00", "throughput": 2721.28, "total_tokens": 510964832} {"current_steps": 2831, "total_steps": 9134, "loss": 0.6376, "learning_rate": 3.9055924550798806e-05, "epoch": 0.30991543282520045, "percentage": 30.99, "elapsed_time": "2 days, 4:10:29", "remaining_time": "4 days, 20:09:46", "throughput": 2721.23, "total_tokens": 511126784} {"current_steps": 2832, "total_steps": 9134, "loss": 0.6484, "learning_rate": 3.904881286383529e-05, "epoch": 0.3100249048961384, "percentage": 31.01, "elapsed_time": "2 days, 4:11:32", "remaining_time": "4 days, 20:08:33", "throughput": 2721.18, "total_tokens": 511289184} {"current_steps": 2833, "total_steps": 9134, "loss": 0.8467, "learning_rate": 3.904169951492407e-05, "epoch": 0.3101343769670763, "percentage": 31.02, "elapsed_time": "2 days, 4:12:38", "remaining_time": "4 days, 20:07:27", "throughput": 2721.22, "total_tokens": 511478464} {"current_steps": 2834, "total_steps": 9134, "loss": 0.6678, "learning_rate": 3.903458450490664e-05, "epoch": 0.31024384903801416, "percentage": 31.03, "elapsed_time": "2 days, 4:13:47", "remaining_time": "4 days, 20:06:25", "throughput": 2721.19, "total_tokens": 511657664} {"current_steps": 2835, "total_steps": 9134, "loss": 0.7997, "learning_rate": 3.9027467834624696e-05, "epoch": 0.3103533211089521, "percentage": 31.04, "elapsed_time": "2 days, 4:14:55", "remaining_time": "4 days, 20:05:24", "throughput": 2721.06, "total_tokens": 511820288} {"current_steps": 2836, "total_steps": 9134, "loss": 0.7553, "learning_rate": 3.902034950492012e-05, "epoch": 0.31046279317989, "percentage": 31.05, "elapsed_time": "2 days, 4:16:01", "remaining_time": "4 days, 20:04:16", "throughput": 2721.04, "total_tokens": 511995680} {"current_steps": 2837, "total_steps": 9134, "loss": 0.7594, "learning_rate": 3.9013229516635e-05, "epoch": 0.3105722652508279, "percentage": 31.06, "elapsed_time": "2 days, 4:17:10", "remaining_time": "4 days, 20:03:16", "throughput": 2721.09, "total_tokens": 512193472} {"current_steps": 2838, "total_steps": 9134, "loss": 0.8091, "learning_rate": 3.900610787061162e-05, "epoch": 0.3106817373217658, "percentage": 31.07, "elapsed_time": "2 days, 4:18:19", "remaining_time": "4 days, 20:02:16", "throughput": 2721.2, "total_tokens": 512401344} {"current_steps": 2839, "total_steps": 9134, "loss": 0.6557, "learning_rate": 3.899898456769245e-05, "epoch": 0.31079120939270366, "percentage": 31.08, "elapsed_time": "2 days, 4:19:26", "remaining_time": "4 days, 20:01:10", "throughput": 2721.18, "total_tokens": 512578752} {"current_steps": 2840, "total_steps": 9134, "loss": 0.826, "learning_rate": 3.899185960872016e-05, "epoch": 0.3109006814636416, "percentage": 31.09, "elapsed_time": "2 days, 4:20:35", "remaining_time": "4 days, 20:00:10", "throughput": 2721.27, "total_tokens": 512783488} {"current_steps": 2841, "total_steps": 9134, "loss": 0.7326, "learning_rate": 3.8984732994537644e-05, "epoch": 0.3110101535345795, "percentage": 31.1, "elapsed_time": "2 days, 4:21:43", "remaining_time": "4 days, 19:59:07", "throughput": 2721.38, "total_tokens": 512990688} {"current_steps": 2842, "total_steps": 9134, "loss": 0.6607, "learning_rate": 3.8977604725987936e-05, "epoch": 0.31111962560551737, "percentage": 31.11, "elapsed_time": "2 days, 4:22:49", "remaining_time": "4 days, 19:58:00", "throughput": 2721.38, "total_tokens": 513169216} {"current_steps": 2843, "total_steps": 9134, "loss": 0.6077, "learning_rate": 3.897047480391431e-05, "epoch": 0.3112290976764553, "percentage": 31.13, "elapsed_time": "2 days, 4:23:58", "remaining_time": "4 days, 19:57:00", "throughput": 2721.43, "total_tokens": 513366112} {"current_steps": 2844, "total_steps": 9134, "loss": 0.5833, "learning_rate": 3.8963343229160235e-05, "epoch": 0.3113385697473932, "percentage": 31.14, "elapsed_time": "2 days, 4:25:06", "remaining_time": "4 days, 19:55:56", "throughput": 2721.36, "total_tokens": 513538144} {"current_steps": 2845, "total_steps": 9134, "loss": 0.5917, "learning_rate": 3.8956210002569334e-05, "epoch": 0.3114480418183311, "percentage": 31.15, "elapsed_time": "2 days, 4:26:12", "remaining_time": "4 days, 19:54:49", "throughput": 2721.32, "total_tokens": 513708608} {"current_steps": 2846, "total_steps": 9134, "loss": 0.6332, "learning_rate": 3.894907512498548e-05, "epoch": 0.311557513889269, "percentage": 31.16, "elapsed_time": "2 days, 4:27:15", "remaining_time": "4 days, 19:53:35", "throughput": 2721.25, "total_tokens": 513868096} {"current_steps": 2847, "total_steps": 9134, "loss": 0.6904, "learning_rate": 3.89419385972527e-05, "epoch": 0.3116669859602069, "percentage": 31.17, "elapsed_time": "2 days, 4:28:22", "remaining_time": "4 days, 19:52:30", "throughput": 2721.21, "total_tokens": 514042368} {"current_steps": 2848, "total_steps": 9134, "loss": 0.6416, "learning_rate": 3.893480042021523e-05, "epoch": 0.3117764580311448, "percentage": 31.18, "elapsed_time": "2 days, 4:29:30", "remaining_time": "4 days, 19:51:29", "throughput": 2721.32, "total_tokens": 514250016} {"current_steps": 2849, "total_steps": 9134, "loss": 0.7677, "learning_rate": 3.892766059471752e-05, "epoch": 0.3118859301020827, "percentage": 31.19, "elapsed_time": "2 days, 4:30:40", "remaining_time": "4 days, 19:50:29", "throughput": 2721.34, "total_tokens": 514442656} {"current_steps": 2850, "total_steps": 9134, "loss": 0.7286, "learning_rate": 3.892051912160418e-05, "epoch": 0.31199540217302063, "percentage": 31.2, "elapsed_time": "2 days, 4:31:45", "remaining_time": "4 days, 19:49:20", "throughput": 2721.32, "total_tokens": 514614912} {"current_steps": 2851, "total_steps": 9134, "loss": 0.8638, "learning_rate": 3.8913376001720046e-05, "epoch": 0.3121048742439585, "percentage": 31.21, "elapsed_time": "2 days, 4:32:49", "remaining_time": "4 days, 19:48:08", "throughput": 2721.37, "total_tokens": 514799488} {"current_steps": 2852, "total_steps": 9134, "loss": 0.7756, "learning_rate": 3.890623123591013e-05, "epoch": 0.3122143463148964, "percentage": 31.22, "elapsed_time": "2 days, 4:33:53", "remaining_time": "4 days, 19:46:58", "throughput": 2721.48, "total_tokens": 514996832} {"current_steps": 2853, "total_steps": 9134, "loss": 0.5609, "learning_rate": 3.889908482501963e-05, "epoch": 0.31232381838583434, "percentage": 31.23, "elapsed_time": "2 days, 4:34:59", "remaining_time": "4 days, 19:45:50", "throughput": 2721.47, "total_tokens": 515172896} {"current_steps": 2854, "total_steps": 9134, "loss": 0.8509, "learning_rate": 3.889193676989398e-05, "epoch": 0.3124332904567722, "percentage": 31.25, "elapsed_time": "2 days, 4:36:03", "remaining_time": "4 days, 19:44:39", "throughput": 2721.46, "total_tokens": 515345152} {"current_steps": 2855, "total_steps": 9134, "loss": 0.8009, "learning_rate": 3.888478707137875e-05, "epoch": 0.3125427625277101, "percentage": 31.26, "elapsed_time": "2 days, 4:37:12", "remaining_time": "4 days, 19:43:39", "throughput": 2721.59, "total_tokens": 515557952} {"current_steps": 2856, "total_steps": 9134, "loss": 0.6578, "learning_rate": 3.8877635730319774e-05, "epoch": 0.312652234598648, "percentage": 31.27, "elapsed_time": "2 days, 4:38:19", "remaining_time": "4 days, 19:42:34", "throughput": 2721.64, "total_tokens": 515750592} {"current_steps": 2857, "total_steps": 9134, "loss": 0.8557, "learning_rate": 3.8870482747563006e-05, "epoch": 0.3127617066695859, "percentage": 31.28, "elapsed_time": "2 days, 4:39:24", "remaining_time": "4 days, 19:41:23", "throughput": 2721.6, "total_tokens": 515917248} {"current_steps": 2858, "total_steps": 9134, "loss": 0.9126, "learning_rate": 3.886332812395465e-05, "epoch": 0.31287117874052384, "percentage": 31.29, "elapsed_time": "2 days, 4:40:32", "remaining_time": "4 days, 19:40:20", "throughput": 2721.68, "total_tokens": 516117952} {"current_steps": 2859, "total_steps": 9134, "loss": 0.7197, "learning_rate": 3.885617186034107e-05, "epoch": 0.3129806508114617, "percentage": 31.3, "elapsed_time": "2 days, 4:41:37", "remaining_time": "4 days, 19:39:13", "throughput": 2721.74, "total_tokens": 516309248} {"current_steps": 2860, "total_steps": 9134, "loss": 0.8931, "learning_rate": 3.884901395756886e-05, "epoch": 0.3130901228823996, "percentage": 31.31, "elapsed_time": "2 days, 4:42:43", "remaining_time": "4 days, 19:38:05", "throughput": 2721.82, "total_tokens": 516502112} {"current_steps": 2861, "total_steps": 9134, "loss": 1.0365, "learning_rate": 3.884185441648477e-05, "epoch": 0.31319959495333755, "percentage": 31.32, "elapsed_time": "2 days, 4:43:53", "remaining_time": "4 days, 19:37:06", "throughput": 2722.03, "total_tokens": 516731488} {"current_steps": 2862, "total_steps": 9134, "loss": 0.7319, "learning_rate": 3.883469323793576e-05, "epoch": 0.3133090670242754, "percentage": 31.33, "elapsed_time": "2 days, 4:44:57", "remaining_time": "4 days, 19:35:55", "throughput": 2722.12, "total_tokens": 516924352} {"current_steps": 2863, "total_steps": 9134, "loss": 0.9392, "learning_rate": 3.882753042276899e-05, "epoch": 0.31341853909521333, "percentage": 31.34, "elapsed_time": "2 days, 4:46:05", "remaining_time": "4 days, 19:34:52", "throughput": 2722.28, "total_tokens": 517138496} {"current_steps": 2864, "total_steps": 9134, "loss": 0.8536, "learning_rate": 3.882036597183181e-05, "epoch": 0.31352801116615125, "percentage": 31.36, "elapsed_time": "2 days, 4:47:14", "remaining_time": "4 days, 19:33:52", "throughput": 2722.35, "total_tokens": 517339872} {"current_steps": 2865, "total_steps": 9134, "loss": 0.8045, "learning_rate": 3.881319988597174e-05, "epoch": 0.3136374832370891, "percentage": 31.37, "elapsed_time": "2 days, 4:48:21", "remaining_time": "4 days, 19:32:46", "throughput": 2722.41, "total_tokens": 517532960} {"current_steps": 2866, "total_steps": 9134, "loss": 0.8623, "learning_rate": 3.8806032166036545e-05, "epoch": 0.31374695530802704, "percentage": 31.38, "elapsed_time": "2 days, 4:49:30", "remaining_time": "4 days, 19:31:46", "throughput": 2722.45, "total_tokens": 517729408} {"current_steps": 2867, "total_steps": 9134, "loss": 0.7046, "learning_rate": 3.8798862812874136e-05, "epoch": 0.31385642737896496, "percentage": 31.39, "elapsed_time": "2 days, 4:50:35", "remaining_time": "4 days, 19:30:36", "throughput": 2722.48, "total_tokens": 517910624} {"current_steps": 2868, "total_steps": 9134, "loss": 0.6361, "learning_rate": 3.8791691827332627e-05, "epoch": 0.31396589944990283, "percentage": 31.4, "elapsed_time": "2 days, 4:51:37", "remaining_time": "4 days, 19:29:22", "throughput": 2722.48, "total_tokens": 518083328} {"current_steps": 2869, "total_steps": 9134, "loss": 0.6417, "learning_rate": 3.8784519210260343e-05, "epoch": 0.31407537152084075, "percentage": 31.41, "elapsed_time": "2 days, 4:52:41", "remaining_time": "4 days, 19:28:10", "throughput": 2722.45, "total_tokens": 518250880} {"current_steps": 2870, "total_steps": 9134, "loss": 0.7183, "learning_rate": 3.877734496250579e-05, "epoch": 0.3141848435917787, "percentage": 31.42, "elapsed_time": "2 days, 4:53:45", "remaining_time": "4 days, 19:26:58", "throughput": 2722.43, "total_tokens": 518419776} {"current_steps": 2871, "total_steps": 9134, "loss": 0.6618, "learning_rate": 3.877016908491767e-05, "epoch": 0.31429431566271654, "percentage": 31.43, "elapsed_time": "2 days, 4:54:48", "remaining_time": "4 days, 19:25:44", "throughput": 2722.4, "total_tokens": 518585088} {"current_steps": 2872, "total_steps": 9134, "loss": 0.8113, "learning_rate": 3.8762991578344864e-05, "epoch": 0.31440378773365446, "percentage": 31.44, "elapsed_time": "2 days, 4:55:55", "remaining_time": "4 days, 19:24:40", "throughput": 2722.4, "total_tokens": 518769888} {"current_steps": 2873, "total_steps": 9134, "loss": 0.6016, "learning_rate": 3.8755812443636466e-05, "epoch": 0.3145132598045923, "percentage": 31.45, "elapsed_time": "2 days, 4:57:00", "remaining_time": "4 days, 19:23:30", "throughput": 2722.43, "total_tokens": 518951328} {"current_steps": 2874, "total_steps": 9134, "loss": 0.7797, "learning_rate": 3.8748631681641757e-05, "epoch": 0.31462273187553025, "percentage": 31.46, "elapsed_time": "2 days, 4:58:08", "remaining_time": "4 days, 19:22:27", "throughput": 2722.54, "total_tokens": 519157408} {"current_steps": 2875, "total_steps": 9134, "loss": 0.6789, "learning_rate": 3.8741449293210194e-05, "epoch": 0.31473220394646817, "percentage": 31.48, "elapsed_time": "2 days, 4:59:10", "remaining_time": "4 days, 19:21:12", "throughput": 2722.45, "total_tokens": 519308608} {"current_steps": 2876, "total_steps": 9134, "loss": 0.7589, "learning_rate": 3.8734265279191455e-05, "epoch": 0.31484167601740604, "percentage": 31.49, "elapsed_time": "2 days, 5:00:19", "remaining_time": "4 days, 19:20:11", "throughput": 2722.55, "total_tokens": 519516032} {"current_steps": 2877, "total_steps": 9134, "loss": 0.5528, "learning_rate": 3.872707964043539e-05, "epoch": 0.31495114808834396, "percentage": 31.5, "elapsed_time": "2 days, 5:01:23", "remaining_time": "4 days, 19:19:00", "throughput": 2722.53, "total_tokens": 519686944} {"current_steps": 2878, "total_steps": 9134, "loss": 0.6317, "learning_rate": 3.871989237779204e-05, "epoch": 0.3150606201592819, "percentage": 31.51, "elapsed_time": "2 days, 5:02:26", "remaining_time": "4 days, 19:17:46", "throughput": 2722.48, "total_tokens": 519847776} {"current_steps": 2879, "total_steps": 9134, "loss": 0.5936, "learning_rate": 3.8712703492111656e-05, "epoch": 0.31517009223021974, "percentage": 31.52, "elapsed_time": "2 days, 5:03:35", "remaining_time": "4 days, 19:16:44", "throughput": 2722.53, "total_tokens": 520044224} {"current_steps": 2880, "total_steps": 9134, "loss": 0.5583, "learning_rate": 3.8705512984244665e-05, "epoch": 0.31527956430115767, "percentage": 31.53, "elapsed_time": "2 days, 5:04:43", "remaining_time": "4 days, 19:15:42", "throughput": 2722.54, "total_tokens": 520232160} {"current_steps": 2881, "total_steps": 9134, "loss": 0.6576, "learning_rate": 3.869832085504168e-05, "epoch": 0.3153890363720956, "percentage": 31.54, "elapsed_time": "2 days, 5:05:50", "remaining_time": "4 days, 19:14:39", "throughput": 2722.59, "total_tokens": 520425472} {"current_steps": 2882, "total_steps": 9134, "loss": 0.6297, "learning_rate": 3.869112710535353e-05, "epoch": 0.31549850844303345, "percentage": 31.55, "elapsed_time": "2 days, 5:07:00", "remaining_time": "4 days, 19:13:38", "throughput": 2722.75, "total_tokens": 520643872} {"current_steps": 2883, "total_steps": 9134, "loss": 0.5198, "learning_rate": 3.868393173603122e-05, "epoch": 0.3156079805139714, "percentage": 31.56, "elapsed_time": "2 days, 5:08:04", "remaining_time": "4 days, 19:12:28", "throughput": 2722.72, "total_tokens": 520814336} {"current_steps": 2884, "total_steps": 9134, "loss": 0.6114, "learning_rate": 3.867673474792593e-05, "epoch": 0.3157174525849093, "percentage": 31.57, "elapsed_time": "2 days, 5:09:09", "remaining_time": "4 days, 19:11:20", "throughput": 2722.59, "total_tokens": 520967552} {"current_steps": 2885, "total_steps": 9134, "loss": 0.6074, "learning_rate": 3.866953614188908e-05, "epoch": 0.31582692465584716, "percentage": 31.59, "elapsed_time": "2 days, 5:10:16", "remaining_time": "4 days, 19:10:15", "throughput": 2722.6, "total_tokens": 521151008} {"current_steps": 2886, "total_steps": 9134, "loss": 0.5478, "learning_rate": 3.866233591877223e-05, "epoch": 0.3159363967267851, "percentage": 31.6, "elapsed_time": "2 days, 5:11:23", "remaining_time": "4 days, 19:09:10", "throughput": 2722.66, "total_tokens": 521344768} {"current_steps": 2887, "total_steps": 9134, "loss": 0.4603, "learning_rate": 3.865513407942716e-05, "epoch": 0.316045868797723, "percentage": 31.61, "elapsed_time": "2 days, 5:12:23", "remaining_time": "4 days, 19:07:48", "throughput": 2722.57, "total_tokens": 521489472} {"current_steps": 2888, "total_steps": 9134, "loss": 0.792, "learning_rate": 3.864793062470583e-05, "epoch": 0.3161553408686609, "percentage": 31.62, "elapsed_time": "2 days, 5:13:30", "remaining_time": "4 days, 19:06:45", "throughput": 2722.62, "total_tokens": 521684352} {"current_steps": 2889, "total_steps": 9134, "loss": 0.8604, "learning_rate": 3.864072555546041e-05, "epoch": 0.3162648129395988, "percentage": 31.63, "elapsed_time": "2 days, 5:14:39", "remaining_time": "4 days, 19:05:43", "throughput": 2722.71, "total_tokens": 521887296} {"current_steps": 2890, "total_steps": 9134, "loss": 0.787, "learning_rate": 3.863351887254322e-05, "epoch": 0.31637428501053666, "percentage": 31.64, "elapsed_time": "2 days, 5:15:48", "remaining_time": "4 days, 19:04:42", "throughput": 2722.76, "total_tokens": 522084640} {"current_steps": 2891, "total_steps": 9134, "loss": 0.691, "learning_rate": 3.862631057680681e-05, "epoch": 0.3164837570814746, "percentage": 31.65, "elapsed_time": "2 days, 5:16:56", "remaining_time": "4 days, 19:03:39", "throughput": 2722.8, "total_tokens": 522277504} {"current_steps": 2892, "total_steps": 9134, "loss": 0.7287, "learning_rate": 3.8619100669103916e-05, "epoch": 0.3165932291524125, "percentage": 31.66, "elapsed_time": "2 days, 5:18:01", "remaining_time": "4 days, 19:02:31", "throughput": 2722.88, "total_tokens": 522471488} {"current_steps": 2893, "total_steps": 9134, "loss": 0.7116, "learning_rate": 3.861188915028744e-05, "epoch": 0.31670270122335037, "percentage": 31.67, "elapsed_time": "2 days, 5:19:10", "remaining_time": "4 days, 19:01:30", "throughput": 2723.06, "total_tokens": 522693024} {"current_steps": 2894, "total_steps": 9134, "loss": 0.7532, "learning_rate": 3.8604676021210506e-05, "epoch": 0.3168121732942883, "percentage": 31.68, "elapsed_time": "2 days, 5:20:18", "remaining_time": "4 days, 19:00:27", "throughput": 2723.2, "total_tokens": 522905600} {"current_steps": 2895, "total_steps": 9134, "loss": 0.5196, "learning_rate": 3.85974612827264e-05, "epoch": 0.3169216453652262, "percentage": 31.69, "elapsed_time": "2 days, 5:21:22", "remaining_time": "4 days, 18:59:16", "throughput": 2723.14, "total_tokens": 523067552} {"current_steps": 2896, "total_steps": 9134, "loss": 0.8541, "learning_rate": 3.859024493568862e-05, "epoch": 0.3170311174361641, "percentage": 31.71, "elapsed_time": "2 days, 5:22:30", "remaining_time": "4 days, 18:58:14", "throughput": 2723.24, "total_tokens": 523273408} {"current_steps": 2897, "total_steps": 9134, "loss": 0.7167, "learning_rate": 3.8583026980950846e-05, "epoch": 0.317140589507102, "percentage": 31.72, "elapsed_time": "2 days, 5:23:37", "remaining_time": "4 days, 18:57:07", "throughput": 2723.14, "total_tokens": 523433344} {"current_steps": 2898, "total_steps": 9134, "loss": 0.5849, "learning_rate": 3.857580741936695e-05, "epoch": 0.3172500615780399, "percentage": 31.73, "elapsed_time": "2 days, 5:24:38", "remaining_time": "4 days, 18:55:51", "throughput": 2723.08, "total_tokens": 523590816} {"current_steps": 2899, "total_steps": 9134, "loss": 0.7044, "learning_rate": 3.856858625179098e-05, "epoch": 0.3173595336489778, "percentage": 31.74, "elapsed_time": "2 days, 5:25:46", "remaining_time": "4 days, 18:54:47", "throughput": 2723.19, "total_tokens": 523795776} {"current_steps": 2900, "total_steps": 9134, "loss": 0.7911, "learning_rate": 3.85613634790772e-05, "epoch": 0.3174690057199157, "percentage": 31.75, "elapsed_time": "2 days, 5:26:51", "remaining_time": "4 days, 18:53:37", "throughput": 2723.19, "total_tokens": 523971840} {"current_steps": 2901, "total_steps": 9134, "loss": 0.7645, "learning_rate": 3.8554139102080044e-05, "epoch": 0.31757847779085363, "percentage": 31.76, "elapsed_time": "2 days, 5:27:59", "remaining_time": "4 days, 18:52:34", "throughput": 2723.25, "total_tokens": 524167840} {"current_steps": 2902, "total_steps": 9134, "loss": 0.6904, "learning_rate": 3.854691312165414e-05, "epoch": 0.3176879498617915, "percentage": 31.77, "elapsed_time": "2 days, 5:29:03", "remaining_time": "4 days, 18:51:23", "throughput": 2723.18, "total_tokens": 524330240} {"current_steps": 2903, "total_steps": 9134, "loss": 0.7055, "learning_rate": 3.8539685538654325e-05, "epoch": 0.3177974219327294, "percentage": 31.78, "elapsed_time": "2 days, 5:30:12", "remaining_time": "4 days, 18:50:22", "throughput": 2723.13, "total_tokens": 524507200} {"current_steps": 2904, "total_steps": 9134, "loss": 0.7334, "learning_rate": 3.853245635393558e-05, "epoch": 0.31790689400366734, "percentage": 31.79, "elapsed_time": "2 days, 5:31:17", "remaining_time": "4 days, 18:49:13", "throughput": 2723.08, "total_tokens": 524675648} {"current_steps": 2905, "total_steps": 9134, "loss": 0.6949, "learning_rate": 3.852522556835313e-05, "epoch": 0.3180163660746052, "percentage": 31.8, "elapsed_time": "2 days, 5:32:22", "remaining_time": "4 days, 18:48:04", "throughput": 2723.11, "total_tokens": 524858432} {"current_steps": 2906, "total_steps": 9134, "loss": 0.6758, "learning_rate": 3.8517993182762334e-05, "epoch": 0.3181258381455431, "percentage": 31.82, "elapsed_time": "2 days, 5:33:28", "remaining_time": "4 days, 18:46:58", "throughput": 2723.08, "total_tokens": 525032480} {"current_steps": 2907, "total_steps": 9134, "loss": 0.6856, "learning_rate": 3.8510759198018805e-05, "epoch": 0.318235310216481, "percentage": 31.83, "elapsed_time": "2 days, 5:34:34", "remaining_time": "4 days, 18:45:50", "throughput": 2723.1, "total_tokens": 525216832} {"current_steps": 2908, "total_steps": 9134, "loss": 0.6203, "learning_rate": 3.8503523614978274e-05, "epoch": 0.3183447822874189, "percentage": 31.84, "elapsed_time": "2 days, 5:35:41", "remaining_time": "4 days, 18:44:46", "throughput": 2723.13, "total_tokens": 525407008} {"current_steps": 2909, "total_steps": 9134, "loss": 0.7456, "learning_rate": 3.849628643449673e-05, "epoch": 0.31845425435835684, "percentage": 31.85, "elapsed_time": "2 days, 5:36:48", "remaining_time": "4 days, 18:43:40", "throughput": 2723.05, "total_tokens": 525571648} {"current_steps": 2910, "total_steps": 9134, "loss": 0.5976, "learning_rate": 3.8489047657430286e-05, "epoch": 0.3185637264292947, "percentage": 31.86, "elapsed_time": "2 days, 5:37:54", "remaining_time": "4 days, 18:42:34", "throughput": 2722.98, "total_tokens": 525740096} {"current_steps": 2911, "total_steps": 9134, "loss": 0.8062, "learning_rate": 3.84818072846353e-05, "epoch": 0.3186731985002326, "percentage": 31.87, "elapsed_time": "2 days, 5:38:58", "remaining_time": "4 days, 18:41:22", "throughput": 2722.97, "total_tokens": 525909216} {"current_steps": 2912, "total_steps": 9134, "loss": 0.7807, "learning_rate": 3.8474565316968284e-05, "epoch": 0.31878267057117055, "percentage": 31.88, "elapsed_time": "2 days, 5:39:59", "remaining_time": "4 days, 18:40:05", "throughput": 2722.91, "total_tokens": 526065344} {"current_steps": 2913, "total_steps": 9134, "loss": 0.8759, "learning_rate": 3.846732175528595e-05, "epoch": 0.3188921426421084, "percentage": 31.89, "elapsed_time": "2 days, 5:41:05", "remaining_time": "4 days, 18:38:58", "throughput": 2722.92, "total_tokens": 526248576} {"current_steps": 2914, "total_steps": 9134, "loss": 0.7472, "learning_rate": 3.84600766004452e-05, "epoch": 0.31900161471304633, "percentage": 31.9, "elapsed_time": "2 days, 5:42:12", "remaining_time": "4 days, 18:37:52", "throughput": 2722.94, "total_tokens": 526432704} {"current_steps": 2915, "total_steps": 9134, "loss": 0.7634, "learning_rate": 3.845282985330311e-05, "epoch": 0.31911108678398425, "percentage": 31.91, "elapsed_time": "2 days, 5:43:16", "remaining_time": "4 days, 18:36:41", "throughput": 2722.83, "total_tokens": 526586368} {"current_steps": 2916, "total_steps": 9134, "loss": 0.601, "learning_rate": 3.8445581514716977e-05, "epoch": 0.3192205588549221, "percentage": 31.92, "elapsed_time": "2 days, 5:44:15", "remaining_time": "4 days, 18:35:20", "throughput": 2722.69, "total_tokens": 526721216} {"current_steps": 2917, "total_steps": 9134, "loss": 0.8711, "learning_rate": 3.843833158554425e-05, "epoch": 0.31933003092586004, "percentage": 31.94, "elapsed_time": "2 days, 5:45:25", "remaining_time": "4 days, 18:34:20", "throughput": 2722.9, "total_tokens": 526950592} {"current_steps": 2918, "total_steps": 9134, "loss": 0.7113, "learning_rate": 3.843108006664259e-05, "epoch": 0.31943950299679796, "percentage": 31.95, "elapsed_time": "2 days, 5:46:27", "remaining_time": "4 days, 18:33:04", "throughput": 2722.86, "total_tokens": 527112096} {"current_steps": 2919, "total_steps": 9134, "loss": 0.7535, "learning_rate": 3.8423826958869825e-05, "epoch": 0.31954897506773583, "percentage": 31.96, "elapsed_time": "2 days, 5:47:34", "remaining_time": "4 days, 18:31:59", "throughput": 2722.91, "total_tokens": 527303616} {"current_steps": 2920, "total_steps": 9134, "loss": 0.8099, "learning_rate": 3.841657226308399e-05, "epoch": 0.31965844713867375, "percentage": 31.97, "elapsed_time": "2 days, 5:48:43", "remaining_time": "4 days, 18:30:59", "throughput": 2722.93, "total_tokens": 527494688} {"current_steps": 2921, "total_steps": 9134, "loss": 0.5972, "learning_rate": 3.840931598014332e-05, "epoch": 0.3197679192096117, "percentage": 31.98, "elapsed_time": "2 days, 5:49:46", "remaining_time": "4 days, 18:29:45", "throughput": 2722.81, "total_tokens": 527643872} {"current_steps": 2922, "total_steps": 9134, "loss": 0.5544, "learning_rate": 3.840205811090619e-05, "epoch": 0.31987739128054954, "percentage": 31.99, "elapsed_time": "2 days, 5:50:48", "remaining_time": "4 days, 18:28:30", "throughput": 2722.82, "total_tokens": 527814336} {"current_steps": 2923, "total_steps": 9134, "loss": 0.8348, "learning_rate": 3.8394798656231215e-05, "epoch": 0.31998686335148746, "percentage": 32.0, "elapsed_time": "2 days, 5:51:56", "remaining_time": "4 days, 18:27:27", "throughput": 2722.91, "total_tokens": 528016160} {"current_steps": 2924, "total_steps": 9134, "loss": 0.9048, "learning_rate": 3.8387537616977165e-05, "epoch": 0.3200963354224253, "percentage": 32.01, "elapsed_time": "2 days, 5:53:04", "remaining_time": "4 days, 18:26:25", "throughput": 2723.04, "total_tokens": 528228064} {"current_steps": 2925, "total_steps": 9134, "loss": 0.562, "learning_rate": 3.8380274994003e-05, "epoch": 0.32020580749336325, "percentage": 32.02, "elapsed_time": "2 days, 5:54:06", "remaining_time": "4 days, 18:25:08", "throughput": 2722.93, "total_tokens": 528374112} {"current_steps": 2926, "total_steps": 9134, "loss": 0.7073, "learning_rate": 3.837301078816789e-05, "epoch": 0.32031527956430117, "percentage": 32.03, "elapsed_time": "2 days, 5:55:12", "remaining_time": "4 days, 18:24:02", "throughput": 2722.82, "total_tokens": 528534944} {"current_steps": 2927, "total_steps": 9134, "loss": 0.6107, "learning_rate": 3.8365745000331164e-05, "epoch": 0.32042475163523904, "percentage": 32.05, "elapsed_time": "2 days, 5:56:18", "remaining_time": "4 days, 18:22:54", "throughput": 2722.79, "total_tokens": 528705856} {"current_steps": 2928, "total_steps": 9134, "loss": 0.5801, "learning_rate": 3.8358477631352364e-05, "epoch": 0.32053422370617696, "percentage": 32.06, "elapsed_time": "2 days, 5:57:20", "remaining_time": "4 days, 18:21:40", "throughput": 2722.71, "total_tokens": 528861312} {"current_steps": 2929, "total_steps": 9134, "loss": 0.8095, "learning_rate": 3.8351208682091185e-05, "epoch": 0.3206436957771149, "percentage": 32.07, "elapsed_time": "2 days, 5:58:26", "remaining_time": "4 days, 18:20:32", "throughput": 2722.76, "total_tokens": 529051040} {"current_steps": 2930, "total_steps": 9134, "loss": 0.6655, "learning_rate": 3.834393815340754e-05, "epoch": 0.32075316784805274, "percentage": 32.08, "elapsed_time": "2 days, 5:59:32", "remaining_time": "4 days, 18:19:26", "throughput": 2722.87, "total_tokens": 529252416} {"current_steps": 2931, "total_steps": 9134, "loss": 0.6824, "learning_rate": 3.833666604616153e-05, "epoch": 0.32086263991899067, "percentage": 32.09, "elapsed_time": "2 days, 6:00:39", "remaining_time": "4 days, 18:18:21", "throughput": 2722.9, "total_tokens": 529439904} {"current_steps": 2932, "total_steps": 9134, "loss": 0.7335, "learning_rate": 3.832939236121342e-05, "epoch": 0.3209721119899286, "percentage": 32.1, "elapsed_time": "2 days, 6:01:42", "remaining_time": "4 days, 18:17:08", "throughput": 2722.84, "total_tokens": 529600512} {"current_steps": 2933, "total_steps": 9134, "loss": 0.7757, "learning_rate": 3.8322117099423674e-05, "epoch": 0.32108158406086645, "percentage": 32.11, "elapsed_time": "2 days, 6:02:48", "remaining_time": "4 days, 18:16:00", "throughput": 2722.93, "total_tokens": 529796064} {"current_steps": 2934, "total_steps": 9134, "loss": 0.7436, "learning_rate": 3.8314840261652954e-05, "epoch": 0.3211910561318044, "percentage": 32.12, "elapsed_time": "2 days, 6:03:53", "remaining_time": "4 days, 18:14:50", "throughput": 2722.93, "total_tokens": 529973024} {"current_steps": 2935, "total_steps": 9134, "loss": 0.6174, "learning_rate": 3.8307561848762066e-05, "epoch": 0.3213005282027423, "percentage": 32.13, "elapsed_time": "2 days, 6:05:01", "remaining_time": "4 days, 18:13:47", "throughput": 2722.93, "total_tokens": 530156928} {"current_steps": 2936, "total_steps": 9134, "loss": 0.8203, "learning_rate": 3.8300281861612056e-05, "epoch": 0.32141000027368016, "percentage": 32.14, "elapsed_time": "2 days, 6:06:10", "remaining_time": "4 days, 18:12:48", "throughput": 2723.04, "total_tokens": 530369056} {"current_steps": 2937, "total_steps": 9134, "loss": 0.69, "learning_rate": 3.829300030106413e-05, "epoch": 0.3215194723446181, "percentage": 32.15, "elapsed_time": "2 days, 6:07:20", "remaining_time": "4 days, 18:11:47", "throughput": 2723.02, "total_tokens": 530553408} {"current_steps": 2938, "total_steps": 9134, "loss": 0.836, "learning_rate": 3.828571716797968e-05, "epoch": 0.321628944415556, "percentage": 32.17, "elapsed_time": "2 days, 6:08:29", "remaining_time": "4 days, 18:10:48", "throughput": 2723.1, "total_tokens": 530759040} {"current_steps": 2939, "total_steps": 9134, "loss": 0.668, "learning_rate": 3.827843246322029e-05, "epoch": 0.3217384164864939, "percentage": 32.18, "elapsed_time": "2 days, 6:09:35", "remaining_time": "4 days, 18:09:41", "throughput": 2723.22, "total_tokens": 530961536} {"current_steps": 2940, "total_steps": 9134, "loss": 0.9635, "learning_rate": 3.827114618764772e-05, "epoch": 0.3218478885574318, "percentage": 32.19, "elapsed_time": "2 days, 6:10:44", "remaining_time": "4 days, 18:08:40", "throughput": 2723.23, "total_tokens": 531151712} {"current_steps": 2941, "total_steps": 9134, "loss": 0.8707, "learning_rate": 3.8263858342123936e-05, "epoch": 0.32195736062836966, "percentage": 32.2, "elapsed_time": "2 days, 6:11:51", "remaining_time": "4 days, 18:07:35", "throughput": 2723.33, "total_tokens": 531353312} {"current_steps": 2942, "total_steps": 9134, "loss": 0.7634, "learning_rate": 3.8256568927511047e-05, "epoch": 0.3220668326993076, "percentage": 32.21, "elapsed_time": "2 days, 6:13:00", "remaining_time": "4 days, 18:06:35", "throughput": 2723.34, "total_tokens": 531543488} {"current_steps": 2943, "total_steps": 9134, "loss": 0.7338, "learning_rate": 3.8249277944671415e-05, "epoch": 0.3221763047702455, "percentage": 32.22, "elapsed_time": "2 days, 6:14:08", "remaining_time": "4 days, 18:05:31", "throughput": 2723.37, "total_tokens": 531733216} {"current_steps": 2944, "total_steps": 9134, "loss": 0.7396, "learning_rate": 3.824198539446752e-05, "epoch": 0.32228577684118337, "percentage": 32.23, "elapsed_time": "2 days, 6:15:13", "remaining_time": "4 days, 18:04:23", "throughput": 2723.37, "total_tokens": 531911520} {"current_steps": 2945, "total_steps": 9134, "loss": 0.6152, "learning_rate": 3.823469127776208e-05, "epoch": 0.3223952489121213, "percentage": 32.24, "elapsed_time": "2 days, 6:16:16", "remaining_time": "4 days, 18:03:08", "throughput": 2723.3, "total_tokens": 532068096} {"current_steps": 2946, "total_steps": 9134, "loss": 0.5899, "learning_rate": 3.822739559541795e-05, "epoch": 0.3225047209830592, "percentage": 32.25, "elapsed_time": "2 days, 6:17:22", "remaining_time": "4 days, 18:02:03", "throughput": 2723.25, "total_tokens": 532240576} {"current_steps": 2947, "total_steps": 9134, "loss": 0.6232, "learning_rate": 3.8220098348298204e-05, "epoch": 0.3226141930539971, "percentage": 32.26, "elapsed_time": "2 days, 6:18:30", "remaining_time": "4 days, 18:01:00", "throughput": 2723.28, "total_tokens": 532431648} {"current_steps": 2948, "total_steps": 9134, "loss": 0.7026, "learning_rate": 3.8212799537266105e-05, "epoch": 0.322723665124935, "percentage": 32.28, "elapsed_time": "2 days, 6:19:35", "remaining_time": "4 days, 17:59:49", "throughput": 2723.22, "total_tokens": 532594944} {"current_steps": 2949, "total_steps": 9134, "loss": 0.796, "learning_rate": 3.8205499163185074e-05, "epoch": 0.3228331371958729, "percentage": 32.29, "elapsed_time": "2 days, 6:20:44", "remaining_time": "4 days, 17:58:49", "throughput": 2723.16, "total_tokens": 532771008} {"current_steps": 2950, "total_steps": 9134, "loss": 0.7151, "learning_rate": 3.819819722691874e-05, "epoch": 0.3229426092668108, "percentage": 32.3, "elapsed_time": "2 days, 6:21:49", "remaining_time": "4 days, 17:57:40", "throughput": 2723.15, "total_tokens": 532947072} {"current_steps": 2951, "total_steps": 9134, "loss": 0.8587, "learning_rate": 3.8190893729330904e-05, "epoch": 0.3230520813377487, "percentage": 32.31, "elapsed_time": "2 days, 6:22:59", "remaining_time": "4 days, 17:56:40", "throughput": 2723.31, "total_tokens": 533166592} {"current_steps": 2952, "total_steps": 9134, "loss": 0.7172, "learning_rate": 3.8183588671285556e-05, "epoch": 0.32316155340868663, "percentage": 32.32, "elapsed_time": "2 days, 6:24:08", "remaining_time": "4 days, 17:55:40", "throughput": 2723.42, "total_tokens": 533376480} {"current_steps": 2953, "total_steps": 9134, "loss": 0.6343, "learning_rate": 3.817628205364687e-05, "epoch": 0.3232710254796245, "percentage": 32.33, "elapsed_time": "2 days, 6:25:16", "remaining_time": "4 days, 17:54:38", "throughput": 2723.34, "total_tokens": 533547168} {"current_steps": 2954, "total_steps": 9134, "loss": 0.8268, "learning_rate": 3.816897387727921e-05, "epoch": 0.3233804975505624, "percentage": 32.34, "elapsed_time": "2 days, 6:26:20", "remaining_time": "4 days, 17:53:26", "throughput": 2723.3, "total_tokens": 533713376} {"current_steps": 2955, "total_steps": 9134, "loss": 0.8066, "learning_rate": 3.816166414304711e-05, "epoch": 0.32348996962150034, "percentage": 32.35, "elapsed_time": "2 days, 6:27:29", "remaining_time": "4 days, 17:52:24", "throughput": 2723.27, "total_tokens": 533893696} {"current_steps": 2956, "total_steps": 9134, "loss": 0.7821, "learning_rate": 3.81543528518153e-05, "epoch": 0.3235994416924382, "percentage": 32.36, "elapsed_time": "2 days, 6:28:38", "remaining_time": "4 days, 17:51:24", "throughput": 2723.37, "total_tokens": 534101792} {"current_steps": 2957, "total_steps": 9134, "loss": 0.8894, "learning_rate": 3.81470400044487e-05, "epoch": 0.3237089137633761, "percentage": 32.37, "elapsed_time": "2 days, 6:29:44", "remaining_time": "4 days, 17:50:17", "throughput": 2723.43, "total_tokens": 534293536} {"current_steps": 2958, "total_steps": 9134, "loss": 0.7484, "learning_rate": 3.81397256018124e-05, "epoch": 0.323818385834314, "percentage": 32.38, "elapsed_time": "2 days, 6:30:46", "remaining_time": "4 days, 17:49:02", "throughput": 2723.44, "total_tokens": 534464896} {"current_steps": 2959, "total_steps": 9134, "loss": 0.605, "learning_rate": 3.8132409644771683e-05, "epoch": 0.3239278579052519, "percentage": 32.4, "elapsed_time": "2 days, 6:31:53", "remaining_time": "4 days, 17:47:57", "throughput": 2723.53, "total_tokens": 534665600} {"current_steps": 2960, "total_steps": 9134, "loss": 0.6027, "learning_rate": 3.812509213419201e-05, "epoch": 0.32403732997618984, "percentage": 32.41, "elapsed_time": "2 days, 6:32:56", "remaining_time": "4 days, 17:46:44", "throughput": 2723.5, "total_tokens": 534832928} {"current_steps": 2961, "total_steps": 9134, "loss": 0.8371, "learning_rate": 3.8117773070939025e-05, "epoch": 0.3241468020471277, "percentage": 32.42, "elapsed_time": "2 days, 6:34:05", "remaining_time": "4 days, 17:45:42", "throughput": 2723.44, "total_tokens": 535006080} {"current_steps": 2962, "total_steps": 9134, "loss": 0.7262, "learning_rate": 3.811045245587856e-05, "epoch": 0.3242562741180656, "percentage": 32.43, "elapsed_time": "2 days, 6:35:14", "remaining_time": "4 days, 17:44:42", "throughput": 2723.51, "total_tokens": 535208576} {"current_steps": 2963, "total_steps": 9134, "loss": 0.7924, "learning_rate": 3.810313028987663e-05, "epoch": 0.32436574618900355, "percentage": 32.44, "elapsed_time": "2 days, 6:36:20", "remaining_time": "4 days, 17:43:36", "throughput": 2723.43, "total_tokens": 535373664} {"current_steps": 2964, "total_steps": 9134, "loss": 0.6628, "learning_rate": 3.809580657379944e-05, "epoch": 0.3244752182599414, "percentage": 32.45, "elapsed_time": "2 days, 6:37:28", "remaining_time": "4 days, 17:42:31", "throughput": 2723.5, "total_tokens": 535570560} {"current_steps": 2965, "total_steps": 9134, "loss": 0.5767, "learning_rate": 3.8088481308513375e-05, "epoch": 0.32458469033087933, "percentage": 32.46, "elapsed_time": "2 days, 6:38:35", "remaining_time": "4 days, 17:41:27", "throughput": 2723.54, "total_tokens": 535761408} {"current_steps": 2966, "total_steps": 9134, "loss": 0.7851, "learning_rate": 3.808115449488499e-05, "epoch": 0.32469416240181725, "percentage": 32.47, "elapsed_time": "2 days, 6:39:40", "remaining_time": "4 days, 17:40:18", "throughput": 2723.63, "total_tokens": 535956512} {"current_steps": 2967, "total_steps": 9134, "loss": 0.7067, "learning_rate": 3.8073826133781026e-05, "epoch": 0.3248036344727551, "percentage": 32.48, "elapsed_time": "2 days, 6:40:41", "remaining_time": "4 days, 17:39:01", "throughput": 2723.52, "total_tokens": 536103008} {"current_steps": 2968, "total_steps": 9134, "loss": 0.6918, "learning_rate": 3.8066496226068426e-05, "epoch": 0.32491310654369304, "percentage": 32.49, "elapsed_time": "2 days, 6:41:49", "remaining_time": "4 days, 17:37:58", "throughput": 2723.55, "total_tokens": 536293856} {"current_steps": 2969, "total_steps": 9134, "loss": 0.7358, "learning_rate": 3.8059164772614304e-05, "epoch": 0.32502257861463096, "percentage": 32.5, "elapsed_time": "2 days, 6:42:56", "remaining_time": "4 days, 17:36:54", "throughput": 2723.56, "total_tokens": 536477984} {"current_steps": 2970, "total_steps": 9134, "loss": 0.7322, "learning_rate": 3.805183177428595e-05, "epoch": 0.32513205068556883, "percentage": 32.52, "elapsed_time": "2 days, 6:44:04", "remaining_time": "4 days, 17:35:49", "throughput": 2723.49, "total_tokens": 536648224} {"current_steps": 2971, "total_steps": 9134, "loss": 0.5611, "learning_rate": 3.8044497231950855e-05, "epoch": 0.32524152275650675, "percentage": 32.53, "elapsed_time": "2 days, 6:45:11", "remaining_time": "4 days, 17:34:45", "throughput": 2723.48, "total_tokens": 536829440} {"current_steps": 2972, "total_steps": 9134, "loss": 0.6641, "learning_rate": 3.803716114647667e-05, "epoch": 0.3253509948274447, "percentage": 32.54, "elapsed_time": "2 days, 6:46:15", "remaining_time": "4 days, 17:33:34", "throughput": 2723.5, "total_tokens": 537007520} {"current_steps": 2973, "total_steps": 9134, "loss": 0.7223, "learning_rate": 3.8029823518731247e-05, "epoch": 0.32546046689838254, "percentage": 32.55, "elapsed_time": "2 days, 6:47:23", "remaining_time": "4 days, 17:32:30", "throughput": 2723.53, "total_tokens": 537198816} {"current_steps": 2974, "total_steps": 9134, "loss": 0.6333, "learning_rate": 3.802248434958261e-05, "epoch": 0.32556993896932046, "percentage": 32.56, "elapsed_time": "2 days, 6:48:26", "remaining_time": "4 days, 17:31:16", "throughput": 2723.51, "total_tokens": 537365248} {"current_steps": 2975, "total_steps": 9134, "loss": 0.6795, "learning_rate": 3.801514363989897e-05, "epoch": 0.3256794110402583, "percentage": 32.57, "elapsed_time": "2 days, 6:49:29", "remaining_time": "4 days, 17:30:03", "throughput": 2723.52, "total_tokens": 537539296} {"current_steps": 2976, "total_steps": 9134, "loss": 0.5947, "learning_rate": 3.8007801390548706e-05, "epoch": 0.32578888311119625, "percentage": 32.58, "elapsed_time": "2 days, 6:50:35", "remaining_time": "4 days, 17:28:57", "throughput": 2723.5, "total_tokens": 537716480} {"current_steps": 2977, "total_steps": 9134, "loss": 0.6689, "learning_rate": 3.800045760240042e-05, "epoch": 0.32589835518213417, "percentage": 32.59, "elapsed_time": "2 days, 6:51:40", "remaining_time": "4 days, 17:27:48", "throughput": 2723.48, "total_tokens": 537888512} {"current_steps": 2978, "total_steps": 9134, "loss": 0.6666, "learning_rate": 3.799311227632284e-05, "epoch": 0.32600782725307204, "percentage": 32.6, "elapsed_time": "2 days, 6:52:48", "remaining_time": "4 days, 17:26:44", "throughput": 2723.52, "total_tokens": 538080928} {"current_steps": 2979, "total_steps": 9134, "loss": 0.7422, "learning_rate": 3.7985765413184924e-05, "epoch": 0.32611729932400996, "percentage": 32.61, "elapsed_time": "2 days, 6:53:50", "remaining_time": "4 days, 17:25:30", "throughput": 2723.47, "total_tokens": 538241536} {"current_steps": 2980, "total_steps": 9134, "loss": 0.6312, "learning_rate": 3.797841701385578e-05, "epoch": 0.3262267713949479, "percentage": 32.63, "elapsed_time": "2 days, 6:54:57", "remaining_time": "4 days, 17:24:24", "throughput": 2723.47, "total_tokens": 538422976} {"current_steps": 2981, "total_steps": 9134, "loss": 0.7662, "learning_rate": 3.7971067079204726e-05, "epoch": 0.32633624346588574, "percentage": 32.64, "elapsed_time": "2 days, 6:56:01", "remaining_time": "4 days, 17:23:13", "throughput": 2723.43, "total_tokens": 538588288} {"current_steps": 2982, "total_steps": 9134, "loss": 0.7762, "learning_rate": 3.7963715610101215e-05, "epoch": 0.32644571553682367, "percentage": 32.65, "elapsed_time": "2 days, 6:57:08", "remaining_time": "4 days, 17:22:09", "throughput": 2723.5, "total_tokens": 538786752} {"current_steps": 2983, "total_steps": 9134, "loss": 1.0204, "learning_rate": 3.795636260741494e-05, "epoch": 0.3265551876077616, "percentage": 32.66, "elapsed_time": "2 days, 6:58:17", "remaining_time": "4 days, 17:21:07", "throughput": 2723.4, "total_tokens": 538953632} {"current_steps": 2984, "total_steps": 9134, "loss": 0.7219, "learning_rate": 3.794900807201574e-05, "epoch": 0.32666465967869945, "percentage": 32.67, "elapsed_time": "2 days, 6:59:23", "remaining_time": "4 days, 17:20:01", "throughput": 2723.36, "total_tokens": 539126112} {"current_steps": 2985, "total_steps": 9134, "loss": 0.4956, "learning_rate": 3.794165200477363e-05, "epoch": 0.3267741317496374, "percentage": 32.68, "elapsed_time": "2 days, 7:00:26", "remaining_time": "4 days, 17:18:47", "throughput": 2723.24, "total_tokens": 539273504} {"current_steps": 2986, "total_steps": 9134, "loss": 0.7768, "learning_rate": 3.793429440655884e-05, "epoch": 0.3268836038205753, "percentage": 32.69, "elapsed_time": "2 days, 7:01:33", "remaining_time": "4 days, 17:17:42", "throughput": 2723.35, "total_tokens": 539477120} {"current_steps": 2987, "total_steps": 9134, "loss": 0.7814, "learning_rate": 3.792693527824174e-05, "epoch": 0.32699307589151316, "percentage": 32.7, "elapsed_time": "2 days, 7:02:34", "remaining_time": "4 days, 17:16:26", "throughput": 2723.38, "total_tokens": 539651616} {"current_steps": 2988, "total_steps": 9134, "loss": 0.7395, "learning_rate": 3.791957462069291e-05, "epoch": 0.3271025479624511, "percentage": 32.71, "elapsed_time": "2 days, 7:03:37", "remaining_time": "4 days, 17:15:12", "throughput": 2723.29, "total_tokens": 539804160} {"current_steps": 2989, "total_steps": 9134, "loss": 0.5808, "learning_rate": 3.7912212434783095e-05, "epoch": 0.327212020033389, "percentage": 32.72, "elapsed_time": "2 days, 7:04:43", "remaining_time": "4 days, 17:14:05", "throughput": 2723.27, "total_tokens": 539979776} {"current_steps": 2990, "total_steps": 9134, "loss": 0.6056, "learning_rate": 3.7904848721383234e-05, "epoch": 0.32732149210432687, "percentage": 32.73, "elapsed_time": "2 days, 7:05:46", "remaining_time": "4 days, 17:12:52", "throughput": 2723.16, "total_tokens": 540129184} {"current_steps": 2991, "total_steps": 9134, "loss": 0.7609, "learning_rate": 3.789748348136444e-05, "epoch": 0.3274309641752648, "percentage": 32.75, "elapsed_time": "2 days, 7:06:55", "remaining_time": "4 days, 17:11:51", "throughput": 2723.27, "total_tokens": 540339072} {"current_steps": 2992, "total_steps": 9134, "loss": 0.5684, "learning_rate": 3.7890116715598013e-05, "epoch": 0.3275404362462027, "percentage": 32.76, "elapsed_time": "2 days, 7:08:02", "remaining_time": "4 days, 17:10:46", "throughput": 2723.39, "total_tokens": 540545376} {"current_steps": 2993, "total_steps": 9134, "loss": 0.9684, "learning_rate": 3.7882748424955414e-05, "epoch": 0.3276499083171406, "percentage": 32.77, "elapsed_time": "2 days, 7:09:11", "remaining_time": "4 days, 17:09:46", "throughput": 2723.44, "total_tokens": 540744736} {"current_steps": 2994, "total_steps": 9134, "loss": 0.7161, "learning_rate": 3.7875378610308306e-05, "epoch": 0.3277593803880785, "percentage": 32.78, "elapsed_time": "2 days, 7:10:16", "remaining_time": "4 days, 17:08:36", "throughput": 2723.49, "total_tokens": 540930208} {"current_steps": 2995, "total_steps": 9134, "loss": 0.8304, "learning_rate": 3.7868007272528524e-05, "epoch": 0.32786885245901637, "percentage": 32.79, "elapsed_time": "2 days, 7:11:19", "remaining_time": "4 days, 17:07:22", "throughput": 2723.39, "total_tokens": 541080960} {"current_steps": 2996, "total_steps": 9134, "loss": 0.6485, "learning_rate": 3.786063441248808e-05, "epoch": 0.3279783245299543, "percentage": 32.8, "elapsed_time": "2 days, 7:12:24", "remaining_time": "4 days, 17:06:14", "throughput": 2723.45, "total_tokens": 541271136} {"current_steps": 2997, "total_steps": 9134, "loss": 0.8814, "learning_rate": 3.785326003105916e-05, "epoch": 0.3280877966008922, "percentage": 32.81, "elapsed_time": "2 days, 7:13:29", "remaining_time": "4 days, 17:05:06", "throughput": 2723.34, "total_tokens": 541427488} {"current_steps": 2998, "total_steps": 9134, "loss": 0.5283, "learning_rate": 3.784588412911416e-05, "epoch": 0.3281972686718301, "percentage": 32.82, "elapsed_time": "2 days, 7:14:37", "remaining_time": "4 days, 17:04:02", "throughput": 2723.37, "total_tokens": 541617888} {"current_steps": 2999, "total_steps": 9134, "loss": 0.6947, "learning_rate": 3.783850670752563e-05, "epoch": 0.328306740742768, "percentage": 32.83, "elapsed_time": "2 days, 7:15:45", "remaining_time": "4 days, 17:02:58", "throughput": 2723.44, "total_tokens": 541816352} {"current_steps": 3000, "total_steps": 9134, "loss": 0.821, "learning_rate": 3.783112776716629e-05, "epoch": 0.3284162128137059, "percentage": 32.84, "elapsed_time": "2 days, 7:16:52", "remaining_time": "4 days, 17:01:53", "throughput": 2723.42, "total_tokens": 541993760} {"current_steps": 3001, "total_steps": 9134, "loss": 1.0811, "learning_rate": 3.782374730890908e-05, "epoch": 0.3285256848846438, "percentage": 32.86, "elapsed_time": "2 days, 7:17:58", "remaining_time": "4 days, 17:00:46", "throughput": 2723.42, "total_tokens": 542173632} {"current_steps": 3002, "total_steps": 9134, "loss": 0.7887, "learning_rate": 3.781636533362706e-05, "epoch": 0.3286351569555817, "percentage": 32.87, "elapsed_time": "2 days, 7:19:06", "remaining_time": "4 days, 16:59:43", "throughput": 2723.49, "total_tokens": 542372320} {"current_steps": 3003, "total_steps": 9134, "loss": 0.7109, "learning_rate": 3.780898184219352e-05, "epoch": 0.32874462902651963, "percentage": 32.88, "elapsed_time": "2 days, 7:20:08", "remaining_time": "4 days, 16:58:28", "throughput": 2723.39, "total_tokens": 542521728} {"current_steps": 3004, "total_steps": 9134, "loss": 0.904, "learning_rate": 3.780159683548192e-05, "epoch": 0.3288541010974575, "percentage": 32.89, "elapsed_time": "2 days, 7:21:15", "remaining_time": "4 days, 16:57:24", "throughput": 2723.36, "total_tokens": 542699584} {"current_steps": 3005, "total_steps": 9134, "loss": 0.8152, "learning_rate": 3.779421031436588e-05, "epoch": 0.3289635731683954, "percentage": 32.9, "elapsed_time": "2 days, 7:22:23", "remaining_time": "4 days, 16:56:22", "throughput": 2723.45, "total_tokens": 542902752} {"current_steps": 3006, "total_steps": 9134, "loss": 0.5504, "learning_rate": 3.7786822279719237e-05, "epoch": 0.32907304523933334, "percentage": 32.91, "elapsed_time": "2 days, 7:23:30", "remaining_time": "4 days, 16:55:15", "throughput": 2723.47, "total_tokens": 543088224} {"current_steps": 3007, "total_steps": 9134, "loss": 0.7772, "learning_rate": 3.777943273241595e-05, "epoch": 0.3291825173102712, "percentage": 32.92, "elapsed_time": "2 days, 7:24:36", "remaining_time": "4 days, 16:54:09", "throughput": 2723.41, "total_tokens": 543258016} {"current_steps": 3008, "total_steps": 9134, "loss": 0.6468, "learning_rate": 3.77720416733302e-05, "epoch": 0.3292919893812091, "percentage": 32.93, "elapsed_time": "2 days, 7:25:40", "remaining_time": "4 days, 16:52:58", "throughput": 2723.39, "total_tokens": 543426912} {"current_steps": 3009, "total_steps": 9134, "loss": 0.5287, "learning_rate": 3.776464910333635e-05, "epoch": 0.32940146145214705, "percentage": 32.94, "elapsed_time": "2 days, 7:26:46", "remaining_time": "4 days, 16:51:51", "throughput": 2723.44, "total_tokens": 543617312} {"current_steps": 3010, "total_steps": 9134, "loss": 0.6494, "learning_rate": 3.77572550233089e-05, "epoch": 0.3295109335230849, "percentage": 32.95, "elapsed_time": "2 days, 7:27:52", "remaining_time": "4 days, 16:50:44", "throughput": 2723.51, "total_tokens": 543810848} {"current_steps": 3011, "total_steps": 9134, "loss": 0.6514, "learning_rate": 3.774985943412257e-05, "epoch": 0.32962040559402284, "percentage": 32.96, "elapsed_time": "2 days, 7:28:58", "remaining_time": "4 days, 16:49:36", "throughput": 2723.5, "total_tokens": 543986912} {"current_steps": 3012, "total_steps": 9134, "loss": 0.9398, "learning_rate": 3.774246233665224e-05, "epoch": 0.3297298776649607, "percentage": 32.98, "elapsed_time": "2 days, 7:30:06", "remaining_time": "4 days, 16:48:34", "throughput": 2723.58, "total_tokens": 544188960} {"current_steps": 3013, "total_steps": 9134, "loss": 0.5982, "learning_rate": 3.773506373177298e-05, "epoch": 0.3298393497358986, "percentage": 32.99, "elapsed_time": "2 days, 7:31:11", "remaining_time": "4 days, 16:47:24", "throughput": 2723.63, "total_tokens": 544376896} {"current_steps": 3014, "total_steps": 9134, "loss": 0.5543, "learning_rate": 3.7727663620360026e-05, "epoch": 0.32994882180683655, "percentage": 33.0, "elapsed_time": "2 days, 7:32:16", "remaining_time": "4 days, 16:46:16", "throughput": 2723.62, "total_tokens": 544550944} {"current_steps": 3015, "total_steps": 9134, "loss": 0.5163, "learning_rate": 3.772026200328879e-05, "epoch": 0.3300582938777744, "percentage": 33.01, "elapsed_time": "2 days, 7:33:24", "remaining_time": "4 days, 16:45:12", "throughput": 2723.6, "total_tokens": 544731936} {"current_steps": 3016, "total_steps": 9134, "loss": 0.7702, "learning_rate": 3.771285888143489e-05, "epoch": 0.33016776594871233, "percentage": 33.02, "elapsed_time": "2 days, 7:34:32", "remaining_time": "4 days, 16:44:09", "throughput": 2723.6, "total_tokens": 544918080} {"current_steps": 3017, "total_steps": 9134, "loss": 0.5687, "learning_rate": 3.7705454255674064e-05, "epoch": 0.33027723801965025, "percentage": 33.03, "elapsed_time": "2 days, 7:35:34", "remaining_time": "4 days, 16:42:54", "throughput": 2723.54, "total_tokens": 545073984} {"current_steps": 3018, "total_steps": 9134, "loss": 0.8614, "learning_rate": 3.769804812688231e-05, "epoch": 0.3303867100905881, "percentage": 33.04, "elapsed_time": "2 days, 7:36:39", "remaining_time": "4 days, 16:41:45", "throughput": 2723.51, "total_tokens": 545245120} {"current_steps": 3019, "total_steps": 9134, "loss": 0.748, "learning_rate": 3.769064049593573e-05, "epoch": 0.33049618216152604, "percentage": 33.05, "elapsed_time": "2 days, 7:37:45", "remaining_time": "4 days, 16:40:37", "throughput": 2723.48, "total_tokens": 545417600} {"current_steps": 3020, "total_steps": 9134, "loss": 0.6956, "learning_rate": 3.768323136371064e-05, "epoch": 0.33060565423246396, "percentage": 33.06, "elapsed_time": "2 days, 7:38:45", "remaining_time": "4 days, 16:39:20", "throughput": 2723.41, "total_tokens": 545569024} {"current_steps": 3021, "total_steps": 9134, "loss": 0.6547, "learning_rate": 3.7675820731083526e-05, "epoch": 0.33071512630340183, "percentage": 33.07, "elapsed_time": "2 days, 7:39:49", "remaining_time": "4 days, 16:38:08", "throughput": 2723.45, "total_tokens": 545751360} {"current_steps": 3022, "total_steps": 9134, "loss": 0.8081, "learning_rate": 3.766840859893105e-05, "epoch": 0.33082459837433975, "percentage": 33.09, "elapsed_time": "2 days, 7:40:57", "remaining_time": "4 days, 16:37:05", "throughput": 2723.4, "total_tokens": 545925184} {"current_steps": 3023, "total_steps": 9134, "loss": 0.6221, "learning_rate": 3.766099496813006e-05, "epoch": 0.3309340704452777, "percentage": 33.1, "elapsed_time": "2 days, 7:41:59", "remaining_time": "4 days, 16:35:50", "throughput": 2723.27, "total_tokens": 546068544} {"current_steps": 3024, "total_steps": 9134, "loss": 0.5686, "learning_rate": 3.765357983955756e-05, "epoch": 0.33104354251621554, "percentage": 33.11, "elapsed_time": "2 days, 7:43:04", "remaining_time": "4 days, 16:34:40", "throughput": 2723.24, "total_tokens": 546239680} {"current_steps": 3025, "total_steps": 9134, "loss": 0.6519, "learning_rate": 3.764616321409076e-05, "epoch": 0.33115301458715346, "percentage": 33.12, "elapsed_time": "2 days, 7:44:11", "remaining_time": "4 days, 16:33:37", "throughput": 2723.2, "total_tokens": 546415072} {"current_steps": 3026, "total_steps": 9134, "loss": 0.7772, "learning_rate": 3.763874509260702e-05, "epoch": 0.3312624866580914, "percentage": 33.13, "elapsed_time": "2 days, 7:45:19", "remaining_time": "4 days, 16:32:33", "throughput": 2723.29, "total_tokens": 546616672} {"current_steps": 3027, "total_steps": 9134, "loss": 0.6952, "learning_rate": 3.7631325475983905e-05, "epoch": 0.33137195872902925, "percentage": 33.14, "elapsed_time": "2 days, 7:46:25", "remaining_time": "4 days, 16:31:26", "throughput": 2723.29, "total_tokens": 546797664} {"current_steps": 3028, "total_steps": 9134, "loss": 0.7839, "learning_rate": 3.7623904365099134e-05, "epoch": 0.33148143079996717, "percentage": 33.15, "elapsed_time": "2 days, 7:47:34", "remaining_time": "4 days, 16:30:26", "throughput": 2723.31, "total_tokens": 546989632} {"current_steps": 3029, "total_steps": 9134, "loss": 0.8631, "learning_rate": 3.761648176083061e-05, "epoch": 0.33159090287090504, "percentage": 33.16, "elapsed_time": "2 days, 7:48:41", "remaining_time": "4 days, 16:29:20", "throughput": 2723.36, "total_tokens": 547180032} {"current_steps": 3030, "total_steps": 9134, "loss": 0.6256, "learning_rate": 3.76090576640564e-05, "epoch": 0.33170037494184296, "percentage": 33.17, "elapsed_time": "2 days, 7:49:48", "remaining_time": "4 days, 16:28:16", "throughput": 2723.35, "total_tokens": 547363712} {"current_steps": 3031, "total_steps": 9134, "loss": 0.7486, "learning_rate": 3.7601632075654784e-05, "epoch": 0.3318098470127809, "percentage": 33.18, "elapsed_time": "2 days, 7:50:51", "remaining_time": "4 days, 16:27:03", "throughput": 2723.32, "total_tokens": 547529248} {"current_steps": 3032, "total_steps": 9134, "loss": 0.6361, "learning_rate": 3.759420499650419e-05, "epoch": 0.33191931908371874, "percentage": 33.19, "elapsed_time": "2 days, 7:51:55", "remaining_time": "4 days, 16:25:51", "throughput": 2723.27, "total_tokens": 547691872} {"current_steps": 3033, "total_steps": 9134, "loss": 0.7569, "learning_rate": 3.758677642748321e-05, "epoch": 0.33202879115465667, "percentage": 33.21, "elapsed_time": "2 days, 7:53:03", "remaining_time": "4 days, 16:24:48", "throughput": 2723.44, "total_tokens": 547911392} {"current_steps": 3034, "total_steps": 9134, "loss": 0.6862, "learning_rate": 3.757934636947064e-05, "epoch": 0.3321382632255946, "percentage": 33.22, "elapsed_time": "2 days, 7:54:09", "remaining_time": "4 days, 16:23:40", "throughput": 2723.37, "total_tokens": 548075808} {"current_steps": 3035, "total_steps": 9134, "loss": 0.7132, "learning_rate": 3.7571914823345444e-05, "epoch": 0.33224773529653245, "percentage": 33.23, "elapsed_time": "2 days, 7:55:14", "remaining_time": "4 days, 16:22:32", "throughput": 2723.35, "total_tokens": 548250080} {"current_steps": 3036, "total_steps": 9134, "loss": 0.701, "learning_rate": 3.756448178998676e-05, "epoch": 0.3323572073674704, "percentage": 33.24, "elapsed_time": "2 days, 7:56:23", "remaining_time": "4 days, 16:21:31", "throughput": 2723.47, "total_tokens": 548462432} {"current_steps": 3037, "total_steps": 9134, "loss": 0.6908, "learning_rate": 3.755704727027389e-05, "epoch": 0.3324666794384083, "percentage": 33.25, "elapsed_time": "2 days, 7:57:27", "remaining_time": "4 days, 16:20:20", "throughput": 2723.45, "total_tokens": 548632000} {"current_steps": 3038, "total_steps": 9134, "loss": 0.5264, "learning_rate": 3.754961126508634e-05, "epoch": 0.33257615150934616, "percentage": 33.26, "elapsed_time": "2 days, 7:58:31", "remaining_time": "4 days, 16:19:09", "throughput": 2723.34, "total_tokens": 548783648} {"current_steps": 3039, "total_steps": 9134, "loss": 0.5652, "learning_rate": 3.754217377530377e-05, "epoch": 0.3326856235802841, "percentage": 33.27, "elapsed_time": "2 days, 7:59:39", "remaining_time": "4 days, 16:18:05", "throughput": 2723.42, "total_tokens": 548983680} {"current_steps": 3040, "total_steps": 9134, "loss": 0.701, "learning_rate": 3.753473480180603e-05, "epoch": 0.332795095651222, "percentage": 33.28, "elapsed_time": "2 days, 8:00:42", "remaining_time": "4 days, 16:16:52", "throughput": 2723.4, "total_tokens": 549152576} {"current_steps": 3041, "total_steps": 9134, "loss": 0.6705, "learning_rate": 3.752729434547311e-05, "epoch": 0.33290456772215987, "percentage": 33.29, "elapsed_time": "2 days, 8:01:49", "remaining_time": "4 days, 16:15:48", "throughput": 2723.48, "total_tokens": 549351040} {"current_steps": 3042, "total_steps": 9134, "loss": 0.6188, "learning_rate": 3.751985240718522e-05, "epoch": 0.3330140397930978, "percentage": 33.3, "elapsed_time": "2 days, 8:02:49", "remaining_time": "4 days, 16:14:29", "throughput": 2723.37, "total_tokens": 549493728} {"current_steps": 3043, "total_steps": 9134, "loss": 0.8571, "learning_rate": 3.7512408987822724e-05, "epoch": 0.3331235118640357, "percentage": 33.32, "elapsed_time": "2 days, 8:03:58", "remaining_time": "4 days, 16:13:29", "throughput": 2723.44, "total_tokens": 549695552} {"current_steps": 3044, "total_steps": 9134, "loss": 0.6649, "learning_rate": 3.750496408826616e-05, "epoch": 0.3332329839349736, "percentage": 33.33, "elapsed_time": "2 days, 8:05:07", "remaining_time": "4 days, 16:12:26", "throughput": 2723.42, "total_tokens": 549878560} {"current_steps": 3045, "total_steps": 9134, "loss": 0.6378, "learning_rate": 3.749751770939626e-05, "epoch": 0.3333424560059115, "percentage": 33.34, "elapsed_time": "2 days, 8:06:12", "remaining_time": "4 days, 16:11:19", "throughput": 2723.35, "total_tokens": 550043200} {"current_steps": 3046, "total_steps": 9134, "loss": 0.7189, "learning_rate": 3.74900698520939e-05, "epoch": 0.33345192807684937, "percentage": 33.35, "elapsed_time": "2 days, 8:07:22", "remaining_time": "4 days, 16:10:19", "throughput": 2723.46, "total_tokens": 550253536} {"current_steps": 3047, "total_steps": 9134, "loss": 0.5551, "learning_rate": 3.7482620517240155e-05, "epoch": 0.3335614001477873, "percentage": 33.36, "elapsed_time": "2 days, 8:08:29", "remaining_time": "4 days, 16:09:15", "throughput": 2723.46, "total_tokens": 550438336} {"current_steps": 3048, "total_steps": 9134, "loss": 0.8268, "learning_rate": 3.747516970571626e-05, "epoch": 0.3336708722187252, "percentage": 33.37, "elapsed_time": "2 days, 8:09:37", "remaining_time": "4 days, 16:08:11", "throughput": 2723.4, "total_tokens": 550610368} {"current_steps": 3049, "total_steps": 9134, "loss": 0.5868, "learning_rate": 3.746771741840365e-05, "epoch": 0.3337803442896631, "percentage": 33.38, "elapsed_time": "2 days, 8:10:38", "remaining_time": "4 days, 16:06:55", "throughput": 2723.35, "total_tokens": 550766944} {"current_steps": 3050, "total_steps": 9134, "loss": 0.6358, "learning_rate": 3.746026365618389e-05, "epoch": 0.333889816360601, "percentage": 33.39, "elapsed_time": "2 days, 8:11:41", "remaining_time": "4 days, 16:05:42", "throughput": 2723.38, "total_tokens": 550944128} {"current_steps": 3051, "total_steps": 9134, "loss": 0.7253, "learning_rate": 3.745280841993876e-05, "epoch": 0.3339992884315389, "percentage": 33.4, "elapsed_time": "2 days, 8:12:47", "remaining_time": "4 days, 16:04:35", "throughput": 2723.35, "total_tokens": 551118624} {"current_steps": 3052, "total_steps": 9134, "loss": 0.6385, "learning_rate": 3.744535171055021e-05, "epoch": 0.3341087605024768, "percentage": 33.41, "elapsed_time": "2 days, 8:13:53", "remaining_time": "4 days, 16:03:27", "throughput": 2723.37, "total_tokens": 551301856} {"current_steps": 3053, "total_steps": 9134, "loss": 0.7595, "learning_rate": 3.743789352890034e-05, "epoch": 0.3342182325734147, "percentage": 33.42, "elapsed_time": "2 days, 8:14:58", "remaining_time": "4 days, 16:02:17", "throughput": 2723.33, "total_tokens": 551468736} {"current_steps": 3054, "total_steps": 9134, "loss": 0.8359, "learning_rate": 3.743043387587144e-05, "epoch": 0.33432770464435263, "percentage": 33.44, "elapsed_time": "2 days, 8:16:06", "remaining_time": "4 days, 16:01:15", "throughput": 2723.27, "total_tokens": 551643456} {"current_steps": 3055, "total_steps": 9134, "loss": 0.6378, "learning_rate": 3.742297275234598e-05, "epoch": 0.3344371767152905, "percentage": 33.45, "elapsed_time": "2 days, 8:17:11", "remaining_time": "4 days, 16:00:06", "throughput": 2723.25, "total_tokens": 551815712} {"current_steps": 3056, "total_steps": 9134, "loss": 0.6353, "learning_rate": 3.7415510159206593e-05, "epoch": 0.3345466487862284, "percentage": 33.46, "elapsed_time": "2 days, 8:18:16", "remaining_time": "4 days, 15:58:57", "throughput": 2723.21, "total_tokens": 551983936} {"current_steps": 3057, "total_steps": 9134, "loss": 0.6878, "learning_rate": 3.740804609733608e-05, "epoch": 0.33465612085716634, "percentage": 33.47, "elapsed_time": "2 days, 8:19:23", "remaining_time": "4 days, 15:57:52", "throughput": 2723.26, "total_tokens": 552176800} {"current_steps": 3058, "total_steps": 9134, "loss": 0.7228, "learning_rate": 3.740058056761743e-05, "epoch": 0.3347655929281042, "percentage": 33.48, "elapsed_time": "2 days, 8:20:27", "remaining_time": "4 days, 15:56:42", "throughput": 2723.23, "total_tokens": 552345696} {"current_steps": 3059, "total_steps": 9134, "loss": 0.5975, "learning_rate": 3.739311357093382e-05, "epoch": 0.3348750649990421, "percentage": 33.49, "elapsed_time": "2 days, 8:21:35", "remaining_time": "4 days, 15:55:39", "throughput": 2723.23, "total_tokens": 552532960} {"current_steps": 3060, "total_steps": 9134, "loss": 0.8951, "learning_rate": 3.738564510816856e-05, "epoch": 0.33498453706998005, "percentage": 33.5, "elapsed_time": "2 days, 8:22:41", "remaining_time": "4 days, 15:54:31", "throughput": 2723.19, "total_tokens": 552701632} {"current_steps": 3061, "total_steps": 9134, "loss": 0.7841, "learning_rate": 3.737817518020516e-05, "epoch": 0.3350940091409179, "percentage": 33.51, "elapsed_time": "2 days, 8:23:47", "remaining_time": "4 days, 15:53:25", "throughput": 2723.24, "total_tokens": 552892480} {"current_steps": 3062, "total_steps": 9134, "loss": 0.642, "learning_rate": 3.73707037879273e-05, "epoch": 0.33520348121185584, "percentage": 33.52, "elapsed_time": "2 days, 8:24:53", "remaining_time": "4 days, 15:52:17", "throughput": 2723.21, "total_tokens": 553065856} {"current_steps": 3063, "total_steps": 9134, "loss": 0.9782, "learning_rate": 3.736323093221884e-05, "epoch": 0.3353129532827937, "percentage": 33.53, "elapsed_time": "2 days, 8:26:01", "remaining_time": "4 days, 15:51:14", "throughput": 2723.21, "total_tokens": 553250656} {"current_steps": 3064, "total_steps": 9134, "loss": 0.6574, "learning_rate": 3.735575661396378e-05, "epoch": 0.3354224253537316, "percentage": 33.54, "elapsed_time": "2 days, 8:27:06", "remaining_time": "4 days, 15:50:06", "throughput": 2723.17, "total_tokens": 553420000} {"current_steps": 3065, "total_steps": 9134, "loss": 0.7347, "learning_rate": 3.7348280834046334e-05, "epoch": 0.33553189742466955, "percentage": 33.56, "elapsed_time": "2 days, 8:28:13", "remaining_time": "4 days, 15:49:00", "throughput": 2723.23, "total_tokens": 553614656} {"current_steps": 3066, "total_steps": 9134, "loss": 0.838, "learning_rate": 3.7340803593350884e-05, "epoch": 0.3356413694956074, "percentage": 33.57, "elapsed_time": "2 days, 8:29:21", "remaining_time": "4 days, 15:47:57", "throughput": 2723.32, "total_tokens": 553818048} {"current_steps": 3067, "total_steps": 9134, "loss": 0.81, "learning_rate": 3.733332489276195e-05, "epoch": 0.33575084156654533, "percentage": 33.58, "elapsed_time": "2 days, 8:30:25", "remaining_time": "4 days, 15:46:47", "throughput": 2723.31, "total_tokens": 553992096} {"current_steps": 3068, "total_steps": 9134, "loss": 0.7872, "learning_rate": 3.7325844733164256e-05, "epoch": 0.33586031363748325, "percentage": 33.59, "elapsed_time": "2 days, 8:31:34", "remaining_time": "4 days, 15:45:47", "throughput": 2723.33, "total_tokens": 554184288} {"current_steps": 3069, "total_steps": 9134, "loss": 0.6419, "learning_rate": 3.73183631154427e-05, "epoch": 0.3359697857084211, "percentage": 33.6, "elapsed_time": "2 days, 8:32:43", "remaining_time": "4 days, 15:44:45", "throughput": 2723.45, "total_tokens": 554396192} {"current_steps": 3070, "total_steps": 9134, "loss": 0.7937, "learning_rate": 3.7310880040482335e-05, "epoch": 0.33607925777935904, "percentage": 33.61, "elapsed_time": "2 days, 8:33:51", "remaining_time": "4 days, 15:43:42", "throughput": 2723.55, "total_tokens": 554600704} {"current_steps": 3071, "total_steps": 9134, "loss": 0.7986, "learning_rate": 3.730339550916839e-05, "epoch": 0.33618872985029696, "percentage": 33.62, "elapsed_time": "2 days, 8:34:59", "remaining_time": "4 days, 15:42:38", "throughput": 2723.64, "total_tokens": 554803648} {"current_steps": 3072, "total_steps": 9134, "loss": 0.6929, "learning_rate": 3.729590952238628e-05, "epoch": 0.33629820192123483, "percentage": 33.63, "elapsed_time": "2 days, 8:36:06", "remaining_time": "4 days, 15:41:33", "throughput": 2723.66, "total_tokens": 554989792} {"current_steps": 3073, "total_steps": 9134, "loss": 0.7243, "learning_rate": 3.728842208102158e-05, "epoch": 0.33640767399217275, "percentage": 33.64, "elapsed_time": "2 days, 8:37:12", "remaining_time": "4 days, 15:40:25", "throughput": 2723.7, "total_tokens": 555178176} {"current_steps": 3074, "total_steps": 9134, "loss": 0.5647, "learning_rate": 3.728093318596004e-05, "epoch": 0.3365171460631107, "percentage": 33.65, "elapsed_time": "2 days, 8:38:19", "remaining_time": "4 days, 15:39:21", "throughput": 2723.75, "total_tokens": 555370368} {"current_steps": 3075, "total_steps": 9134, "loss": 0.7666, "learning_rate": 3.7273442838087584e-05, "epoch": 0.33662661813404854, "percentage": 33.67, "elapsed_time": "2 days, 8:39:24", "remaining_time": "4 days, 15:38:12", "throughput": 2723.66, "total_tokens": 555529632} {"current_steps": 3076, "total_steps": 9134, "loss": 0.6633, "learning_rate": 3.7265951038290305e-05, "epoch": 0.33673609020498646, "percentage": 33.68, "elapsed_time": "2 days, 8:40:24", "remaining_time": "4 days, 15:36:54", "throughput": 2723.54, "total_tokens": 555668288} {"current_steps": 3077, "total_steps": 9134, "loss": 0.6464, "learning_rate": 3.725845778745446e-05, "epoch": 0.3368455622759244, "percentage": 33.69, "elapsed_time": "2 days, 8:41:33", "remaining_time": "4 days, 15:35:53", "throughput": 2723.73, "total_tokens": 555896096} {"current_steps": 3078, "total_steps": 9134, "loss": 0.5667, "learning_rate": 3.725096308646649e-05, "epoch": 0.33695503434686225, "percentage": 33.7, "elapsed_time": "2 days, 8:42:40", "remaining_time": "4 days, 15:34:47", "throughput": 2723.77, "total_tokens": 556085152} {"current_steps": 3079, "total_steps": 9134, "loss": 0.7083, "learning_rate": 3.724346693621301e-05, "epoch": 0.33706450641780017, "percentage": 33.71, "elapsed_time": "2 days, 8:43:43", "remaining_time": "4 days, 15:33:36", "throughput": 2723.75, "total_tokens": 556254944} {"current_steps": 3080, "total_steps": 9134, "loss": 0.804, "learning_rate": 3.72359693375808e-05, "epoch": 0.33717397848873804, "percentage": 33.72, "elapsed_time": "2 days, 8:44:49", "remaining_time": "4 days, 15:32:29", "throughput": 2723.72, "total_tokens": 556428992} {"current_steps": 3081, "total_steps": 9134, "loss": 0.6773, "learning_rate": 3.722847029145681e-05, "epoch": 0.33728345055967596, "percentage": 33.73, "elapsed_time": "2 days, 8:45:56", "remaining_time": "4 days, 15:31:23", "throughput": 2723.68, "total_tokens": 556602144} {"current_steps": 3082, "total_steps": 9134, "loss": 0.7295, "learning_rate": 3.722096979872815e-05, "epoch": 0.3373929226306139, "percentage": 33.74, "elapsed_time": "2 days, 8:47:01", "remaining_time": "4 days, 15:30:13", "throughput": 2723.65, "total_tokens": 556771264} {"current_steps": 3083, "total_steps": 9134, "loss": 0.9204, "learning_rate": 3.7213467860282144e-05, "epoch": 0.33750239470155174, "percentage": 33.75, "elapsed_time": "2 days, 8:48:06", "remaining_time": "4 days, 15:29:05", "throughput": 2723.71, "total_tokens": 556961664} {"current_steps": 3084, "total_steps": 9134, "loss": 0.6539, "learning_rate": 3.720596447700623e-05, "epoch": 0.33761186677248967, "percentage": 33.76, "elapsed_time": "2 days, 8:49:12", "remaining_time": "4 days, 15:27:58", "throughput": 2723.64, "total_tokens": 557126528} {"current_steps": 3085, "total_steps": 9134, "loss": 0.6929, "learning_rate": 3.7198459649788045e-05, "epoch": 0.3377213388434276, "percentage": 33.77, "elapsed_time": "2 days, 8:50:16", "remaining_time": "4 days, 15:26:47", "throughput": 2723.66, "total_tokens": 557306624} {"current_steps": 3086, "total_steps": 9134, "loss": 0.7993, "learning_rate": 3.7190953379515404e-05, "epoch": 0.33783081091436545, "percentage": 33.79, "elapsed_time": "2 days, 8:51:26", "remaining_time": "4 days, 15:25:47", "throughput": 2723.78, "total_tokens": 557520320} {"current_steps": 3087, "total_steps": 9134, "loss": 0.7108, "learning_rate": 3.718344566707629e-05, "epoch": 0.3379402829853034, "percentage": 33.8, "elapsed_time": "2 days, 8:52:31", "remaining_time": "4 days, 15:24:40", "throughput": 2723.81, "total_tokens": 557704896} {"current_steps": 3088, "total_steps": 9134, "loss": 0.6535, "learning_rate": 3.717593651335884e-05, "epoch": 0.3380497550562413, "percentage": 33.81, "elapsed_time": "2 days, 8:53:35", "remaining_time": "4 days, 15:23:29", "throughput": 2723.76, "total_tokens": 557868864} {"current_steps": 3089, "total_steps": 9134, "loss": 0.6744, "learning_rate": 3.716842591925138e-05, "epoch": 0.33815922712717916, "percentage": 33.82, "elapsed_time": "2 days, 8:54:40", "remaining_time": "4 days, 15:22:19", "throughput": 2723.74, "total_tokens": 558042016} {"current_steps": 3090, "total_steps": 9134, "loss": 0.6626, "learning_rate": 3.71609138856424e-05, "epoch": 0.3382686991981171, "percentage": 33.83, "elapsed_time": "2 days, 8:55:40", "remaining_time": "4 days, 15:21:01", "throughput": 2723.67, "total_tokens": 558191648} {"current_steps": 3091, "total_steps": 9134, "loss": 0.737, "learning_rate": 3.715340041342055e-05, "epoch": 0.338378171269055, "percentage": 33.84, "elapsed_time": "2 days, 8:56:47", "remaining_time": "4 days, 15:19:56", "throughput": 2723.7, "total_tokens": 558379584} {"current_steps": 3092, "total_steps": 9134, "loss": 0.7874, "learning_rate": 3.7145885503474654e-05, "epoch": 0.33848764333999287, "percentage": 33.85, "elapsed_time": "2 days, 8:57:53", "remaining_time": "4 days, 15:18:49", "throughput": 2723.65, "total_tokens": 558549152} {"current_steps": 3093, "total_steps": 9134, "loss": 0.6163, "learning_rate": 3.713836915669373e-05, "epoch": 0.3385971154109308, "percentage": 33.86, "elapsed_time": "2 days, 8:58:55", "remaining_time": "4 days, 15:17:34", "throughput": 2723.66, "total_tokens": 558719168} {"current_steps": 3094, "total_steps": 9134, "loss": 0.8031, "learning_rate": 3.713085137396694e-05, "epoch": 0.3387065874818687, "percentage": 33.87, "elapsed_time": "2 days, 9:00:00", "remaining_time": "4 days, 15:16:25", "throughput": 2723.64, "total_tokens": 558892096} {"current_steps": 3095, "total_steps": 9134, "loss": 0.9104, "learning_rate": 3.712333215618363e-05, "epoch": 0.3388160595528066, "percentage": 33.88, "elapsed_time": "2 days, 9:01:09", "remaining_time": "4 days, 15:15:23", "throughput": 2723.64, "total_tokens": 559080704} {"current_steps": 3096, "total_steps": 9134, "loss": 0.6035, "learning_rate": 3.71158115042333e-05, "epoch": 0.3389255316237445, "percentage": 33.9, "elapsed_time": "2 days, 9:02:13", "remaining_time": "4 days, 15:14:12", "throughput": 2723.59, "total_tokens": 559244224} {"current_steps": 3097, "total_steps": 9134, "loss": 0.7184, "learning_rate": 3.7108289419005625e-05, "epoch": 0.33903500369468237, "percentage": 33.91, "elapsed_time": "2 days, 9:03:21", "remaining_time": "4 days, 15:13:11", "throughput": 2723.59, "total_tokens": 559429472} {"current_steps": 3098, "total_steps": 9134, "loss": 0.8382, "learning_rate": 3.710076590139045e-05, "epoch": 0.3391444757656203, "percentage": 33.92, "elapsed_time": "2 days, 9:04:26", "remaining_time": "4 days, 15:12:00", "throughput": 2723.67, "total_tokens": 559622784} {"current_steps": 3099, "total_steps": 9134, "loss": 0.8304, "learning_rate": 3.7093240952277816e-05, "epoch": 0.3392539478365582, "percentage": 33.93, "elapsed_time": "2 days, 9:05:35", "remaining_time": "4 days, 15:10:59", "throughput": 2723.64, "total_tokens": 559803104} {"current_steps": 3100, "total_steps": 9134, "loss": 0.7293, "learning_rate": 3.708571457255789e-05, "epoch": 0.3393634199074961, "percentage": 33.94, "elapsed_time": "2 days, 9:06:44", "remaining_time": "4 days, 15:09:58", "throughput": 2723.62, "total_tokens": 559989024} {"current_steps": 3101, "total_steps": 9134, "loss": 0.8897, "learning_rate": 3.7078186763121034e-05, "epoch": 0.339472891978434, "percentage": 33.95, "elapsed_time": "2 days, 9:07:50", "remaining_time": "4 days, 15:08:52", "throughput": 2723.6, "total_tokens": 560163072} {"current_steps": 3102, "total_steps": 9134, "loss": 0.523, "learning_rate": 3.7070657524857786e-05, "epoch": 0.3395823640493719, "percentage": 33.96, "elapsed_time": "2 days, 9:08:54", "remaining_time": "4 days, 15:07:41", "throughput": 2723.54, "total_tokens": 560325920} {"current_steps": 3103, "total_steps": 9134, "loss": 0.7425, "learning_rate": 3.706312685865881e-05, "epoch": 0.3396918361203098, "percentage": 33.97, "elapsed_time": "2 days, 9:10:03", "remaining_time": "4 days, 15:06:40", "throughput": 2723.59, "total_tokens": 560524832} {"current_steps": 3104, "total_steps": 9134, "loss": 0.7011, "learning_rate": 3.7055594765415e-05, "epoch": 0.3398013081912477, "percentage": 33.98, "elapsed_time": "2 days, 9:11:07", "remaining_time": "4 days, 15:05:30", "throughput": 2723.6, "total_tokens": 560701344} {"current_steps": 3105, "total_steps": 9134, "loss": 0.6051, "learning_rate": 3.704806124601736e-05, "epoch": 0.33991078026218563, "percentage": 33.99, "elapsed_time": "2 days, 9:12:08", "remaining_time": "4 days, 15:04:12", "throughput": 2723.52, "total_tokens": 560850976} {"current_steps": 3106, "total_steps": 9134, "loss": 0.6006, "learning_rate": 3.704052630135713e-05, "epoch": 0.3400202523331235, "percentage": 34.0, "elapsed_time": "2 days, 9:13:15", "remaining_time": "4 days, 15:03:08", "throughput": 2723.55, "total_tokens": 561039808} {"current_steps": 3107, "total_steps": 9134, "loss": 0.5989, "learning_rate": 3.7032989932325634e-05, "epoch": 0.3401297244040614, "percentage": 34.02, "elapsed_time": "2 days, 9:14:16", "remaining_time": "4 days, 15:01:50", "throughput": 2723.47, "total_tokens": 561188320} {"current_steps": 3108, "total_steps": 9134, "loss": 0.7302, "learning_rate": 3.7025452139814445e-05, "epoch": 0.34023919647499934, "percentage": 34.03, "elapsed_time": "2 days, 9:15:20", "remaining_time": "4 days, 15:00:40", "throughput": 2723.42, "total_tokens": 561352288} {"current_steps": 3109, "total_steps": 9134, "loss": 0.92, "learning_rate": 3.7017912924715257e-05, "epoch": 0.3403486685459372, "percentage": 34.04, "elapsed_time": "2 days, 9:16:29", "remaining_time": "4 days, 14:59:39", "throughput": 2723.45, "total_tokens": 561546496} {"current_steps": 3110, "total_steps": 9134, "loss": 0.6253, "learning_rate": 3.701037228791993e-05, "epoch": 0.3404581406168751, "percentage": 34.05, "elapsed_time": "2 days, 9:17:36", "remaining_time": "4 days, 14:58:34", "throughput": 2723.45, "total_tokens": 561729280} {"current_steps": 3111, "total_steps": 9134, "loss": 0.6745, "learning_rate": 3.7002830230320537e-05, "epoch": 0.34056761268781305, "percentage": 34.06, "elapsed_time": "2 days, 9:18:43", "remaining_time": "4 days, 14:57:30", "throughput": 2723.44, "total_tokens": 561910496} {"current_steps": 3112, "total_steps": 9134, "loss": 0.9247, "learning_rate": 3.699528675280926e-05, "epoch": 0.3406770847587509, "percentage": 34.07, "elapsed_time": "2 days, 9:19:49", "remaining_time": "4 days, 14:56:21", "throughput": 2723.41, "total_tokens": 562082080} {"current_steps": 3113, "total_steps": 9134, "loss": 0.6365, "learning_rate": 3.69877418562785e-05, "epoch": 0.34078655682968884, "percentage": 34.08, "elapsed_time": "2 days, 9:20:58", "remaining_time": "4 days, 14:55:20", "throughput": 2723.47, "total_tokens": 562282560} {"current_steps": 3114, "total_steps": 9134, "loss": 0.8286, "learning_rate": 3.69801955416208e-05, "epoch": 0.3408960289006267, "percentage": 34.09, "elapsed_time": "2 days, 9:22:07", "remaining_time": "4 days, 14:54:19", "throughput": 2723.5, "total_tokens": 562476768} {"current_steps": 3115, "total_steps": 9134, "loss": 0.7051, "learning_rate": 3.697264780972886e-05, "epoch": 0.3410055009715646, "percentage": 34.1, "elapsed_time": "2 days, 9:23:13", "remaining_time": "4 days, 14:53:12", "throughput": 2723.55, "total_tokens": 562667840} {"current_steps": 3116, "total_steps": 9134, "loss": 0.7157, "learning_rate": 3.696509866149558e-05, "epoch": 0.34111497304250255, "percentage": 34.11, "elapsed_time": "2 days, 9:24:21", "remaining_time": "4 days, 14:52:09", "throughput": 2723.49, "total_tokens": 562840544} {"current_steps": 3117, "total_steps": 9134, "loss": 0.8251, "learning_rate": 3.6957548097814e-05, "epoch": 0.3412244451134404, "percentage": 34.13, "elapsed_time": "2 days, 9:25:28", "remaining_time": "4 days, 14:51:04", "throughput": 2723.52, "total_tokens": 563028928} {"current_steps": 3118, "total_steps": 9134, "loss": 0.7393, "learning_rate": 3.6949996119577335e-05, "epoch": 0.34133391718437833, "percentage": 34.14, "elapsed_time": "2 days, 9:26:33", "remaining_time": "4 days, 14:49:56", "throughput": 2723.51, "total_tokens": 563203424} {"current_steps": 3119, "total_steps": 9134, "loss": 0.4825, "learning_rate": 3.694244272767897e-05, "epoch": 0.34144338925531625, "percentage": 34.15, "elapsed_time": "2 days, 9:27:39", "remaining_time": "4 days, 14:48:49", "throughput": 2723.52, "total_tokens": 563385088} {"current_steps": 3120, "total_steps": 9134, "loss": 0.7199, "learning_rate": 3.693488792301247e-05, "epoch": 0.3415528613262541, "percentage": 34.16, "elapsed_time": "2 days, 9:28:46", "remaining_time": "4 days, 14:47:43", "throughput": 2723.5, "total_tokens": 563563392} {"current_steps": 3121, "total_steps": 9134, "loss": 0.6731, "learning_rate": 3.6927331706471536e-05, "epoch": 0.34166233339719204, "percentage": 34.17, "elapsed_time": "2 days, 9:29:52", "remaining_time": "4 days, 14:46:37", "throughput": 2723.51, "total_tokens": 563747072} {"current_steps": 3122, "total_steps": 9134, "loss": 0.9561, "learning_rate": 3.6919774078950065e-05, "epoch": 0.34177180546812996, "percentage": 34.18, "elapsed_time": "2 days, 9:30:56", "remaining_time": "4 days, 14:45:26", "throughput": 2723.58, "total_tokens": 563935232} {"current_steps": 3123, "total_steps": 9134, "loss": 0.7495, "learning_rate": 3.691221504134211e-05, "epoch": 0.34188127753906783, "percentage": 34.19, "elapsed_time": "2 days, 9:32:03", "remaining_time": "4 days, 14:44:21", "throughput": 2723.52, "total_tokens": 564103680} {"current_steps": 3124, "total_steps": 9134, "loss": 0.5662, "learning_rate": 3.6904654594541885e-05, "epoch": 0.34199074961000575, "percentage": 34.2, "elapsed_time": "2 days, 9:33:08", "remaining_time": "4 days, 14:43:11", "throughput": 2723.51, "total_tokens": 564279072} {"current_steps": 3125, "total_steps": 9134, "loss": 0.9131, "learning_rate": 3.689709273944378e-05, "epoch": 0.3421002216809437, "percentage": 34.21, "elapsed_time": "2 days, 9:34:15", "remaining_time": "4 days, 14:42:07", "throughput": 2723.63, "total_tokens": 564487616} {"current_steps": 3126, "total_steps": 9134, "loss": 0.664, "learning_rate": 3.6889529476942344e-05, "epoch": 0.34220969375188154, "percentage": 34.22, "elapsed_time": "2 days, 9:35:20", "remaining_time": "4 days, 14:40:58", "throughput": 2723.58, "total_tokens": 564654944} {"current_steps": 3127, "total_steps": 9134, "loss": 0.7431, "learning_rate": 3.6881964807932306e-05, "epoch": 0.34231916582281946, "percentage": 34.23, "elapsed_time": "2 days, 9:36:29", "remaining_time": "4 days, 14:39:57", "throughput": 2723.73, "total_tokens": 564873344} {"current_steps": 3128, "total_steps": 9134, "loss": 0.7563, "learning_rate": 3.6874398733308544e-05, "epoch": 0.3424286378937574, "percentage": 34.25, "elapsed_time": "2 days, 9:37:37", "remaining_time": "4 days, 14:38:53", "throughput": 2723.8, "total_tokens": 565071584} {"current_steps": 3129, "total_steps": 9134, "loss": 0.739, "learning_rate": 3.686683125396611e-05, "epoch": 0.34253810996469525, "percentage": 34.26, "elapsed_time": "2 days, 9:38:35", "remaining_time": "4 days, 14:37:31", "throughput": 2723.68, "total_tokens": 565204640} {"current_steps": 3130, "total_steps": 9134, "loss": 0.779, "learning_rate": 3.685926237080023e-05, "epoch": 0.34264758203563317, "percentage": 34.27, "elapsed_time": "2 days, 9:39:43", "remaining_time": "4 days, 14:36:28", "throughput": 2723.77, "total_tokens": 565410048} {"current_steps": 3131, "total_steps": 9134, "loss": 0.6577, "learning_rate": 3.6851692084706266e-05, "epoch": 0.34275705410657104, "percentage": 34.28, "elapsed_time": "2 days, 9:40:47", "remaining_time": "4 days, 14:35:17", "throughput": 2723.72, "total_tokens": 565572448} {"current_steps": 3132, "total_steps": 9134, "loss": 0.6851, "learning_rate": 3.68441203965798e-05, "epoch": 0.34286652617750896, "percentage": 34.29, "elapsed_time": "2 days, 9:41:51", "remaining_time": "4 days, 14:34:07", "throughput": 2723.66, "total_tokens": 565735072} {"current_steps": 3133, "total_steps": 9134, "loss": 0.5406, "learning_rate": 3.6836547307316524e-05, "epoch": 0.3429759982484469, "percentage": 34.3, "elapsed_time": "2 days, 9:42:58", "remaining_time": "4 days, 14:33:03", "throughput": 2723.76, "total_tokens": 565940032} {"current_steps": 3134, "total_steps": 9134, "loss": 0.6749, "learning_rate": 3.682897281781234e-05, "epoch": 0.34308547031938474, "percentage": 34.31, "elapsed_time": "2 days, 9:44:00", "remaining_time": "4 days, 14:31:47", "throughput": 2723.72, "total_tokens": 566097280} {"current_steps": 3135, "total_steps": 9134, "loss": 0.6863, "learning_rate": 3.682139692896328e-05, "epoch": 0.34319494239032267, "percentage": 34.32, "elapsed_time": "2 days, 9:45:04", "remaining_time": "4 days, 14:30:37", "throughput": 2723.66, "total_tokens": 566263040} {"current_steps": 3136, "total_steps": 9134, "loss": 0.7361, "learning_rate": 3.681381964166556e-05, "epoch": 0.3433044144612606, "percentage": 34.33, "elapsed_time": "2 days, 9:46:07", "remaining_time": "4 days, 14:29:25", "throughput": 2723.63, "total_tokens": 566426784} {"current_steps": 3137, "total_steps": 9134, "loss": 0.605, "learning_rate": 3.680624095681557e-05, "epoch": 0.34341388653219845, "percentage": 34.34, "elapsed_time": "2 days, 9:47:08", "remaining_time": "4 days, 14:28:08", "throughput": 2723.48, "total_tokens": 566561856} {"current_steps": 3138, "total_steps": 9134, "loss": 0.6285, "learning_rate": 3.6798660875309836e-05, "epoch": 0.3435233586031364, "percentage": 34.36, "elapsed_time": "2 days, 9:48:10", "remaining_time": "4 days, 14:26:52", "throughput": 2723.44, "total_tokens": 566719776} {"current_steps": 3139, "total_steps": 9134, "loss": 0.5439, "learning_rate": 3.679107939804507e-05, "epoch": 0.3436328306740743, "percentage": 34.37, "elapsed_time": "2 days, 9:49:14", "remaining_time": "4 days, 14:25:42", "throughput": 2723.39, "total_tokens": 566885984} {"current_steps": 3140, "total_steps": 9134, "loss": 0.4707, "learning_rate": 3.678349652591816e-05, "epoch": 0.34374230274501216, "percentage": 34.38, "elapsed_time": "2 days, 9:50:20", "remaining_time": "4 days, 14:24:36", "throughput": 2723.38, "total_tokens": 567065632} {"current_steps": 3141, "total_steps": 9134, "loss": 0.7488, "learning_rate": 3.677591225982614e-05, "epoch": 0.3438517748159501, "percentage": 34.39, "elapsed_time": "2 days, 9:51:26", "remaining_time": "4 days, 14:23:28", "throughput": 2723.41, "total_tokens": 567249536} {"current_steps": 3142, "total_steps": 9134, "loss": 0.7251, "learning_rate": 3.67683266006662e-05, "epoch": 0.343961246886888, "percentage": 34.4, "elapsed_time": "2 days, 9:52:33", "remaining_time": "4 days, 14:22:24", "throughput": 2723.51, "total_tokens": 567454272} {"current_steps": 3143, "total_steps": 9134, "loss": 0.6472, "learning_rate": 3.676073954933573e-05, "epoch": 0.34407071895782587, "percentage": 34.41, "elapsed_time": "2 days, 9:53:39", "remaining_time": "4 days, 14:21:17", "throughput": 2723.55, "total_tokens": 567641312} {"current_steps": 3144, "total_steps": 9134, "loss": 0.7084, "learning_rate": 3.6753151106732255e-05, "epoch": 0.3441801910287638, "percentage": 34.42, "elapsed_time": "2 days, 9:54:47", "remaining_time": "4 days, 14:20:14", "throughput": 2723.51, "total_tokens": 567819168} {"current_steps": 3145, "total_steps": 9134, "loss": 0.6171, "learning_rate": 3.674556127375347e-05, "epoch": 0.3442896630997017, "percentage": 34.43, "elapsed_time": "2 days, 9:55:54", "remaining_time": "4 days, 14:19:08", "throughput": 2723.52, "total_tokens": 568002400} {"current_steps": 3146, "total_steps": 9134, "loss": 0.8196, "learning_rate": 3.6737970051297234e-05, "epoch": 0.3443991351706396, "percentage": 34.44, "elapsed_time": "2 days, 9:57:02", "remaining_time": "4 days, 14:18:05", "throughput": 2723.61, "total_tokens": 568205792} {"current_steps": 3147, "total_steps": 9134, "loss": 0.7456, "learning_rate": 3.673037744026159e-05, "epoch": 0.3445086072415775, "percentage": 34.45, "elapsed_time": "2 days, 9:58:09", "remaining_time": "4 days, 14:17:00", "throughput": 2723.67, "total_tokens": 568401120} {"current_steps": 3148, "total_steps": 9134, "loss": 0.5945, "learning_rate": 3.672278344154471e-05, "epoch": 0.34461807931251537, "percentage": 34.46, "elapsed_time": "2 days, 9:59:12", "remaining_time": "4 days, 14:15:48", "throughput": 2723.6, "total_tokens": 568557696} {"current_steps": 3149, "total_steps": 9134, "loss": 0.7462, "learning_rate": 3.671518805604496e-05, "epoch": 0.3447275513834533, "percentage": 34.48, "elapsed_time": "2 days, 10:00:19", "remaining_time": "4 days, 14:14:43", "throughput": 2723.58, "total_tokens": 568737792} {"current_steps": 3150, "total_steps": 9134, "loss": 0.7897, "learning_rate": 3.670759128466087e-05, "epoch": 0.3448370234543912, "percentage": 34.49, "elapsed_time": "2 days, 10:01:29", "remaining_time": "4 days, 14:13:43", "throughput": 2723.65, "total_tokens": 568940960} {"current_steps": 3151, "total_steps": 9134, "loss": 0.4074, "learning_rate": 3.669999312829111e-05, "epoch": 0.3449464955253291, "percentage": 34.5, "elapsed_time": "2 days, 10:02:36", "remaining_time": "4 days, 14:12:38", "throughput": 2723.6, "total_tokens": 569113888} {"current_steps": 3152, "total_steps": 9134, "loss": 0.7551, "learning_rate": 3.669239358783452e-05, "epoch": 0.345055967596267, "percentage": 34.51, "elapsed_time": "2 days, 10:03:42", "remaining_time": "4 days, 14:11:31", "throughput": 2723.57, "total_tokens": 569288160} {"current_steps": 3153, "total_steps": 9134, "loss": 0.5305, "learning_rate": 3.668479266419012e-05, "epoch": 0.3451654396672049, "percentage": 34.52, "elapsed_time": "2 days, 10:04:46", "remaining_time": "4 days, 14:10:20", "throughput": 2723.46, "total_tokens": 569438016} {"current_steps": 3154, "total_steps": 9134, "loss": 0.8747, "learning_rate": 3.6677190358257086e-05, "epoch": 0.3452749117381428, "percentage": 34.53, "elapsed_time": "2 days, 10:05:54", "remaining_time": "4 days, 14:09:18", "throughput": 2723.45, "total_tokens": 569623040} {"current_steps": 3155, "total_steps": 9134, "loss": 0.7497, "learning_rate": 3.666958667093476e-05, "epoch": 0.3453843838090807, "percentage": 34.54, "elapsed_time": "2 days, 10:07:00", "remaining_time": "4 days, 14:08:10", "throughput": 2723.5, "total_tokens": 569811424} {"current_steps": 3156, "total_steps": 9134, "loss": 0.5819, "learning_rate": 3.6661981603122645e-05, "epoch": 0.34549385588001863, "percentage": 34.55, "elapsed_time": "2 days, 10:08:07", "remaining_time": "4 days, 14:07:05", "throughput": 2723.46, "total_tokens": 569986368} {"current_steps": 3157, "total_steps": 9134, "loss": 0.6702, "learning_rate": 3.665437515572039e-05, "epoch": 0.3456033279509565, "percentage": 34.56, "elapsed_time": "2 days, 10:09:14", "remaining_time": "4 days, 14:06:00", "throughput": 2723.54, "total_tokens": 570184160} {"current_steps": 3158, "total_steps": 9134, "loss": 0.8348, "learning_rate": 3.664676732962784e-05, "epoch": 0.3457128000218944, "percentage": 34.57, "elapsed_time": "2 days, 10:10:23", "remaining_time": "4 days, 14:04:59", "throughput": 2723.64, "total_tokens": 570394720} {"current_steps": 3159, "total_steps": 9134, "loss": 0.5655, "learning_rate": 3.663915812574497e-05, "epoch": 0.34582227209283234, "percentage": 34.59, "elapsed_time": "2 days, 10:11:27", "remaining_time": "4 days, 14:03:49", "throughput": 2723.65, "total_tokens": 570571008} {"current_steps": 3160, "total_steps": 9134, "loss": 0.6114, "learning_rate": 3.663154754497196e-05, "epoch": 0.3459317441637702, "percentage": 34.6, "elapsed_time": "2 days, 10:12:33", "remaining_time": "4 days, 14:02:41", "throughput": 2723.6, "total_tokens": 570739008} {"current_steps": 3161, "total_steps": 9134, "loss": 0.6208, "learning_rate": 3.66239355882091e-05, "epoch": 0.3460412162347081, "percentage": 34.61, "elapsed_time": "2 days, 10:13:38", "remaining_time": "4 days, 14:01:34", "throughput": 2723.49, "total_tokens": 570895360} {"current_steps": 3162, "total_steps": 9134, "loss": 0.7707, "learning_rate": 3.6616322256356884e-05, "epoch": 0.34615068830564605, "percentage": 34.62, "elapsed_time": "2 days, 10:14:46", "remaining_time": "4 days, 14:00:29", "throughput": 2723.53, "total_tokens": 571085536} {"current_steps": 3163, "total_steps": 9134, "loss": 0.6948, "learning_rate": 3.6608707550315944e-05, "epoch": 0.3462601603765839, "percentage": 34.63, "elapsed_time": "2 days, 10:15:53", "remaining_time": "4 days, 13:59:26", "throughput": 2723.54, "total_tokens": 571273024} {"current_steps": 3164, "total_steps": 9134, "loss": 0.7548, "learning_rate": 3.660109147098711e-05, "epoch": 0.34636963244752184, "percentage": 34.64, "elapsed_time": "2 days, 10:16:57", "remaining_time": "4 days, 13:58:14", "throughput": 2723.53, "total_tokens": 571444160} {"current_steps": 3165, "total_steps": 9134, "loss": 0.7098, "learning_rate": 3.659347401927131e-05, "epoch": 0.3464791045184597, "percentage": 34.65, "elapsed_time": "2 days, 10:18:03", "remaining_time": "4 days, 13:57:07", "throughput": 2723.62, "total_tokens": 571642400} {"current_steps": 3166, "total_steps": 9134, "loss": 0.6282, "learning_rate": 3.6585855196069704e-05, "epoch": 0.3465885765893976, "percentage": 34.66, "elapsed_time": "2 days, 10:19:11", "remaining_time": "4 days, 13:56:04", "throughput": 2723.58, "total_tokens": 571820032} {"current_steps": 3167, "total_steps": 9134, "loss": 0.7717, "learning_rate": 3.657823500228359e-05, "epoch": 0.34669804866033554, "percentage": 34.67, "elapsed_time": "2 days, 10:20:15", "remaining_time": "4 days, 13:54:53", "throughput": 2723.59, "total_tokens": 571995648} {"current_steps": 3168, "total_steps": 9134, "loss": 0.5266, "learning_rate": 3.65706134388144e-05, "epoch": 0.3468075207312734, "percentage": 34.68, "elapsed_time": "2 days, 10:21:18", "remaining_time": "4 days, 13:53:41", "throughput": 2723.5, "total_tokens": 572149536} {"current_steps": 3169, "total_steps": 9134, "loss": 0.6338, "learning_rate": 3.656299050656376e-05, "epoch": 0.34691699280221133, "percentage": 34.69, "elapsed_time": "2 days, 10:22:20", "remaining_time": "4 days, 13:52:27", "throughput": 2723.46, "total_tokens": 572310816} {"current_steps": 3170, "total_steps": 9134, "loss": 0.6667, "learning_rate": 3.655536620643345e-05, "epoch": 0.34702646487314925, "percentage": 34.71, "elapsed_time": "2 days, 10:23:22", "remaining_time": "4 days, 13:51:12", "throughput": 2723.45, "total_tokens": 572476576} {"current_steps": 3171, "total_steps": 9134, "loss": 0.6294, "learning_rate": 3.654774053932541e-05, "epoch": 0.3471359369440871, "percentage": 34.72, "elapsed_time": "2 days, 10:24:27", "remaining_time": "4 days, 13:50:03", "throughput": 2723.49, "total_tokens": 572661376} {"current_steps": 3172, "total_steps": 9134, "loss": 0.8661, "learning_rate": 3.6540113506141734e-05, "epoch": 0.34724540901502504, "percentage": 34.73, "elapsed_time": "2 days, 10:25:32", "remaining_time": "4 days, 13:48:54", "throughput": 2723.47, "total_tokens": 572833184} {"current_steps": 3173, "total_steps": 9134, "loss": 0.7283, "learning_rate": 3.653248510778469e-05, "epoch": 0.34735488108596296, "percentage": 34.74, "elapsed_time": "2 days, 10:26:40", "remaining_time": "4 days, 13:47:51", "throughput": 2723.5, "total_tokens": 573025600} {"current_steps": 3174, "total_steps": 9134, "loss": 0.7794, "learning_rate": 3.652485534515671e-05, "epoch": 0.34746435315690083, "percentage": 34.75, "elapsed_time": "2 days, 10:27:49", "remaining_time": "4 days, 13:46:50", "throughput": 2723.58, "total_tokens": 573230336} {"current_steps": 3175, "total_steps": 9134, "loss": 0.7147, "learning_rate": 3.6517224219160365e-05, "epoch": 0.34757382522783875, "percentage": 34.76, "elapsed_time": "2 days, 10:28:54", "remaining_time": "4 days, 13:45:41", "throughput": 2723.58, "total_tokens": 573406176} {"current_steps": 3176, "total_steps": 9134, "loss": 0.5735, "learning_rate": 3.6509591730698416e-05, "epoch": 0.3476832972987767, "percentage": 34.77, "elapsed_time": "2 days, 10:29:59", "remaining_time": "4 days, 13:44:33", "throughput": 2723.66, "total_tokens": 573601504} {"current_steps": 3177, "total_steps": 9134, "loss": 0.6359, "learning_rate": 3.6501957880673775e-05, "epoch": 0.34779276936971454, "percentage": 34.78, "elapsed_time": "2 days, 10:31:07", "remaining_time": "4 days, 13:43:29", "throughput": 2723.63, "total_tokens": 573781376} {"current_steps": 3178, "total_steps": 9134, "loss": 0.6908, "learning_rate": 3.64943226699895e-05, "epoch": 0.34790224144065246, "percentage": 34.79, "elapsed_time": "2 days, 10:32:13", "remaining_time": "4 days, 13:42:22", "throughput": 2723.65, "total_tokens": 573964160} {"current_steps": 3179, "total_steps": 9134, "loss": 0.7793, "learning_rate": 3.648668609954883e-05, "epoch": 0.3480117135115904, "percentage": 34.8, "elapsed_time": "2 days, 10:33:19", "remaining_time": "4 days, 13:41:16", "throughput": 2723.72, "total_tokens": 574157920} {"current_steps": 3180, "total_steps": 9134, "loss": 0.5795, "learning_rate": 3.647904817025514e-05, "epoch": 0.34812118558252825, "percentage": 34.81, "elapsed_time": "2 days, 10:34:21", "remaining_time": "4 days, 13:40:00", "throughput": 2723.69, "total_tokens": 574319648} {"current_steps": 3181, "total_steps": 9134, "loss": 0.8677, "learning_rate": 3.6471408883012006e-05, "epoch": 0.34823065765346617, "percentage": 34.83, "elapsed_time": "2 days, 10:35:23", "remaining_time": "4 days, 13:38:48", "throughput": 2723.63, "total_tokens": 574479136} {"current_steps": 3182, "total_steps": 9134, "loss": 1.0189, "learning_rate": 3.646376823872313e-05, "epoch": 0.34834012972440404, "percentage": 34.84, "elapsed_time": "2 days, 10:36:32", "remaining_time": "4 days, 13:37:46", "throughput": 2723.78, "total_tokens": 574696864} {"current_steps": 3183, "total_steps": 9134, "loss": 0.6874, "learning_rate": 3.6456126238292394e-05, "epoch": 0.34844960179534196, "percentage": 34.85, "elapsed_time": "2 days, 10:37:38", "remaining_time": "4 days, 13:36:39", "throughput": 2723.76, "total_tokens": 574873824} {"current_steps": 3184, "total_steps": 9134, "loss": 0.8923, "learning_rate": 3.6448482882623814e-05, "epoch": 0.3485590738662799, "percentage": 34.86, "elapsed_time": "2 days, 10:38:44", "remaining_time": "4 days, 13:35:33", "throughput": 2723.89, "total_tokens": 575080576} {"current_steps": 3185, "total_steps": 9134, "loss": 0.7943, "learning_rate": 3.64408381726216e-05, "epoch": 0.34866854593721774, "percentage": 34.87, "elapsed_time": "2 days, 10:39:51", "remaining_time": "4 days, 13:34:26", "throughput": 2723.96, "total_tokens": 575275232} {"current_steps": 3186, "total_steps": 9134, "loss": 0.929, "learning_rate": 3.6433192109190096e-05, "epoch": 0.34877801800815567, "percentage": 34.88, "elapsed_time": "2 days, 10:40:56", "remaining_time": "4 days, 13:33:18", "throughput": 2723.96, "total_tokens": 575455776} {"current_steps": 3187, "total_steps": 9134, "loss": 0.5777, "learning_rate": 3.642554469323382e-05, "epoch": 0.3488874900790936, "percentage": 34.89, "elapsed_time": "2 days, 10:42:00", "remaining_time": "4 days, 13:32:08", "throughput": 2723.91, "total_tokens": 575619296} {"current_steps": 3188, "total_steps": 9134, "loss": 0.7902, "learning_rate": 3.641789592565746e-05, "epoch": 0.34899696215003145, "percentage": 34.9, "elapsed_time": "2 days, 10:43:09", "remaining_time": "4 days, 13:31:06", "throughput": 2723.99, "total_tokens": 575823136} {"current_steps": 3189, "total_steps": 9134, "loss": 0.6671, "learning_rate": 3.641024580736583e-05, "epoch": 0.3491064342209694, "percentage": 34.91, "elapsed_time": "2 days, 10:44:17", "remaining_time": "4 days, 13:30:03", "throughput": 2723.98, "total_tokens": 576006592} {"current_steps": 3190, "total_steps": 9134, "loss": 0.7917, "learning_rate": 3.640259433926394e-05, "epoch": 0.3492159062919073, "percentage": 34.92, "elapsed_time": "2 days, 10:45:23", "remaining_time": "4 days, 13:28:55", "throughput": 2723.86, "total_tokens": 576158464} {"current_steps": 3191, "total_steps": 9134, "loss": 0.9047, "learning_rate": 3.639494152225693e-05, "epoch": 0.34932537836284516, "percentage": 34.94, "elapsed_time": "2 days, 10:46:31", "remaining_time": "4 days, 13:27:53", "throughput": 2723.96, "total_tokens": 576366784} {"current_steps": 3192, "total_steps": 9134, "loss": 0.5282, "learning_rate": 3.638728735725013e-05, "epoch": 0.3494348504337831, "percentage": 34.95, "elapsed_time": "2 days, 10:47:31", "remaining_time": "4 days, 13:26:35", "throughput": 2723.93, "total_tokens": 576524256} {"current_steps": 3193, "total_steps": 9134, "loss": 0.6554, "learning_rate": 3.6379631845148995e-05, "epoch": 0.349544322504721, "percentage": 34.96, "elapsed_time": "2 days, 10:48:37", "remaining_time": "4 days, 13:25:28", "throughput": 2723.95, "total_tokens": 576708832} {"current_steps": 3194, "total_steps": 9134, "loss": 0.4771, "learning_rate": 3.637197498685917e-05, "epoch": 0.34965379457565887, "percentage": 34.97, "elapsed_time": "2 days, 10:49:44", "remaining_time": "4 days, 13:24:22", "throughput": 2723.93, "total_tokens": 576884896} {"current_steps": 3195, "total_steps": 9134, "loss": 0.8125, "learning_rate": 3.636431678328646e-05, "epoch": 0.3497632666465968, "percentage": 34.98, "elapsed_time": "2 days, 10:50:51", "remaining_time": "4 days, 13:23:18", "throughput": 2724.03, "total_tokens": 577090752} {"current_steps": 3196, "total_steps": 9134, "loss": 0.58, "learning_rate": 3.635665723533678e-05, "epoch": 0.3498727387175347, "percentage": 34.99, "elapsed_time": "2 days, 10:51:58", "remaining_time": "4 days, 13:22:13", "throughput": 2723.93, "total_tokens": 577250688} {"current_steps": 3197, "total_steps": 9134, "loss": 0.7901, "learning_rate": 3.634899634391626e-05, "epoch": 0.3499822107884726, "percentage": 35.0, "elapsed_time": "2 days, 10:53:02", "remaining_time": "4 days, 13:21:03", "throughput": 2723.94, "total_tokens": 577427872} {"current_steps": 3198, "total_steps": 9134, "loss": 0.5697, "learning_rate": 3.634133410993117e-05, "epoch": 0.3500916828594105, "percentage": 35.01, "elapsed_time": "2 days, 10:54:03", "remaining_time": "4 days, 13:19:46", "throughput": 2723.84, "total_tokens": 577572128} {"current_steps": 3199, "total_steps": 9134, "loss": 0.6586, "learning_rate": 3.6333670534287945e-05, "epoch": 0.35020115493034837, "percentage": 35.02, "elapsed_time": "2 days, 10:55:07", "remaining_time": "4 days, 13:18:36", "throughput": 2723.83, "total_tokens": 577743936} {"current_steps": 3200, "total_steps": 9134, "loss": 0.6503, "learning_rate": 3.632600561789315e-05, "epoch": 0.3503106270012863, "percentage": 35.03, "elapsed_time": "2 days, 10:56:10", "remaining_time": "4 days, 13:17:23", "throughput": 2723.76, "total_tokens": 577902528} {"current_steps": 3201, "total_steps": 9134, "loss": 0.9012, "learning_rate": 3.6318339361653545e-05, "epoch": 0.3504200990722242, "percentage": 35.04, "elapsed_time": "2 days, 10:57:16", "remaining_time": "4 days, 13:16:17", "throughput": 2723.82, "total_tokens": 578095168} {"current_steps": 3202, "total_steps": 9134, "loss": 0.6675, "learning_rate": 3.631067176647603e-05, "epoch": 0.3505295711431621, "percentage": 35.06, "elapsed_time": "2 days, 10:58:20", "remaining_time": "4 days, 13:15:05", "throughput": 2723.81, "total_tokens": 578265184} {"current_steps": 3203, "total_steps": 9134, "loss": 0.7568, "learning_rate": 3.630300283326768e-05, "epoch": 0.3506390432141, "percentage": 35.07, "elapsed_time": "2 days, 10:59:26", "remaining_time": "4 days, 13:13:59", "throughput": 2723.87, "total_tokens": 578458720} {"current_steps": 3204, "total_steps": 9134, "loss": 0.648, "learning_rate": 3.629533256293569e-05, "epoch": 0.3507485152850379, "percentage": 35.08, "elapsed_time": "2 days, 11:00:34", "remaining_time": "4 days, 13:12:55", "throughput": 2723.9, "total_tokens": 578649344} {"current_steps": 3205, "total_steps": 9134, "loss": 0.5904, "learning_rate": 3.6287660956387454e-05, "epoch": 0.3508579873559758, "percentage": 35.09, "elapsed_time": "2 days, 11:01:37", "remaining_time": "4 days, 13:11:43", "throughput": 2723.82, "total_tokens": 578803008} {"current_steps": 3206, "total_steps": 9134, "loss": 0.736, "learning_rate": 3.62799880145305e-05, "epoch": 0.3509674594269137, "percentage": 35.1, "elapsed_time": "2 days, 11:02:39", "remaining_time": "4 days, 13:10:29", "throughput": 2723.77, "total_tokens": 578962496} {"current_steps": 3207, "total_steps": 9134, "loss": 0.8662, "learning_rate": 3.627231373827253e-05, "epoch": 0.35107693149785163, "percentage": 35.11, "elapsed_time": "2 days, 11:03:46", "remaining_time": "4 days, 13:09:23", "throughput": 2723.82, "total_tokens": 579156256} {"current_steps": 3208, "total_steps": 9134, "loss": 0.5092, "learning_rate": 3.62646381285214e-05, "epoch": 0.3511864035687895, "percentage": 35.12, "elapsed_time": "2 days, 11:04:47", "remaining_time": "4 days, 13:08:08", "throughput": 2723.82, "total_tokens": 579323136} {"current_steps": 3209, "total_steps": 9134, "loss": 0.6725, "learning_rate": 3.6256961186185115e-05, "epoch": 0.3512958756397274, "percentage": 35.13, "elapsed_time": "2 days, 11:05:55", "remaining_time": "4 days, 13:07:05", "throughput": 2723.82, "total_tokens": 579508608} {"current_steps": 3210, "total_steps": 9134, "loss": 0.6277, "learning_rate": 3.624928291217184e-05, "epoch": 0.35140534771066534, "percentage": 35.14, "elapsed_time": "2 days, 11:06:59", "remaining_time": "4 days, 13:05:54", "throughput": 2723.78, "total_tokens": 579673920} {"current_steps": 3211, "total_steps": 9134, "loss": 0.5944, "learning_rate": 3.624160330738989e-05, "epoch": 0.3515148197816032, "percentage": 35.15, "elapsed_time": "2 days, 11:08:02", "remaining_time": "4 days, 13:04:42", "throughput": 2723.81, "total_tokens": 579851104} {"current_steps": 3212, "total_steps": 9134, "loss": 0.6536, "learning_rate": 3.623392237274777e-05, "epoch": 0.3516242918525411, "percentage": 35.17, "elapsed_time": "2 days, 11:09:08", "remaining_time": "4 days, 13:03:34", "throughput": 2723.76, "total_tokens": 580018880} {"current_steps": 3213, "total_steps": 9134, "loss": 0.6492, "learning_rate": 3.6226240109154105e-05, "epoch": 0.35173376392347905, "percentage": 35.18, "elapsed_time": "2 days, 11:10:09", "remaining_time": "4 days, 13:02:20", "throughput": 2723.74, "total_tokens": 580183520} {"current_steps": 3214, "total_steps": 9134, "loss": 0.8064, "learning_rate": 3.6218556517517695e-05, "epoch": 0.3518432359944169, "percentage": 35.19, "elapsed_time": "2 days, 11:11:18", "remaining_time": "4 days, 13:01:17", "throughput": 2723.89, "total_tokens": 580401472} {"current_steps": 3215, "total_steps": 9134, "loss": 0.6504, "learning_rate": 3.6210871598747495e-05, "epoch": 0.35195270806535484, "percentage": 35.2, "elapsed_time": "2 days, 11:12:27", "remaining_time": "4 days, 13:00:16", "throughput": 2723.92, "total_tokens": 580597248} {"current_steps": 3216, "total_steps": 9134, "loss": 0.9963, "learning_rate": 3.620318535375262e-05, "epoch": 0.3520621801362927, "percentage": 35.21, "elapsed_time": "2 days, 11:13:35", "remaining_time": "4 days, 12:59:12", "throughput": 2724.0, "total_tokens": 580798624} {"current_steps": 3217, "total_steps": 9134, "loss": 0.6888, "learning_rate": 3.6195497783442336e-05, "epoch": 0.3521716522072306, "percentage": 35.22, "elapsed_time": "2 days, 11:14:42", "remaining_time": "4 days, 12:58:08", "throughput": 2724.1, "total_tokens": 581004032} {"current_steps": 3218, "total_steps": 9134, "loss": 0.8282, "learning_rate": 3.618780888872606e-05, "epoch": 0.35228112427816854, "percentage": 35.23, "elapsed_time": "2 days, 11:15:49", "remaining_time": "4 days, 12:57:03", "throughput": 2724.05, "total_tokens": 581174048} {"current_steps": 3219, "total_steps": 9134, "loss": 0.69, "learning_rate": 3.618011867051339e-05, "epoch": 0.3523905963491064, "percentage": 35.24, "elapsed_time": "2 days, 11:16:54", "remaining_time": "4 days, 12:55:54", "throughput": 2724.02, "total_tokens": 581343616} {"current_steps": 3220, "total_steps": 9134, "loss": 0.8062, "learning_rate": 3.6172427129714036e-05, "epoch": 0.35250006842004433, "percentage": 35.25, "elapsed_time": "2 days, 11:18:00", "remaining_time": "4 days, 12:54:48", "throughput": 2723.99, "total_tokens": 581519680} {"current_steps": 3221, "total_steps": 9134, "loss": 0.6634, "learning_rate": 3.616473426723792e-05, "epoch": 0.35260954049098225, "percentage": 35.26, "elapsed_time": "2 days, 11:19:06", "remaining_time": "4 days, 12:53:40", "throughput": 2723.9, "total_tokens": 581679168} {"current_steps": 3222, "total_steps": 9134, "loss": 0.8617, "learning_rate": 3.615704008399509e-05, "epoch": 0.3527190125619201, "percentage": 35.27, "elapsed_time": "2 days, 11:20:10", "remaining_time": "4 days, 12:52:30", "throughput": 2723.89, "total_tokens": 581851872} {"current_steps": 3223, "total_steps": 9134, "loss": 0.6769, "learning_rate": 3.614934458089575e-05, "epoch": 0.35282848463285804, "percentage": 35.29, "elapsed_time": "2 days, 11:21:16", "remaining_time": "4 days, 12:51:24", "throughput": 2723.91, "total_tokens": 582036672} {"current_steps": 3224, "total_steps": 9134, "loss": 0.8119, "learning_rate": 3.614164775885025e-05, "epoch": 0.35293795670379596, "percentage": 35.3, "elapsed_time": "2 days, 11:22:25", "remaining_time": "4 days, 12:50:21", "throughput": 2724.01, "total_tokens": 582243424} {"current_steps": 3225, "total_steps": 9134, "loss": 0.5529, "learning_rate": 3.613394961876912e-05, "epoch": 0.35304742877473383, "percentage": 35.31, "elapsed_time": "2 days, 11:23:30", "remaining_time": "4 days, 12:49:13", "throughput": 2723.96, "total_tokens": 582410752} {"current_steps": 3226, "total_steps": 9134, "loss": 0.8328, "learning_rate": 3.612625016156303e-05, "epoch": 0.35315690084567175, "percentage": 35.32, "elapsed_time": "2 days, 11:24:34", "remaining_time": "4 days, 12:48:04", "throughput": 2723.92, "total_tokens": 582577632} {"current_steps": 3227, "total_steps": 9134, "loss": 0.527, "learning_rate": 3.611854938814282e-05, "epoch": 0.35326637291660967, "percentage": 35.33, "elapsed_time": "2 days, 11:25:35", "remaining_time": "4 days, 12:46:48", "throughput": 2723.83, "total_tokens": 582725248} {"current_steps": 3228, "total_steps": 9134, "loss": 0.7511, "learning_rate": 3.6110847299419474e-05, "epoch": 0.35337584498754754, "percentage": 35.34, "elapsed_time": "2 days, 11:26:40", "remaining_time": "4 days, 12:45:39", "throughput": 2723.78, "total_tokens": 582890560} {"current_steps": 3229, "total_steps": 9134, "loss": 0.6117, "learning_rate": 3.6103143896304136e-05, "epoch": 0.35348531705848546, "percentage": 35.35, "elapsed_time": "2 days, 11:27:47", "remaining_time": "4 days, 12:44:32", "throughput": 2723.79, "total_tokens": 583074016} {"current_steps": 3230, "total_steps": 9134, "loss": 0.7153, "learning_rate": 3.6095439179708096e-05, "epoch": 0.3535947891294234, "percentage": 35.36, "elapsed_time": "2 days, 11:28:52", "remaining_time": "4 days, 12:43:24", "throughput": 2723.78, "total_tokens": 583249184} {"current_steps": 3231, "total_steps": 9134, "loss": 0.6756, "learning_rate": 3.6087733150542814e-05, "epoch": 0.35370426120036125, "percentage": 35.37, "elapsed_time": "2 days, 11:29:56", "remaining_time": "4 days, 12:42:14", "throughput": 2723.83, "total_tokens": 583436448} {"current_steps": 3232, "total_steps": 9134, "loss": 0.6668, "learning_rate": 3.6080025809719894e-05, "epoch": 0.35381373327129917, "percentage": 35.38, "elapsed_time": "2 days, 11:31:01", "remaining_time": "4 days, 12:41:05", "throughput": 2723.78, "total_tokens": 583600192} {"current_steps": 3233, "total_steps": 9134, "loss": 0.6171, "learning_rate": 3.607231715815111e-05, "epoch": 0.35392320534223703, "percentage": 35.4, "elapsed_time": "2 days, 11:32:07", "remaining_time": "4 days, 12:39:59", "throughput": 2723.88, "total_tokens": 583804032} {"current_steps": 3234, "total_steps": 9134, "loss": 0.6807, "learning_rate": 3.6064607196748365e-05, "epoch": 0.35403267741317496, "percentage": 35.41, "elapsed_time": "2 days, 11:33:14", "remaining_time": "4 days, 12:38:53", "throughput": 2723.92, "total_tokens": 583993760} {"current_steps": 3235, "total_steps": 9134, "loss": 0.8425, "learning_rate": 3.6056895926423736e-05, "epoch": 0.3541421494841129, "percentage": 35.42, "elapsed_time": "2 days, 11:34:19", "remaining_time": "4 days, 12:37:45", "throughput": 2723.95, "total_tokens": 584178112} {"current_steps": 3236, "total_steps": 9134, "loss": 0.5065, "learning_rate": 3.604918334808947e-05, "epoch": 0.35425162155505074, "percentage": 35.43, "elapsed_time": "2 days, 11:35:22", "remaining_time": "4 days, 12:36:32", "throughput": 2723.95, "total_tokens": 584347456} {"current_steps": 3237, "total_steps": 9134, "loss": 0.7108, "learning_rate": 3.6041469462657926e-05, "epoch": 0.35436109362598867, "percentage": 35.44, "elapsed_time": "2 days, 11:36:26", "remaining_time": "4 days, 12:35:22", "throughput": 2723.94, "total_tokens": 584520160} {"current_steps": 3238, "total_steps": 9134, "loss": 0.5951, "learning_rate": 3.6033754271041654e-05, "epoch": 0.3544705656969266, "percentage": 35.45, "elapsed_time": "2 days, 11:37:30", "remaining_time": "4 days, 12:34:11", "throughput": 2723.89, "total_tokens": 584683008} {"current_steps": 3239, "total_steps": 9134, "loss": 0.8605, "learning_rate": 3.602603777415335e-05, "epoch": 0.35458003776786445, "percentage": 35.46, "elapsed_time": "2 days, 11:38:38", "remaining_time": "4 days, 12:33:08", "throughput": 2723.96, "total_tokens": 584884608} {"current_steps": 3240, "total_steps": 9134, "loss": 0.7763, "learning_rate": 3.601831997290585e-05, "epoch": 0.3546895098388024, "percentage": 35.47, "elapsed_time": "2 days, 11:39:44", "remaining_time": "4 days, 12:32:01", "throughput": 2723.92, "total_tokens": 585055072} {"current_steps": 3241, "total_steps": 9134, "loss": 0.6473, "learning_rate": 3.6010600868212156e-05, "epoch": 0.3547989819097403, "percentage": 35.48, "elapsed_time": "2 days, 11:40:50", "remaining_time": "4 days, 12:30:54", "throughput": 2723.85, "total_tokens": 585220160} {"current_steps": 3242, "total_steps": 9134, "loss": 0.6425, "learning_rate": 3.6002880460985436e-05, "epoch": 0.35490845398067816, "percentage": 35.49, "elapsed_time": "2 days, 11:41:52", "remaining_time": "4 days, 12:29:41", "throughput": 2723.8, "total_tokens": 585380320} {"current_steps": 3243, "total_steps": 9134, "loss": 0.6272, "learning_rate": 3.599515875213899e-05, "epoch": 0.3550179260516161, "percentage": 35.5, "elapsed_time": "2 days, 11:43:01", "remaining_time": "4 days, 12:28:40", "throughput": 2723.82, "total_tokens": 585570944} {"current_steps": 3244, "total_steps": 9134, "loss": 0.6361, "learning_rate": 3.5987435742586286e-05, "epoch": 0.355127398122554, "percentage": 35.52, "elapsed_time": "2 days, 11:44:04", "remaining_time": "4 days, 12:27:28", "throughput": 2723.77, "total_tokens": 585733792} {"current_steps": 3245, "total_steps": 9134, "loss": 0.606, "learning_rate": 3.5979711433240934e-05, "epoch": 0.35523687019349187, "percentage": 35.53, "elapsed_time": "2 days, 11:45:03", "remaining_time": "4 days, 12:26:08", "throughput": 2723.61, "total_tokens": 585858336} {"current_steps": 3246, "total_steps": 9134, "loss": 0.6926, "learning_rate": 3.597198582501671e-05, "epoch": 0.3553463422644298, "percentage": 35.54, "elapsed_time": "2 days, 11:46:12", "remaining_time": "4 days, 12:25:06", "throughput": 2723.74, "total_tokens": 586074272} {"current_steps": 3247, "total_steps": 9134, "loss": 0.65, "learning_rate": 3.596425891882754e-05, "epoch": 0.3554558143353677, "percentage": 35.55, "elapsed_time": "2 days, 11:47:20", "remaining_time": "4 days, 12:24:02", "throughput": 2723.78, "total_tokens": 586266912} {"current_steps": 3248, "total_steps": 9134, "loss": 0.7093, "learning_rate": 3.59565307155875e-05, "epoch": 0.3555652864063056, "percentage": 35.56, "elapsed_time": "2 days, 11:48:24", "remaining_time": "4 days, 12:22:53", "throughput": 2723.77, "total_tokens": 586441632} {"current_steps": 3249, "total_steps": 9134, "loss": 0.7655, "learning_rate": 3.594880121621081e-05, "epoch": 0.3556747584772435, "percentage": 35.57, "elapsed_time": "2 days, 11:49:27", "remaining_time": "4 days, 12:21:40", "throughput": 2723.72, "total_tokens": 586600224} {"current_steps": 3250, "total_steps": 9134, "loss": 0.6586, "learning_rate": 3.5941070421611874e-05, "epoch": 0.35578423054818137, "percentage": 35.58, "elapsed_time": "2 days, 11:50:32", "remaining_time": "4 days, 12:20:32", "throughput": 2723.71, "total_tokens": 586775616} {"current_steps": 3251, "total_steps": 9134, "loss": 0.6395, "learning_rate": 3.5933338332705225e-05, "epoch": 0.3558937026191193, "percentage": 35.59, "elapsed_time": "2 days, 11:51:41", "remaining_time": "4 days, 12:19:30", "throughput": 2723.76, "total_tokens": 586973632} {"current_steps": 3252, "total_steps": 9134, "loss": 0.5088, "learning_rate": 3.592560495040556e-05, "epoch": 0.3560031746900572, "percentage": 35.6, "elapsed_time": "2 days, 11:52:45", "remaining_time": "4 days, 12:18:20", "throughput": 2723.66, "total_tokens": 587128416} {"current_steps": 3253, "total_steps": 9134, "loss": 0.6844, "learning_rate": 3.59178702756277e-05, "epoch": 0.3561126467609951, "percentage": 35.61, "elapsed_time": "2 days, 11:53:51", "remaining_time": "4 days, 12:17:13", "throughput": 2723.66, "total_tokens": 587306496} {"current_steps": 3254, "total_steps": 9134, "loss": 0.746, "learning_rate": 3.591013430928666e-05, "epoch": 0.356222118831933, "percentage": 35.63, "elapsed_time": "2 days, 11:54:53", "remaining_time": "4 days, 12:15:59", "throughput": 2723.65, "total_tokens": 587474048} {"current_steps": 3255, "total_steps": 9134, "loss": 0.5208, "learning_rate": 3.59023970522976e-05, "epoch": 0.3563315909028709, "percentage": 35.64, "elapsed_time": "2 days, 11:55:57", "remaining_time": "4 days, 12:14:49", "throughput": 2723.65, "total_tokens": 587648096} {"current_steps": 3256, "total_steps": 9134, "loss": 0.7146, "learning_rate": 3.5894658505575805e-05, "epoch": 0.3564410629738088, "percentage": 35.65, "elapsed_time": "2 days, 11:57:04", "remaining_time": "4 days, 12:13:43", "throughput": 2723.67, "total_tokens": 587833568} {"current_steps": 3257, "total_steps": 9134, "loss": 0.6186, "learning_rate": 3.588691867003673e-05, "epoch": 0.3565505350447467, "percentage": 35.66, "elapsed_time": "2 days, 11:58:07", "remaining_time": "4 days, 12:12:32", "throughput": 2723.56, "total_tokens": 587983648} {"current_steps": 3258, "total_steps": 9134, "loss": 0.7749, "learning_rate": 3.5879177546595996e-05, "epoch": 0.35666000711568463, "percentage": 35.67, "elapsed_time": "2 days, 11:59:14", "remaining_time": "4 days, 12:11:27", "throughput": 2723.53, "total_tokens": 588159712} {"current_steps": 3259, "total_steps": 9134, "loss": 0.5357, "learning_rate": 3.5871435136169355e-05, "epoch": 0.3567694791866225, "percentage": 35.68, "elapsed_time": "2 days, 12:00:21", "remaining_time": "4 days, 12:10:21", "throughput": 2723.53, "total_tokens": 588341376} {"current_steps": 3260, "total_steps": 9134, "loss": 0.9149, "learning_rate": 3.5863691439672715e-05, "epoch": 0.3568789512575604, "percentage": 35.69, "elapsed_time": "2 days, 12:01:26", "remaining_time": "4 days, 12:09:13", "throughput": 2723.58, "total_tokens": 588528640} {"current_steps": 3261, "total_steps": 9134, "loss": 0.6582, "learning_rate": 3.5855946458022145e-05, "epoch": 0.35698842332849834, "percentage": 35.7, "elapsed_time": "2 days, 12:02:30", "remaining_time": "4 days, 12:08:02", "throughput": 2723.5, "total_tokens": 588685888} {"current_steps": 3262, "total_steps": 9134, "loss": 0.6487, "learning_rate": 3.5848200192133866e-05, "epoch": 0.3570978953994362, "percentage": 35.71, "elapsed_time": "2 days, 12:03:34", "remaining_time": "4 days, 12:06:53", "throughput": 2723.5, "total_tokens": 588860832} {"current_steps": 3263, "total_steps": 9134, "loss": 0.8504, "learning_rate": 3.5840452642924243e-05, "epoch": 0.3572073674703741, "percentage": 35.72, "elapsed_time": "2 days, 12:04:37", "remaining_time": "4 days, 12:05:41", "throughput": 2723.44, "total_tokens": 589020096} {"current_steps": 3264, "total_steps": 9134, "loss": 0.7016, "learning_rate": 3.5832703811309795e-05, "epoch": 0.35731683954131205, "percentage": 35.73, "elapsed_time": "2 days, 12:05:43", "remaining_time": "4 days, 12:04:33", "throughput": 2723.47, "total_tokens": 589203328} {"current_steps": 3265, "total_steps": 9134, "loss": 1.0058, "learning_rate": 3.58249536982072e-05, "epoch": 0.3574263116122499, "percentage": 35.75, "elapsed_time": "2 days, 12:06:51", "remaining_time": "4 days, 12:03:31", "throughput": 2723.43, "total_tokens": 589383424} {"current_steps": 3266, "total_steps": 9134, "loss": 0.8033, "learning_rate": 3.581720230453327e-05, "epoch": 0.35753578368318784, "percentage": 35.76, "elapsed_time": "2 days, 12:07:58", "remaining_time": "4 days, 12:02:25", "throughput": 2723.51, "total_tokens": 589581440} {"current_steps": 3267, "total_steps": 9134, "loss": 0.682, "learning_rate": 3.5809449631204985e-05, "epoch": 0.3576452557541257, "percentage": 35.77, "elapsed_time": "2 days, 12:09:02", "remaining_time": "4 days, 12:01:14", "throughput": 2723.47, "total_tokens": 589745632} {"current_steps": 3268, "total_steps": 9134, "loss": 0.7716, "learning_rate": 3.580169567913947e-05, "epoch": 0.3577547278250636, "percentage": 35.78, "elapsed_time": "2 days, 12:10:06", "remaining_time": "4 days, 12:00:04", "throughput": 2723.47, "total_tokens": 589922368} {"current_steps": 3269, "total_steps": 9134, "loss": 0.6651, "learning_rate": 3.5793940449254016e-05, "epoch": 0.35786419989600154, "percentage": 35.79, "elapsed_time": "2 days, 12:11:07", "remaining_time": "4 days, 11:58:48", "throughput": 2723.35, "total_tokens": 590061696} {"current_steps": 3270, "total_steps": 9134, "loss": 0.6599, "learning_rate": 3.578618394246603e-05, "epoch": 0.3579736719669394, "percentage": 35.8, "elapsed_time": "2 days, 12:12:08", "remaining_time": "4 days, 11:57:33", "throughput": 2723.36, "total_tokens": 590231712} {"current_steps": 3271, "total_steps": 9134, "loss": 0.7798, "learning_rate": 3.577842615969311e-05, "epoch": 0.35808314403787733, "percentage": 35.81, "elapsed_time": "2 days, 12:13:15", "remaining_time": "4 days, 11:56:28", "throughput": 2723.36, "total_tokens": 590412480} {"current_steps": 3272, "total_steps": 9134, "loss": 0.6977, "learning_rate": 3.577066710185298e-05, "epoch": 0.35819261610881525, "percentage": 35.82, "elapsed_time": "2 days, 12:14:20", "remaining_time": "4 days, 11:55:19", "throughput": 2723.27, "total_tokens": 590569952} {"current_steps": 3273, "total_steps": 9134, "loss": 0.6471, "learning_rate": 3.576290676986352e-05, "epoch": 0.3583020881797531, "percentage": 35.83, "elapsed_time": "2 days, 12:15:29", "remaining_time": "4 days, 11:54:18", "throughput": 2723.34, "total_tokens": 590773792} {"current_steps": 3274, "total_steps": 9134, "loss": 0.7674, "learning_rate": 3.575514516464277e-05, "epoch": 0.35841156025069104, "percentage": 35.84, "elapsed_time": "2 days, 12:16:39", "remaining_time": "4 days, 11:53:18", "throughput": 2723.33, "total_tokens": 590960160} {"current_steps": 3275, "total_steps": 9134, "loss": 0.5837, "learning_rate": 3.57473822871089e-05, "epoch": 0.35852103232162896, "percentage": 35.86, "elapsed_time": "2 days, 12:17:47", "remaining_time": "4 days, 11:52:15", "throughput": 2723.4, "total_tokens": 591161088} {"current_steps": 3276, "total_steps": 9134, "loss": 0.708, "learning_rate": 3.5739618138180254e-05, "epoch": 0.35863050439256683, "percentage": 35.87, "elapsed_time": "2 days, 12:18:52", "remaining_time": "4 days, 11:51:06", "throughput": 2723.36, "total_tokens": 591330432} {"current_steps": 3277, "total_steps": 9134, "loss": 0.7754, "learning_rate": 3.573185271877531e-05, "epoch": 0.35873997646350475, "percentage": 35.88, "elapsed_time": "2 days, 12:19:54", "remaining_time": "4 days, 11:49:52", "throughput": 2723.28, "total_tokens": 591480288} {"current_steps": 3278, "total_steps": 9134, "loss": 0.7743, "learning_rate": 3.572408602981271e-05, "epoch": 0.35884944853444267, "percentage": 35.89, "elapsed_time": "2 days, 12:21:03", "remaining_time": "4 days, 11:48:50", "throughput": 2723.42, "total_tokens": 591699360} {"current_steps": 3279, "total_steps": 9134, "loss": 0.6722, "learning_rate": 3.571631807221123e-05, "epoch": 0.35895892060538054, "percentage": 35.9, "elapsed_time": "2 days, 12:22:09", "remaining_time": "4 days, 11:47:44", "throughput": 2723.5, "total_tokens": 591897600} {"current_steps": 3280, "total_steps": 9134, "loss": 0.6769, "learning_rate": 3.570854884688981e-05, "epoch": 0.35906839267631846, "percentage": 35.91, "elapsed_time": "2 days, 12:23:17", "remaining_time": "4 days, 11:46:40", "throughput": 2723.55, "total_tokens": 592092032} {"current_steps": 3281, "total_steps": 9134, "loss": 0.9675, "learning_rate": 3.570077835476753e-05, "epoch": 0.3591778647472564, "percentage": 35.92, "elapsed_time": "2 days, 12:24:24", "remaining_time": "4 days, 11:45:36", "throughput": 2723.6, "total_tokens": 592286688} {"current_steps": 3282, "total_steps": 9134, "loss": 0.6696, "learning_rate": 3.569300659676363e-05, "epoch": 0.35928733681819425, "percentage": 35.93, "elapsed_time": "2 days, 12:25:27", "remaining_time": "4 days, 11:44:24", "throughput": 2723.59, "total_tokens": 592456704} {"current_steps": 3283, "total_steps": 9134, "loss": 0.6586, "learning_rate": 3.568523357379749e-05, "epoch": 0.35939680888913217, "percentage": 35.94, "elapsed_time": "2 days, 12:26:35", "remaining_time": "4 days, 11:43:21", "throughput": 2723.69, "total_tokens": 592663904} {"current_steps": 3284, "total_steps": 9134, "loss": 0.6057, "learning_rate": 3.5677459286788645e-05, "epoch": 0.35950628096007003, "percentage": 35.95, "elapsed_time": "2 days, 12:27:42", "remaining_time": "4 days, 11:42:16", "throughput": 2723.77, "total_tokens": 592863712} {"current_steps": 3285, "total_steps": 9134, "loss": 0.6455, "learning_rate": 3.566968373665678e-05, "epoch": 0.35961575303100796, "percentage": 35.96, "elapsed_time": "2 days, 12:28:51", "remaining_time": "4 days, 11:41:14", "throughput": 2723.9, "total_tokens": 593078528} {"current_steps": 3286, "total_steps": 9134, "loss": 0.7128, "learning_rate": 3.5661906924321723e-05, "epoch": 0.3597252251019459, "percentage": 35.98, "elapsed_time": "2 days, 12:29:57", "remaining_time": "4 days, 11:40:08", "throughput": 2723.8, "total_tokens": 593238688} {"current_steps": 3287, "total_steps": 9134, "loss": 0.5496, "learning_rate": 3.5654128850703464e-05, "epoch": 0.35983469717288374, "percentage": 35.99, "elapsed_time": "2 days, 12:31:05", "remaining_time": "4 days, 11:39:03", "throughput": 2723.86, "total_tokens": 593433568} {"current_steps": 3288, "total_steps": 9134, "loss": 0.5224, "learning_rate": 3.564634951672212e-05, "epoch": 0.35994416924382167, "percentage": 36.0, "elapsed_time": "2 days, 12:32:13", "remaining_time": "4 days, 11:38:01", "throughput": 2723.76, "total_tokens": 593597984} {"current_steps": 3289, "total_steps": 9134, "loss": 0.5969, "learning_rate": 3.5638568923297985e-05, "epoch": 0.3600536413147596, "percentage": 36.01, "elapsed_time": "2 days, 12:33:19", "remaining_time": "4 days, 11:36:55", "throughput": 2723.67, "total_tokens": 593759040} {"current_steps": 3290, "total_steps": 9134, "loss": 0.7618, "learning_rate": 3.563078707135149e-05, "epoch": 0.36016311338569745, "percentage": 36.02, "elapsed_time": "2 days, 12:34:27", "remaining_time": "4 days, 11:35:52", "throughput": 2723.69, "total_tokens": 593949888} {"current_steps": 3291, "total_steps": 9134, "loss": 0.7381, "learning_rate": 3.56230039618032e-05, "epoch": 0.3602725854566354, "percentage": 36.03, "elapsed_time": "2 days, 12:35:35", "remaining_time": "4 days, 11:34:49", "throughput": 2723.71, "total_tokens": 594138496} {"current_steps": 3292, "total_steps": 9134, "loss": 0.524, "learning_rate": 3.561521959557385e-05, "epoch": 0.3603820575275733, "percentage": 36.04, "elapsed_time": "2 days, 12:36:39", "remaining_time": "4 days, 11:33:38", "throughput": 2723.59, "total_tokens": 594287904} {"current_steps": 3293, "total_steps": 9134, "loss": 0.5885, "learning_rate": 3.5607433973584316e-05, "epoch": 0.36049152959851116, "percentage": 36.05, "elapsed_time": "2 days, 12:37:47", "remaining_time": "4 days, 11:32:34", "throughput": 2723.59, "total_tokens": 594470912} {"current_steps": 3294, "total_steps": 9134, "loss": 0.7536, "learning_rate": 3.5599647096755624e-05, "epoch": 0.3606010016694491, "percentage": 36.06, "elapsed_time": "2 days, 12:38:54", "remaining_time": "4 days, 11:31:29", "throughput": 2723.64, "total_tokens": 594664448} {"current_steps": 3295, "total_steps": 9134, "loss": 0.7582, "learning_rate": 3.5591858966008935e-05, "epoch": 0.360710473740387, "percentage": 36.07, "elapsed_time": "2 days, 12:39:58", "remaining_time": "4 days, 11:30:19", "throughput": 2723.6, "total_tokens": 594830208} {"current_steps": 3296, "total_steps": 9134, "loss": 0.7423, "learning_rate": 3.558406958226559e-05, "epoch": 0.36081994581132487, "percentage": 36.08, "elapsed_time": "2 days, 12:40:56", "remaining_time": "4 days, 11:28:57", "throughput": 2723.5, "total_tokens": 594965952} {"current_steps": 3297, "total_steps": 9134, "loss": 0.6987, "learning_rate": 3.5576278946447036e-05, "epoch": 0.3609294178822628, "percentage": 36.1, "elapsed_time": "2 days, 12:42:03", "remaining_time": "4 days, 11:27:53", "throughput": 2723.52, "total_tokens": 595152992} {"current_steps": 3298, "total_steps": 9134, "loss": 0.7194, "learning_rate": 3.556848705947491e-05, "epoch": 0.3610388899532007, "percentage": 36.11, "elapsed_time": "2 days, 12:43:11", "remaining_time": "4 days, 11:26:50", "throughput": 2723.67, "total_tokens": 595372512} {"current_steps": 3299, "total_steps": 9134, "loss": 0.6593, "learning_rate": 3.556069392227096e-05, "epoch": 0.3611483620241386, "percentage": 36.12, "elapsed_time": "2 days, 12:44:17", "remaining_time": "4 days, 11:25:43", "throughput": 2723.63, "total_tokens": 595542752} {"current_steps": 3300, "total_steps": 9134, "loss": 0.5969, "learning_rate": 3.5552899535757115e-05, "epoch": 0.3612578340950765, "percentage": 36.13, "elapsed_time": "2 days, 12:45:26", "remaining_time": "4 days, 11:24:42", "throughput": 2723.63, "total_tokens": 595731360} {"current_steps": 3301, "total_steps": 9134, "loss": 0.5062, "learning_rate": 3.554510390085543e-05, "epoch": 0.36136730616601437, "percentage": 36.14, "elapsed_time": "2 days, 12:46:35", "remaining_time": "4 days, 11:23:40", "throughput": 2723.63, "total_tokens": 595918624} {"current_steps": 3302, "total_steps": 9134, "loss": 0.6638, "learning_rate": 3.5537307018488095e-05, "epoch": 0.3614767782369523, "percentage": 36.15, "elapsed_time": "2 days, 12:47:44", "remaining_time": "4 days, 11:22:38", "throughput": 2723.65, "total_tokens": 596109472} {"current_steps": 3303, "total_steps": 9134, "loss": 0.6893, "learning_rate": 3.55295088895775e-05, "epoch": 0.3615862503078902, "percentage": 36.16, "elapsed_time": "2 days, 12:48:47", "remaining_time": "4 days, 11:21:27", "throughput": 2723.58, "total_tokens": 596267168} {"current_steps": 3304, "total_steps": 9134, "loss": 0.6731, "learning_rate": 3.552170951504613e-05, "epoch": 0.3616957223788281, "percentage": 36.17, "elapsed_time": "2 days, 12:49:53", "remaining_time": "4 days, 11:20:20", "throughput": 2723.47, "total_tokens": 596422400} {"current_steps": 3305, "total_steps": 9134, "loss": 0.6372, "learning_rate": 3.551390889581664e-05, "epoch": 0.361805194449766, "percentage": 36.18, "elapsed_time": "2 days, 12:51:02", "remaining_time": "4 days, 11:19:18", "throughput": 2723.58, "total_tokens": 596632736} {"current_steps": 3306, "total_steps": 9134, "loss": 0.683, "learning_rate": 3.550610703281182e-05, "epoch": 0.3619146665207039, "percentage": 36.19, "elapsed_time": "2 days, 12:52:09", "remaining_time": "4 days, 11:18:14", "throughput": 2723.54, "total_tokens": 596809024} {"current_steps": 3307, "total_steps": 9134, "loss": 0.5589, "learning_rate": 3.5498303926954626e-05, "epoch": 0.3620241385916418, "percentage": 36.21, "elapsed_time": "2 days, 12:53:15", "remaining_time": "4 days, 11:17:07", "throughput": 2723.58, "total_tokens": 596996288} {"current_steps": 3308, "total_steps": 9134, "loss": 0.5323, "learning_rate": 3.549049957916815e-05, "epoch": 0.3621336106625797, "percentage": 36.22, "elapsed_time": "2 days, 12:54:17", "remaining_time": "4 days, 11:15:52", "throughput": 2723.51, "total_tokens": 597149504} {"current_steps": 3309, "total_steps": 9134, "loss": 0.7142, "learning_rate": 3.548269399037562e-05, "epoch": 0.36224308273351763, "percentage": 36.23, "elapsed_time": "2 days, 12:55:23", "remaining_time": "4 days, 11:14:46", "throughput": 2723.51, "total_tokens": 597329824} {"current_steps": 3310, "total_steps": 9134, "loss": 0.7663, "learning_rate": 3.547488716150044e-05, "epoch": 0.3623525548044555, "percentage": 36.24, "elapsed_time": "2 days, 12:56:28", "remaining_time": "4 days, 11:13:36", "throughput": 2723.45, "total_tokens": 597491552} {"current_steps": 3311, "total_steps": 9134, "loss": 0.6858, "learning_rate": 3.546707909346613e-05, "epoch": 0.3624620268753934, "percentage": 36.25, "elapsed_time": "2 days, 12:57:37", "remaining_time": "4 days, 11:12:35", "throughput": 2723.44, "total_tokens": 597678144} {"current_steps": 3312, "total_steps": 9134, "loss": 0.8191, "learning_rate": 3.545926978719637e-05, "epoch": 0.36257149894633134, "percentage": 36.26, "elapsed_time": "2 days, 12:58:45", "remaining_time": "4 days, 11:11:32", "throughput": 2723.55, "total_tokens": 597886464} {"current_steps": 3313, "total_steps": 9134, "loss": 0.9161, "learning_rate": 3.545145924361499e-05, "epoch": 0.3626809710172692, "percentage": 36.27, "elapsed_time": "2 days, 12:59:54", "remaining_time": "4 days, 11:10:30", "throughput": 2723.64, "total_tokens": 598096576} {"current_steps": 3314, "total_steps": 9134, "loss": 0.7122, "learning_rate": 3.544364746364596e-05, "epoch": 0.3627904430882071, "percentage": 36.28, "elapsed_time": "2 days, 13:01:03", "remaining_time": "4 days, 11:09:29", "throughput": 2723.59, "total_tokens": 598273088} {"current_steps": 3315, "total_steps": 9134, "loss": 0.6235, "learning_rate": 3.54358344482134e-05, "epoch": 0.36289991515914505, "percentage": 36.29, "elapsed_time": "2 days, 13:02:11", "remaining_time": "4 days, 11:08:26", "throughput": 2723.56, "total_tokens": 598450720} {"current_steps": 3316, "total_steps": 9134, "loss": 0.7491, "learning_rate": 3.542802019824158e-05, "epoch": 0.3630093872300829, "percentage": 36.3, "elapsed_time": "2 days, 13:03:18", "remaining_time": "4 days, 11:07:21", "throughput": 2723.58, "total_tokens": 598638880} {"current_steps": 3317, "total_steps": 9134, "loss": 0.5544, "learning_rate": 3.5420204714654906e-05, "epoch": 0.36311885930102084, "percentage": 36.31, "elapsed_time": "2 days, 13:04:27", "remaining_time": "4 days, 11:06:19", "throughput": 2723.62, "total_tokens": 598834880} {"current_steps": 3318, "total_steps": 9134, "loss": 0.6329, "learning_rate": 3.5412387998377926e-05, "epoch": 0.3632283313719587, "percentage": 36.33, "elapsed_time": "2 days, 13:05:31", "remaining_time": "4 days, 11:05:09", "throughput": 2723.61, "total_tokens": 599006240} {"current_steps": 3319, "total_steps": 9134, "loss": 0.9257, "learning_rate": 3.5404570050335354e-05, "epoch": 0.3633378034428966, "percentage": 36.34, "elapsed_time": "2 days, 13:06:38", "remaining_time": "4 days, 11:04:04", "throughput": 2723.69, "total_tokens": 599208064} {"current_steps": 3320, "total_steps": 9134, "loss": 0.5907, "learning_rate": 3.5396750871452036e-05, "epoch": 0.36344727551383454, "percentage": 36.35, "elapsed_time": "2 days, 13:07:47", "remaining_time": "4 days, 11:03:02", "throughput": 2723.62, "total_tokens": 599379648} {"current_steps": 3321, "total_steps": 9134, "loss": 0.8463, "learning_rate": 3.538893046265297e-05, "epoch": 0.3635567475847724, "percentage": 36.36, "elapsed_time": "2 days, 13:08:56", "remaining_time": "4 days, 11:02:01", "throughput": 2723.69, "total_tokens": 599581920} {"current_steps": 3322, "total_steps": 9134, "loss": 0.6833, "learning_rate": 3.5381108824863284e-05, "epoch": 0.36366621965571033, "percentage": 36.37, "elapsed_time": "2 days, 13:10:02", "remaining_time": "4 days, 11:00:54", "throughput": 2723.71, "total_tokens": 599766048} {"current_steps": 3323, "total_steps": 9134, "loss": 0.6742, "learning_rate": 3.5373285959008265e-05, "epoch": 0.36377569172664825, "percentage": 36.38, "elapsed_time": "2 days, 13:11:11", "remaining_time": "4 days, 10:59:52", "throughput": 2723.87, "total_tokens": 599989376} {"current_steps": 3324, "total_steps": 9134, "loss": 0.6352, "learning_rate": 3.536546186601336e-05, "epoch": 0.3638851637975861, "percentage": 36.39, "elapsed_time": "2 days, 13:12:16", "remaining_time": "4 days, 10:58:45", "throughput": 2723.89, "total_tokens": 600173952} {"current_steps": 3325, "total_steps": 9134, "loss": 0.8862, "learning_rate": 3.5357636546804125e-05, "epoch": 0.36399463586852404, "percentage": 36.4, "elapsed_time": "2 days, 13:13:21", "remaining_time": "4 days, 10:57:37", "throughput": 2723.89, "total_tokens": 600350016} {"current_steps": 3326, "total_steps": 9134, "loss": 0.6444, "learning_rate": 3.534981000230629e-05, "epoch": 0.36410410793946196, "percentage": 36.41, "elapsed_time": "2 days, 13:14:29", "remaining_time": "4 days, 10:56:33", "throughput": 2723.9, "total_tokens": 600536608} {"current_steps": 3327, "total_steps": 9134, "loss": 0.7013, "learning_rate": 3.5341982233445715e-05, "epoch": 0.36421358001039983, "percentage": 36.42, "elapsed_time": "2 days, 13:15:35", "remaining_time": "4 days, 10:55:26", "throughput": 2723.91, "total_tokens": 600719616} {"current_steps": 3328, "total_steps": 9134, "loss": 0.8, "learning_rate": 3.533415324114841e-05, "epoch": 0.36432305208133775, "percentage": 36.44, "elapsed_time": "2 days, 13:16:43", "remaining_time": "4 days, 10:54:22", "throughput": 2723.93, "total_tokens": 600907552} {"current_steps": 3329, "total_steps": 9134, "loss": 0.5329, "learning_rate": 3.532632302634053e-05, "epoch": 0.36443252415227567, "percentage": 36.45, "elapsed_time": "2 days, 13:17:49", "remaining_time": "4 days, 10:53:15", "throughput": 2723.92, "total_tokens": 601085856} {"current_steps": 3330, "total_steps": 9134, "loss": 0.6869, "learning_rate": 3.531849158994839e-05, "epoch": 0.36454199622321354, "percentage": 36.46, "elapsed_time": "2 days, 13:18:51", "remaining_time": "4 days, 10:52:02", "throughput": 2723.9, "total_tokens": 601250272} {"current_steps": 3331, "total_steps": 9134, "loss": 0.6708, "learning_rate": 3.531065893289841e-05, "epoch": 0.36465146829415146, "percentage": 36.47, "elapsed_time": "2 days, 13:19:57", "remaining_time": "4 days, 10:50:55", "throughput": 2723.79, "total_tokens": 601406624} {"current_steps": 3332, "total_steps": 9134, "loss": 0.8848, "learning_rate": 3.530282505611719e-05, "epoch": 0.3647609403650894, "percentage": 36.48, "elapsed_time": "2 days, 13:21:05", "remaining_time": "4 days, 10:49:53", "throughput": 2723.83, "total_tokens": 601601728} {"current_steps": 3333, "total_steps": 9134, "loss": 0.7992, "learning_rate": 3.5294989960531456e-05, "epoch": 0.36487041243602725, "percentage": 36.49, "elapsed_time": "2 days, 13:22:13", "remaining_time": "4 days, 10:48:49", "throughput": 2723.9, "total_tokens": 601800640} {"current_steps": 3334, "total_steps": 9134, "loss": 0.684, "learning_rate": 3.52871536470681e-05, "epoch": 0.36497988450696517, "percentage": 36.5, "elapsed_time": "2 days, 13:23:19", "remaining_time": "4 days, 10:47:42", "throughput": 2723.73, "total_tokens": 601942880} {"current_steps": 3335, "total_steps": 9134, "loss": 0.665, "learning_rate": 3.5279316116654126e-05, "epoch": 0.36508935657790303, "percentage": 36.51, "elapsed_time": "2 days, 13:24:24", "remaining_time": "4 days, 10:46:34", "throughput": 2723.66, "total_tokens": 602105952} {"current_steps": 3336, "total_steps": 9134, "loss": 0.7021, "learning_rate": 3.527147737021671e-05, "epoch": 0.36519882864884096, "percentage": 36.52, "elapsed_time": "2 days, 13:25:33", "remaining_time": "4 days, 10:45:31", "throughput": 2723.6, "total_tokens": 602279104} {"current_steps": 3337, "total_steps": 9134, "loss": 0.6554, "learning_rate": 3.526363740868316e-05, "epoch": 0.3653083007197789, "percentage": 36.53, "elapsed_time": "2 days, 13:26:41", "remaining_time": "4 days, 10:44:28", "throughput": 2723.66, "total_tokens": 602478016} {"current_steps": 3338, "total_steps": 9134, "loss": 0.6294, "learning_rate": 3.525579623298092e-05, "epoch": 0.36541777279071674, "percentage": 36.54, "elapsed_time": "2 days, 13:27:49", "remaining_time": "4 days, 10:43:26", "throughput": 2723.76, "total_tokens": 602686560} {"current_steps": 3339, "total_steps": 9134, "loss": 0.7855, "learning_rate": 3.52479538440376e-05, "epoch": 0.36552724486165467, "percentage": 36.56, "elapsed_time": "2 days, 13:28:57", "remaining_time": "4 days, 10:42:22", "throughput": 2723.84, "total_tokens": 602887936} {"current_steps": 3340, "total_steps": 9134, "loss": 0.9159, "learning_rate": 3.5240110242780916e-05, "epoch": 0.3656367169325926, "percentage": 36.57, "elapsed_time": "2 days, 13:30:03", "remaining_time": "4 days, 10:41:16", "throughput": 2723.93, "total_tokens": 603089088} {"current_steps": 3341, "total_steps": 9134, "loss": 0.5979, "learning_rate": 3.5232265430138776e-05, "epoch": 0.36574618900353045, "percentage": 36.58, "elapsed_time": "2 days, 13:31:05", "remaining_time": "4 days, 10:40:01", "throughput": 2723.9, "total_tokens": 603250144} {"current_steps": 3342, "total_steps": 9134, "loss": 0.836, "learning_rate": 3.52244194070392e-05, "epoch": 0.3658556610744684, "percentage": 36.59, "elapsed_time": "2 days, 13:32:11", "remaining_time": "4 days, 10:38:55", "throughput": 2723.89, "total_tokens": 603428000} {"current_steps": 3343, "total_steps": 9134, "loss": 0.6995, "learning_rate": 3.521657217441034e-05, "epoch": 0.3659651331454063, "percentage": 36.6, "elapsed_time": "2 days, 13:33:15", "remaining_time": "4 days, 10:37:43", "throughput": 2723.82, "total_tokens": 603585472} {"current_steps": 3344, "total_steps": 9134, "loss": 0.6596, "learning_rate": 3.520872373318053e-05, "epoch": 0.36607460521634416, "percentage": 36.61, "elapsed_time": "2 days, 13:34:21", "remaining_time": "4 days, 10:36:37", "throughput": 2723.82, "total_tokens": 603764896} {"current_steps": 3345, "total_steps": 9134, "loss": 0.8945, "learning_rate": 3.520087408427822e-05, "epoch": 0.3661840772872821, "percentage": 36.62, "elapsed_time": "2 days, 13:35:30", "remaining_time": "4 days, 10:35:36", "throughput": 2723.9, "total_tokens": 603971648} {"current_steps": 3346, "total_steps": 9134, "loss": 0.9512, "learning_rate": 3.5193023228632003e-05, "epoch": 0.36629354935822, "percentage": 36.63, "elapsed_time": "2 days, 13:36:38", "remaining_time": "4 days, 10:34:33", "throughput": 2723.93, "total_tokens": 604164064} {"current_steps": 3347, "total_steps": 9134, "loss": 0.7553, "learning_rate": 3.518517116717063e-05, "epoch": 0.36640302142915787, "percentage": 36.64, "elapsed_time": "2 days, 13:37:44", "remaining_time": "4 days, 10:33:26", "throughput": 2723.89, "total_tokens": 604334528} {"current_steps": 3348, "total_steps": 9134, "loss": 0.6105, "learning_rate": 3.5177317900822974e-05, "epoch": 0.3665124935000958, "percentage": 36.65, "elapsed_time": "2 days, 13:38:51", "remaining_time": "4 days, 10:32:21", "throughput": 2723.96, "total_tokens": 604531424} {"current_steps": 3349, "total_steps": 9134, "loss": 0.6353, "learning_rate": 3.516946343051806e-05, "epoch": 0.3666219655710337, "percentage": 36.67, "elapsed_time": "2 days, 13:40:00", "remaining_time": "4 days, 10:31:20", "throughput": 2724.01, "total_tokens": 604732800} {"current_steps": 3350, "total_steps": 9134, "loss": 0.7061, "learning_rate": 3.516160775718508e-05, "epoch": 0.3667314376419716, "percentage": 36.68, "elapsed_time": "2 days, 13:41:08", "remaining_time": "4 days, 10:30:15", "throughput": 2724.11, "total_tokens": 604938880} {"current_steps": 3351, "total_steps": 9134, "loss": 0.6514, "learning_rate": 3.5153750881753314e-05, "epoch": 0.3668409097129095, "percentage": 36.69, "elapsed_time": "2 days, 13:42:11", "remaining_time": "4 days, 10:29:04", "throughput": 2724.07, "total_tokens": 605102624} {"current_steps": 3352, "total_steps": 9134, "loss": 0.7267, "learning_rate": 3.514589280515223e-05, "epoch": 0.3669503817838474, "percentage": 36.7, "elapsed_time": "2 days, 13:43:19", "remaining_time": "4 days, 10:28:00", "throughput": 2723.99, "total_tokens": 605268608} {"current_steps": 3353, "total_steps": 9134, "loss": 0.9207, "learning_rate": 3.513803352831143e-05, "epoch": 0.3670598538547853, "percentage": 36.71, "elapsed_time": "2 days, 13:44:25", "remaining_time": "4 days, 10:26:54", "throughput": 2723.98, "total_tokens": 605448256} {"current_steps": 3354, "total_steps": 9134, "loss": 0.7838, "learning_rate": 3.5130173052160645e-05, "epoch": 0.3671693259257232, "percentage": 36.72, "elapsed_time": "2 days, 13:45:32", "remaining_time": "4 days, 10:25:48", "throughput": 2724.03, "total_tokens": 605639552} {"current_steps": 3355, "total_steps": 9134, "loss": 0.5323, "learning_rate": 3.512231137762975e-05, "epoch": 0.3672787979966611, "percentage": 36.73, "elapsed_time": "2 days, 13:46:38", "remaining_time": "4 days, 10:24:42", "throughput": 2724.05, "total_tokens": 605824576} {"current_steps": 3356, "total_steps": 9134, "loss": 0.7502, "learning_rate": 3.5114448505648754e-05, "epoch": 0.367388270067599, "percentage": 36.74, "elapsed_time": "2 days, 13:47:47", "remaining_time": "4 days, 10:23:40", "throughput": 2724.07, "total_tokens": 606016768} {"current_steps": 3357, "total_steps": 9134, "loss": 0.5687, "learning_rate": 3.510658443714785e-05, "epoch": 0.3674977421385369, "percentage": 36.75, "elapsed_time": "2 days, 13:48:51", "remaining_time": "4 days, 10:22:29", "throughput": 2724.05, "total_tokens": 606185216} {"current_steps": 3358, "total_steps": 9134, "loss": 0.6255, "learning_rate": 3.509871917305734e-05, "epoch": 0.3676072142094748, "percentage": 36.76, "elapsed_time": "2 days, 13:49:59", "remaining_time": "4 days, 10:21:27", "throughput": 2724.06, "total_tokens": 606374272} {"current_steps": 3359, "total_steps": 9134, "loss": 0.5482, "learning_rate": 3.509085271430764e-05, "epoch": 0.3677166862804127, "percentage": 36.77, "elapsed_time": "2 days, 13:51:02", "remaining_time": "4 days, 10:20:14", "throughput": 2724.03, "total_tokens": 606539360} {"current_steps": 3360, "total_steps": 9134, "loss": 0.6908, "learning_rate": 3.508298506182936e-05, "epoch": 0.36782615835135063, "percentage": 36.79, "elapsed_time": "2 days, 13:52:09", "remaining_time": "4 days, 10:19:09", "throughput": 2724.06, "total_tokens": 606727968} {"current_steps": 3361, "total_steps": 9134, "loss": 0.5082, "learning_rate": 3.5075116216553225e-05, "epoch": 0.3679356304222885, "percentage": 36.8, "elapsed_time": "2 days, 13:53:17", "remaining_time": "4 days, 10:18:06", "throughput": 2724.14, "total_tokens": 606932928} {"current_steps": 3362, "total_steps": 9134, "loss": 0.9114, "learning_rate": 3.50672461794101e-05, "epoch": 0.3680451024932264, "percentage": 36.81, "elapsed_time": "2 days, 13:54:22", "remaining_time": "4 days, 10:16:58", "throughput": 2724.09, "total_tokens": 607099584} {"current_steps": 3363, "total_steps": 9134, "loss": 0.8327, "learning_rate": 3.5059374951330995e-05, "epoch": 0.36815457456416434, "percentage": 36.82, "elapsed_time": "2 days, 13:55:27", "remaining_time": "4 days, 10:15:50", "throughput": 2724.04, "total_tokens": 607264224} {"current_steps": 3364, "total_steps": 9134, "loss": 0.6214, "learning_rate": 3.505150253324706e-05, "epoch": 0.3682640466351022, "percentage": 36.83, "elapsed_time": "2 days, 13:56:35", "remaining_time": "4 days, 10:14:45", "throughput": 2724.09, "total_tokens": 607459104} {"current_steps": 3365, "total_steps": 9134, "loss": 0.7016, "learning_rate": 3.5043628926089596e-05, "epoch": 0.3683735187060401, "percentage": 36.84, "elapsed_time": "2 days, 13:57:40", "remaining_time": "4 days, 10:13:37", "throughput": 2724.13, "total_tokens": 607644800} {"current_steps": 3366, "total_steps": 9134, "loss": 0.6754, "learning_rate": 3.503575413079003e-05, "epoch": 0.36848299077697805, "percentage": 36.85, "elapsed_time": "2 days, 13:58:49", "remaining_time": "4 days, 10:12:36", "throughput": 2724.22, "total_tokens": 607854016} {"current_steps": 3367, "total_steps": 9134, "loss": 0.6725, "learning_rate": 3.502787814827994e-05, "epoch": 0.3685924628479159, "percentage": 36.86, "elapsed_time": "2 days, 13:59:56", "remaining_time": "4 days, 10:11:31", "throughput": 2724.25, "total_tokens": 608042400} {"current_steps": 3368, "total_steps": 9134, "loss": 0.6151, "learning_rate": 3.5020000979491025e-05, "epoch": 0.36870193491885384, "percentage": 36.87, "elapsed_time": "2 days, 14:01:02", "remaining_time": "4 days, 10:10:23", "throughput": 2724.2, "total_tokens": 608211072} {"current_steps": 3369, "total_steps": 9134, "loss": 0.6844, "learning_rate": 3.501212262535515e-05, "epoch": 0.36881140698979176, "percentage": 36.88, "elapsed_time": "2 days, 14:02:11", "remaining_time": "4 days, 10:09:22", "throughput": 2724.29, "total_tokens": 608418496} {"current_steps": 3370, "total_steps": 9134, "loss": 0.6813, "learning_rate": 3.500424308680431e-05, "epoch": 0.3689208790607296, "percentage": 36.9, "elapsed_time": "2 days, 14:03:16", "remaining_time": "4 days, 10:08:13", "throughput": 2724.2, "total_tokens": 608574624} {"current_steps": 3371, "total_steps": 9134, "loss": 0.5584, "learning_rate": 3.499636236477064e-05, "epoch": 0.36903035113166754, "percentage": 36.91, "elapsed_time": "2 days, 14:04:21", "remaining_time": "4 days, 10:07:05", "throughput": 2724.2, "total_tokens": 608753600} {"current_steps": 3372, "total_steps": 9134, "loss": 0.747, "learning_rate": 3.498848046018641e-05, "epoch": 0.3691398232026054, "percentage": 36.92, "elapsed_time": "2 days, 14:05:28", "remaining_time": "4 days, 10:06:01", "throughput": 2724.29, "total_tokens": 608956768} {"current_steps": 3373, "total_steps": 9134, "loss": 0.7515, "learning_rate": 3.498059737398405e-05, "epoch": 0.36924929527354333, "percentage": 36.93, "elapsed_time": "2 days, 14:06:33", "remaining_time": "4 days, 10:04:52", "throughput": 2724.35, "total_tokens": 609147392} {"current_steps": 3374, "total_steps": 9134, "loss": 0.6842, "learning_rate": 3.497271310709608e-05, "epoch": 0.36935876734448125, "percentage": 36.94, "elapsed_time": "2 days, 14:07:36", "remaining_time": "4 days, 10:03:40", "throughput": 2724.24, "total_tokens": 609293888} {"current_steps": 3375, "total_steps": 9134, "loss": 0.7378, "learning_rate": 3.4964827660455226e-05, "epoch": 0.3694682394154191, "percentage": 36.95, "elapsed_time": "2 days, 14:08:42", "remaining_time": "4 days, 10:02:32", "throughput": 2724.25, "total_tokens": 609474432} {"current_steps": 3376, "total_steps": 9134, "loss": 0.4927, "learning_rate": 3.495694103499431e-05, "epoch": 0.36957771148635704, "percentage": 36.96, "elapsed_time": "2 days, 14:09:47", "remaining_time": "4 days, 10:01:25", "throughput": 2724.31, "total_tokens": 609666176} {"current_steps": 3377, "total_steps": 9134, "loss": 0.7194, "learning_rate": 3.494905323164629e-05, "epoch": 0.36968718355729496, "percentage": 36.97, "elapsed_time": "2 days, 14:10:54", "remaining_time": "4 days, 10:00:20", "throughput": 2724.29, "total_tokens": 609844928} {"current_steps": 3378, "total_steps": 9134, "loss": 0.6797, "learning_rate": 3.4941164251344306e-05, "epoch": 0.36979665562823283, "percentage": 36.98, "elapsed_time": "2 days, 14:12:01", "remaining_time": "4 days, 9:59:15", "throughput": 2724.28, "total_tokens": 610026368} {"current_steps": 3379, "total_steps": 9134, "loss": 0.8618, "learning_rate": 3.493327409502159e-05, "epoch": 0.36990612769917075, "percentage": 36.99, "elapsed_time": "2 days, 14:13:09", "remaining_time": "4 days, 9:58:11", "throughput": 2724.33, "total_tokens": 610220576} {"current_steps": 3380, "total_steps": 9134, "loss": 0.7187, "learning_rate": 3.492538276361154e-05, "epoch": 0.37001559977010867, "percentage": 37.0, "elapsed_time": "2 days, 14:14:09", "remaining_time": "4 days, 9:56:54", "throughput": 2724.25, "total_tokens": 610367296} {"current_steps": 3381, "total_steps": 9134, "loss": 0.8269, "learning_rate": 3.491749025804768e-05, "epoch": 0.37012507184104654, "percentage": 37.02, "elapsed_time": "2 days, 14:15:14", "remaining_time": "4 days, 9:55:45", "throughput": 2724.24, "total_tokens": 610542016} {"current_steps": 3382, "total_steps": 9134, "loss": 0.7192, "learning_rate": 3.4909596579263685e-05, "epoch": 0.37023454391198446, "percentage": 37.03, "elapsed_time": "2 days, 14:16:22", "remaining_time": "4 days, 9:54:42", "throughput": 2724.33, "total_tokens": 610747872} {"current_steps": 3383, "total_steps": 9134, "loss": 0.5798, "learning_rate": 3.490170172819336e-05, "epoch": 0.3703440159829224, "percentage": 37.04, "elapsed_time": "2 days, 14:17:26", "remaining_time": "4 days, 9:53:32", "throughput": 2724.24, "total_tokens": 610901536} {"current_steps": 3384, "total_steps": 9134, "loss": 0.6032, "learning_rate": 3.489380570577064e-05, "epoch": 0.37045348805386025, "percentage": 37.05, "elapsed_time": "2 days, 14:18:31", "remaining_time": "4 days, 9:52:23", "throughput": 2724.19, "total_tokens": 611066848} {"current_steps": 3385, "total_steps": 9134, "loss": 0.759, "learning_rate": 3.488590851292963e-05, "epoch": 0.37056296012479817, "percentage": 37.06, "elapsed_time": "2 days, 14:19:39", "remaining_time": "4 days, 9:51:20", "throughput": 2724.33, "total_tokens": 611283680} {"current_steps": 3386, "total_steps": 9134, "loss": 0.6417, "learning_rate": 3.487801015060453e-05, "epoch": 0.3706724321957361, "percentage": 37.07, "elapsed_time": "2 days, 14:20:47", "remaining_time": "4 days, 9:50:17", "throughput": 2724.37, "total_tokens": 611478560} {"current_steps": 3387, "total_steps": 9134, "loss": 1.0781, "learning_rate": 3.487011061972972e-05, "epoch": 0.37078190426667396, "percentage": 37.08, "elapsed_time": "2 days, 14:21:56", "remaining_time": "4 days, 9:49:15", "throughput": 2724.46, "total_tokens": 611686432} {"current_steps": 3388, "total_steps": 9134, "loss": 0.6617, "learning_rate": 3.48622099212397e-05, "epoch": 0.3708913763376119, "percentage": 37.09, "elapsed_time": "2 days, 14:23:00", "remaining_time": "4 days, 9:48:06", "throughput": 2724.49, "total_tokens": 611868768} {"current_steps": 3389, "total_steps": 9134, "loss": 0.5927, "learning_rate": 3.485430805606909e-05, "epoch": 0.37100084840854974, "percentage": 37.1, "elapsed_time": "2 days, 14:24:03", "remaining_time": "4 days, 9:46:53", "throughput": 2724.36, "total_tokens": 612009216} {"current_steps": 3390, "total_steps": 9134, "loss": 0.8317, "learning_rate": 3.484640502515267e-05, "epoch": 0.37111032047948767, "percentage": 37.11, "elapsed_time": "2 days, 14:25:09", "remaining_time": "4 days, 9:45:46", "throughput": 2724.41, "total_tokens": 612200736} {"current_steps": 3391, "total_steps": 9134, "loss": 0.8839, "learning_rate": 3.483850082942537e-05, "epoch": 0.3712197925504256, "percentage": 37.13, "elapsed_time": "2 days, 14:26:18", "remaining_time": "4 days, 9:44:44", "throughput": 2724.57, "total_tokens": 612423840} {"current_steps": 3392, "total_steps": 9134, "loss": 0.7767, "learning_rate": 3.4830595469822224e-05, "epoch": 0.37132926462136345, "percentage": 37.14, "elapsed_time": "2 days, 14:27:24", "remaining_time": "4 days, 9:43:37", "throughput": 2724.54, "total_tokens": 612597888} {"current_steps": 3393, "total_steps": 9134, "loss": 0.7403, "learning_rate": 3.482268894727843e-05, "epoch": 0.3714387366923014, "percentage": 37.15, "elapsed_time": "2 days, 14:28:27", "remaining_time": "4 days, 9:42:25", "throughput": 2724.5, "total_tokens": 612759616} {"current_steps": 3394, "total_steps": 9134, "loss": 0.7046, "learning_rate": 3.481478126272931e-05, "epoch": 0.3715482087632393, "percentage": 37.16, "elapsed_time": "2 days, 14:29:32", "remaining_time": "4 days, 9:41:17", "throughput": 2724.44, "total_tokens": 612924928} {"current_steps": 3395, "total_steps": 9134, "loss": 0.6082, "learning_rate": 3.4806872417110333e-05, "epoch": 0.37165768083417716, "percentage": 37.17, "elapsed_time": "2 days, 14:30:35", "remaining_time": "4 days, 9:40:05", "throughput": 2724.46, "total_tokens": 613099424} {"current_steps": 3396, "total_steps": 9134, "loss": 0.8083, "learning_rate": 3.479896241135709e-05, "epoch": 0.3717671529051151, "percentage": 37.18, "elapsed_time": "2 days, 14:31:39", "remaining_time": "4 days, 9:38:55", "throughput": 2724.49, "total_tokens": 613279744} {"current_steps": 3397, "total_steps": 9134, "loss": 0.5648, "learning_rate": 3.4791051246405326e-05, "epoch": 0.371876624976053, "percentage": 37.19, "elapsed_time": "2 days, 14:32:48", "remaining_time": "4 days, 9:37:53", "throughput": 2724.41, "total_tokens": 613451552} {"current_steps": 3398, "total_steps": 9134, "loss": 0.6135, "learning_rate": 3.478313892319092e-05, "epoch": 0.37198609704699087, "percentage": 37.2, "elapsed_time": "2 days, 14:33:57", "remaining_time": "4 days, 9:36:52", "throughput": 2724.41, "total_tokens": 613638592} {"current_steps": 3399, "total_steps": 9134, "loss": 0.5899, "learning_rate": 3.477522544264988e-05, "epoch": 0.3720955691179288, "percentage": 37.21, "elapsed_time": "2 days, 14:35:03", "remaining_time": "4 days, 9:35:45", "throughput": 2724.38, "total_tokens": 613812192} {"current_steps": 3400, "total_steps": 9134, "loss": 0.6572, "learning_rate": 3.4767310805718355e-05, "epoch": 0.3722050411888667, "percentage": 37.22, "elapsed_time": "2 days, 14:36:11", "remaining_time": "4 days, 9:34:43", "throughput": 2724.43, "total_tokens": 614010208} {"current_steps": 3401, "total_steps": 9134, "loss": 0.8875, "learning_rate": 3.475939501333264e-05, "epoch": 0.3723145132598046, "percentage": 37.23, "elapsed_time": "2 days, 14:37:20", "remaining_time": "4 days, 9:33:40", "throughput": 2724.49, "total_tokens": 614209120} {"current_steps": 3402, "total_steps": 9134, "loss": 0.574, "learning_rate": 3.4751478066429156e-05, "epoch": 0.3724239853307425, "percentage": 37.25, "elapsed_time": "2 days, 14:38:27", "remaining_time": "4 days, 9:32:36", "throughput": 2724.52, "total_tokens": 614400640} {"current_steps": 3403, "total_steps": 9134, "loss": 0.79, "learning_rate": 3.474355996594445e-05, "epoch": 0.3725334574016804, "percentage": 37.26, "elapsed_time": "2 days, 14:39:34", "remaining_time": "4 days, 9:31:30", "throughput": 2724.61, "total_tokens": 614602016} {"current_steps": 3404, "total_steps": 9134, "loss": 0.8379, "learning_rate": 3.473564071281522e-05, "epoch": 0.3726429294726183, "percentage": 37.27, "elapsed_time": "2 days, 14:40:42", "remaining_time": "4 days, 9:30:27", "throughput": 2724.68, "total_tokens": 614802720} {"current_steps": 3405, "total_steps": 9134, "loss": 0.7605, "learning_rate": 3.472772030797832e-05, "epoch": 0.3727524015435562, "percentage": 37.28, "elapsed_time": "2 days, 14:41:46", "remaining_time": "4 days, 9:29:16", "throughput": 2724.67, "total_tokens": 614975648} {"current_steps": 3406, "total_steps": 9134, "loss": 0.6571, "learning_rate": 3.4719798752370694e-05, "epoch": 0.3728618736144941, "percentage": 37.29, "elapsed_time": "2 days, 14:42:55", "remaining_time": "4 days, 9:28:14", "throughput": 2724.8, "total_tokens": 615192704} {"current_steps": 3407, "total_steps": 9134, "loss": 0.7727, "learning_rate": 3.471187604692945e-05, "epoch": 0.372971345685432, "percentage": 37.3, "elapsed_time": "2 days, 14:44:03", "remaining_time": "4 days, 9:27:12", "throughput": 2724.79, "total_tokens": 615376160} {"current_steps": 3408, "total_steps": 9134, "loss": 0.6472, "learning_rate": 3.470395219259185e-05, "epoch": 0.3730808177563699, "percentage": 37.31, "elapsed_time": "2 days, 14:45:08", "remaining_time": "4 days, 9:26:02", "throughput": 2724.75, "total_tokens": 615542592} {"current_steps": 3409, "total_steps": 9134, "loss": 0.486, "learning_rate": 3.469602719029526e-05, "epoch": 0.3731902898273078, "percentage": 37.32, "elapsed_time": "2 days, 14:46:15", "remaining_time": "4 days, 9:24:57", "throughput": 2724.7, "total_tokens": 615714400} {"current_steps": 3410, "total_steps": 9134, "loss": 0.7045, "learning_rate": 3.4688101040977164e-05, "epoch": 0.3732997618982457, "percentage": 37.33, "elapsed_time": "2 days, 14:47:14", "remaining_time": "4 days, 9:23:40", "throughput": 2724.61, "total_tokens": 615856192} {"current_steps": 3411, "total_steps": 9134, "loss": 0.8153, "learning_rate": 3.468017374557526e-05, "epoch": 0.37340923396918363, "percentage": 37.34, "elapsed_time": "2 days, 14:48:23", "remaining_time": "4 days, 9:22:38", "throughput": 2724.69, "total_tokens": 616062048} {"current_steps": 3412, "total_steps": 9134, "loss": 0.8219, "learning_rate": 3.46722453050273e-05, "epoch": 0.3735187060401215, "percentage": 37.35, "elapsed_time": "2 days, 14:49:27", "remaining_time": "4 days, 9:21:27", "throughput": 2724.63, "total_tokens": 616221312} {"current_steps": 3413, "total_steps": 9134, "loss": 0.7456, "learning_rate": 3.466431572027121e-05, "epoch": 0.3736281781110594, "percentage": 37.37, "elapsed_time": "2 days, 14:50:33", "remaining_time": "4 days, 9:20:21", "throughput": 2724.65, "total_tokens": 616406336} {"current_steps": 3414, "total_steps": 9134, "loss": 0.7126, "learning_rate": 3.465638499224504e-05, "epoch": 0.37373765018199734, "percentage": 37.38, "elapsed_time": "2 days, 14:51:38", "remaining_time": "4 days, 9:19:13", "throughput": 2724.61, "total_tokens": 616576352} {"current_steps": 3415, "total_steps": 9134, "loss": 0.7554, "learning_rate": 3.4648453121886994e-05, "epoch": 0.3738471222529352, "percentage": 37.39, "elapsed_time": "2 days, 14:52:43", "remaining_time": "4 days, 9:18:04", "throughput": 2724.53, "total_tokens": 616733824} {"current_steps": 3416, "total_steps": 9134, "loss": 0.75, "learning_rate": 3.464052011013539e-05, "epoch": 0.3739565943238731, "percentage": 37.4, "elapsed_time": "2 days, 14:53:49", "remaining_time": "4 days, 9:16:57", "throughput": 2724.49, "total_tokens": 616903168} {"current_steps": 3417, "total_steps": 9134, "loss": 0.6599, "learning_rate": 3.463258595792867e-05, "epoch": 0.37406606639481105, "percentage": 37.41, "elapsed_time": "2 days, 14:54:58", "remaining_time": "4 days, 9:15:56", "throughput": 2724.6, "total_tokens": 617118880} {"current_steps": 3418, "total_steps": 9134, "loss": 0.7821, "learning_rate": 3.462465066620546e-05, "epoch": 0.3741755384657489, "percentage": 37.42, "elapsed_time": "2 days, 14:56:03", "remaining_time": "4 days, 9:14:47", "throughput": 2724.58, "total_tokens": 617292032} {"current_steps": 3419, "total_steps": 9134, "loss": 0.7024, "learning_rate": 3.461671423590447e-05, "epoch": 0.37428501053668684, "percentage": 37.43, "elapsed_time": "2 days, 14:57:06", "remaining_time": "4 days, 9:13:36", "throughput": 2724.59, "total_tokens": 617464288} {"current_steps": 3420, "total_steps": 9134, "loss": 0.7639, "learning_rate": 3.460877666796457e-05, "epoch": 0.37439448260762476, "percentage": 37.44, "elapsed_time": "2 days, 14:58:10", "remaining_time": "4 days, 9:12:25", "throughput": 2724.61, "total_tokens": 617644384} {"current_steps": 3421, "total_steps": 9134, "loss": 0.6281, "learning_rate": 3.460083796332476e-05, "epoch": 0.3745039546785626, "percentage": 37.45, "elapsed_time": "2 days, 14:59:13", "remaining_time": "4 days, 9:11:14", "throughput": 2724.57, "total_tokens": 617805664} {"current_steps": 3422, "total_steps": 9134, "loss": 0.8818, "learning_rate": 3.459289812292418e-05, "epoch": 0.37461342674950054, "percentage": 37.46, "elapsed_time": "2 days, 15:00:21", "remaining_time": "4 days, 9:10:09", "throughput": 2724.54, "total_tokens": 617983744} {"current_steps": 3423, "total_steps": 9134, "loss": 0.7425, "learning_rate": 3.458495714770208e-05, "epoch": 0.3747228988204384, "percentage": 37.48, "elapsed_time": "2 days, 15:01:25", "remaining_time": "4 days, 9:09:00", "throughput": 2724.58, "total_tokens": 618167200} {"current_steps": 3424, "total_steps": 9134, "loss": 0.5721, "learning_rate": 3.4577015038597874e-05, "epoch": 0.37483237089137633, "percentage": 37.49, "elapsed_time": "2 days, 15:02:25", "remaining_time": "4 days, 9:07:42", "throughput": 2724.5, "total_tokens": 618313248} {"current_steps": 3425, "total_steps": 9134, "loss": 0.7513, "learning_rate": 3.45690717965511e-05, "epoch": 0.37494184296231425, "percentage": 37.5, "elapsed_time": "2 days, 15:03:31", "remaining_time": "4 days, 9:06:36", "throughput": 2724.51, "total_tokens": 618495136} {"current_steps": 3426, "total_steps": 9134, "loss": 0.5456, "learning_rate": 3.456112742250143e-05, "epoch": 0.3750513150332521, "percentage": 37.51, "elapsed_time": "2 days, 15:04:36", "remaining_time": "4 days, 9:05:27", "throughput": 2724.46, "total_tokens": 618659104} {"current_steps": 3427, "total_steps": 9134, "loss": 0.5851, "learning_rate": 3.4553181917388664e-05, "epoch": 0.37516078710419004, "percentage": 37.52, "elapsed_time": "2 days, 15:05:44", "remaining_time": "4 days, 9:04:24", "throughput": 2724.43, "total_tokens": 618840096} {"current_steps": 3428, "total_steps": 9134, "loss": 0.9804, "learning_rate": 3.4545235282152724e-05, "epoch": 0.37527025917512796, "percentage": 37.53, "elapsed_time": "2 days, 15:06:48", "remaining_time": "4 days, 9:03:14", "throughput": 2724.38, "total_tokens": 619003392} {"current_steps": 3429, "total_steps": 9134, "loss": 0.555, "learning_rate": 3.4537287517733713e-05, "epoch": 0.37537973124606583, "percentage": 37.54, "elapsed_time": "2 days, 15:07:57", "remaining_time": "4 days, 9:02:13", "throughput": 2724.38, "total_tokens": 619192000} {"current_steps": 3430, "total_steps": 9134, "loss": 0.7426, "learning_rate": 3.452933862507182e-05, "epoch": 0.37548920331700375, "percentage": 37.55, "elapsed_time": "2 days, 15:09:01", "remaining_time": "4 days, 9:01:02", "throughput": 2724.36, "total_tokens": 619360224} {"current_steps": 3431, "total_steps": 9134, "loss": 0.7633, "learning_rate": 3.452138860510737e-05, "epoch": 0.37559867538794167, "percentage": 37.56, "elapsed_time": "2 days, 15:10:10", "remaining_time": "4 days, 9:00:00", "throughput": 2724.42, "total_tokens": 619561824} {"current_steps": 3432, "total_steps": 9134, "loss": 0.779, "learning_rate": 3.451343745878086e-05, "epoch": 0.37570814745887954, "percentage": 37.57, "elapsed_time": "2 days, 15:11:16", "remaining_time": "4 days, 8:58:54", "throughput": 2724.5, "total_tokens": 619759168} {"current_steps": 3433, "total_steps": 9134, "loss": 0.5906, "learning_rate": 3.4505485187032894e-05, "epoch": 0.37581761952981746, "percentage": 37.58, "elapsed_time": "2 days, 15:12:24", "remaining_time": "4 days, 8:57:51", "throughput": 2724.63, "total_tokens": 619975776} {"current_steps": 3434, "total_steps": 9134, "loss": 0.6173, "learning_rate": 3.4497531790804194e-05, "epoch": 0.3759270916007554, "percentage": 37.6, "elapsed_time": "2 days, 15:13:29", "remaining_time": "4 days, 8:56:43", "throughput": 2724.65, "total_tokens": 620158336} {"current_steps": 3435, "total_steps": 9134, "loss": 0.8563, "learning_rate": 3.448957727103564e-05, "epoch": 0.37603656367169325, "percentage": 37.61, "elapsed_time": "2 days, 15:14:35", "remaining_time": "4 days, 8:55:36", "throughput": 2724.69, "total_tokens": 620345376} {"current_steps": 3436, "total_steps": 9134, "loss": 0.5848, "learning_rate": 3.448162162866823e-05, "epoch": 0.37614603574263117, "percentage": 37.62, "elapsed_time": "2 days, 15:15:43", "remaining_time": "4 days, 8:54:31", "throughput": 2724.71, "total_tokens": 620533984} {"current_steps": 3437, "total_steps": 9134, "loss": 0.7495, "learning_rate": 3.447366486464312e-05, "epoch": 0.3762555078135691, "percentage": 37.63, "elapsed_time": "2 days, 15:16:51", "remaining_time": "4 days, 8:53:28", "throughput": 2724.79, "total_tokens": 620738272} {"current_steps": 3438, "total_steps": 9134, "loss": 0.7797, "learning_rate": 3.446570697990155e-05, "epoch": 0.37636497988450696, "percentage": 37.64, "elapsed_time": "2 days, 15:17:53", "remaining_time": "4 days, 8:52:16", "throughput": 2724.77, "total_tokens": 620902912} {"current_steps": 3439, "total_steps": 9134, "loss": 0.8431, "learning_rate": 3.445774797538495e-05, "epoch": 0.3764744519554449, "percentage": 37.65, "elapsed_time": "2 days, 15:19:00", "remaining_time": "4 days, 8:51:10", "throughput": 2724.81, "total_tokens": 621094432} {"current_steps": 3440, "total_steps": 9134, "loss": 0.5268, "learning_rate": 3.444978785203484e-05, "epoch": 0.37658392402638274, "percentage": 37.66, "elapsed_time": "2 days, 15:20:03", "remaining_time": "4 days, 8:49:58", "throughput": 2724.77, "total_tokens": 621257504} {"current_steps": 3441, "total_steps": 9134, "loss": 0.5065, "learning_rate": 3.44418266107929e-05, "epoch": 0.37669339609732067, "percentage": 37.67, "elapsed_time": "2 days, 15:21:07", "remaining_time": "4 days, 8:48:48", "throughput": 2724.67, "total_tokens": 621409600} {"current_steps": 3442, "total_steps": 9134, "loss": 0.7604, "learning_rate": 3.4433864252600916e-05, "epoch": 0.3768028681682586, "percentage": 37.68, "elapsed_time": "2 days, 15:22:13", "remaining_time": "4 days, 8:47:42", "throughput": 2724.73, "total_tokens": 621602464} {"current_steps": 3443, "total_steps": 9134, "loss": 0.5679, "learning_rate": 3.442590077840083e-05, "epoch": 0.37691234023919645, "percentage": 37.69, "elapsed_time": "2 days, 15:23:13", "remaining_time": "4 days, 8:46:25", "throughput": 2724.65, "total_tokens": 621746720} {"current_steps": 3444, "total_steps": 9134, "loss": 0.7557, "learning_rate": 3.441793618913469e-05, "epoch": 0.3770218123101344, "percentage": 37.71, "elapsed_time": "2 days, 15:24:14", "remaining_time": "4 days, 8:45:10", "throughput": 2724.5, "total_tokens": 621880000} {"current_steps": 3445, "total_steps": 9134, "loss": 0.5577, "learning_rate": 3.4409970485744714e-05, "epoch": 0.3771312843810723, "percentage": 37.72, "elapsed_time": "2 days, 15:25:18", "remaining_time": "4 days, 8:44:00", "throughput": 2724.52, "total_tokens": 622058528} {"current_steps": 3446, "total_steps": 9134, "loss": 0.604, "learning_rate": 3.440200366917321e-05, "epoch": 0.37724075645201016, "percentage": 37.73, "elapsed_time": "2 days, 15:26:22", "remaining_time": "4 days, 8:42:50", "throughput": 2724.44, "total_tokens": 622214208} {"current_steps": 3447, "total_steps": 9134, "loss": 0.6832, "learning_rate": 3.439403574036266e-05, "epoch": 0.3773502285229481, "percentage": 37.74, "elapsed_time": "2 days, 15:27:27", "remaining_time": "4 days, 8:41:42", "throughput": 2724.45, "total_tokens": 622395648} {"current_steps": 3448, "total_steps": 9134, "loss": 0.7479, "learning_rate": 3.438606670025563e-05, "epoch": 0.377459700593886, "percentage": 37.75, "elapsed_time": "2 days, 15:28:33", "remaining_time": "4 days, 8:40:35", "throughput": 2724.48, "total_tokens": 622581344} {"current_steps": 3449, "total_steps": 9134, "loss": 0.6944, "learning_rate": 3.437809654979485e-05, "epoch": 0.37756917266482387, "percentage": 37.76, "elapsed_time": "2 days, 15:29:42", "remaining_time": "4 days, 8:39:32", "throughput": 2724.51, "total_tokens": 622775104} {"current_steps": 3450, "total_steps": 9134, "loss": 0.7201, "learning_rate": 3.4370125289923176e-05, "epoch": 0.3776786447357618, "percentage": 37.77, "elapsed_time": "2 days, 15:30:45", "remaining_time": "4 days, 8:38:21", "throughput": 2724.41, "total_tokens": 622923392} {"current_steps": 3451, "total_steps": 9134, "loss": 0.752, "learning_rate": 3.436215292158359e-05, "epoch": 0.3777881168066997, "percentage": 37.78, "elapsed_time": "2 days, 15:31:54", "remaining_time": "4 days, 8:37:19", "throughput": 2724.44, "total_tokens": 623118272} {"current_steps": 3452, "total_steps": 9134, "loss": 0.6996, "learning_rate": 3.435417944571922e-05, "epoch": 0.3778975888776376, "percentage": 37.79, "elapsed_time": "2 days, 15:32:58", "remaining_time": "4 days, 8:36:10", "throughput": 2724.42, "total_tokens": 623289632} {"current_steps": 3453, "total_steps": 9134, "loss": 0.5636, "learning_rate": 3.4346204863273304e-05, "epoch": 0.3780070609485755, "percentage": 37.8, "elapsed_time": "2 days, 15:34:03", "remaining_time": "4 days, 8:35:00", "throughput": 2724.43, "total_tokens": 623467488} {"current_steps": 3454, "total_steps": 9134, "loss": 0.7555, "learning_rate": 3.433822917518921e-05, "epoch": 0.3781165330195134, "percentage": 37.81, "elapsed_time": "2 days, 15:35:12", "remaining_time": "4 days, 8:33:59", "throughput": 2724.46, "total_tokens": 623661920} {"current_steps": 3455, "total_steps": 9134, "loss": 0.6554, "learning_rate": 3.433025238241047e-05, "epoch": 0.3782260050904513, "percentage": 37.83, "elapsed_time": "2 days, 15:36:14", "remaining_time": "4 days, 8:32:47", "throughput": 2724.45, "total_tokens": 623831040} {"current_steps": 3456, "total_steps": 9134, "loss": 0.631, "learning_rate": 3.43222744858807e-05, "epoch": 0.3783354771613892, "percentage": 37.84, "elapsed_time": "2 days, 15:37:20", "remaining_time": "4 days, 8:31:39", "throughput": 2724.49, "total_tokens": 624018976} {"current_steps": 3457, "total_steps": 9134, "loss": 0.6552, "learning_rate": 3.431429548654368e-05, "epoch": 0.3784449492323271, "percentage": 37.85, "elapsed_time": "2 days, 15:38:27", "remaining_time": "4 days, 8:30:35", "throughput": 2724.43, "total_tokens": 624187648} {"current_steps": 3458, "total_steps": 9134, "loss": 0.714, "learning_rate": 3.4306315385343316e-05, "epoch": 0.378554421303265, "percentage": 37.86, "elapsed_time": "2 days, 15:39:35", "remaining_time": "4 days, 8:29:31", "throughput": 2724.45, "total_tokens": 624377600} {"current_steps": 3459, "total_steps": 9134, "loss": 0.5447, "learning_rate": 3.4298334183223624e-05, "epoch": 0.3786638933742029, "percentage": 37.87, "elapsed_time": "2 days, 15:40:40", "remaining_time": "4 days, 8:28:22", "throughput": 2724.42, "total_tokens": 624547392} {"current_steps": 3460, "total_steps": 9134, "loss": 0.7613, "learning_rate": 3.4290351881128767e-05, "epoch": 0.3787733654451408, "percentage": 37.88, "elapsed_time": "2 days, 15:41:46", "remaining_time": "4 days, 8:27:16", "throughput": 2724.48, "total_tokens": 624742720} {"current_steps": 3461, "total_steps": 9134, "loss": 0.6768, "learning_rate": 3.4282368480003056e-05, "epoch": 0.3788828375160787, "percentage": 37.89, "elapsed_time": "2 days, 15:42:55", "remaining_time": "4 days, 8:26:14", "throughput": 2724.61, "total_tokens": 624959776} {"current_steps": 3462, "total_steps": 9134, "loss": 0.6703, "learning_rate": 3.42743839807909e-05, "epoch": 0.37899230958701663, "percentage": 37.9, "elapsed_time": "2 days, 15:44:00", "remaining_time": "4 days, 8:25:05", "throughput": 2724.52, "total_tokens": 625115680} {"current_steps": 3463, "total_steps": 9134, "loss": 0.7018, "learning_rate": 3.426639838443684e-05, "epoch": 0.3791017816579545, "percentage": 37.91, "elapsed_time": "2 days, 15:45:07", "remaining_time": "4 days, 8:24:00", "throughput": 2724.55, "total_tokens": 625303616} {"current_steps": 3464, "total_steps": 9134, "loss": 0.5344, "learning_rate": 3.4258411691885575e-05, "epoch": 0.3792112537288924, "percentage": 37.92, "elapsed_time": "2 days, 15:46:14", "remaining_time": "4 days, 8:22:55", "throughput": 2724.54, "total_tokens": 625484384} {"current_steps": 3465, "total_steps": 9134, "loss": 0.6884, "learning_rate": 3.425042390408189e-05, "epoch": 0.37932072579983034, "percentage": 37.94, "elapsed_time": "2 days, 15:47:16", "remaining_time": "4 days, 8:21:41", "throughput": 2724.46, "total_tokens": 625635360} {"current_steps": 3466, "total_steps": 9134, "loss": 0.7606, "learning_rate": 3.424243502197076e-05, "epoch": 0.3794301978707682, "percentage": 37.95, "elapsed_time": "2 days, 15:48:21", "remaining_time": "4 days, 8:20:33", "throughput": 2724.49, "total_tokens": 625817696} {"current_steps": 3467, "total_steps": 9134, "loss": 0.723, "learning_rate": 3.4234445046497225e-05, "epoch": 0.3795396699417061, "percentage": 37.96, "elapsed_time": "2 days, 15:49:29", "remaining_time": "4 days, 8:19:31", "throughput": 2724.45, "total_tokens": 625996672} {"current_steps": 3468, "total_steps": 9134, "loss": 0.5086, "learning_rate": 3.42264539786065e-05, "epoch": 0.37964914201264405, "percentage": 37.97, "elapsed_time": "2 days, 15:50:32", "remaining_time": "4 days, 8:18:19", "throughput": 2724.43, "total_tokens": 626164224} {"current_steps": 3469, "total_steps": 9134, "loss": 0.8155, "learning_rate": 3.421846181924391e-05, "epoch": 0.3797586140835819, "percentage": 37.98, "elapsed_time": "2 days, 15:51:40", "remaining_time": "4 days, 8:17:15", "throughput": 2724.45, "total_tokens": 626350816} {"current_steps": 3470, "total_steps": 9134, "loss": 0.511, "learning_rate": 3.421046856935489e-05, "epoch": 0.37986808615451984, "percentage": 37.99, "elapsed_time": "2 days, 15:52:43", "remaining_time": "4 days, 8:16:04", "throughput": 2724.42, "total_tokens": 626517248} {"current_steps": 3471, "total_steps": 9134, "loss": 0.5787, "learning_rate": 3.420247422988506e-05, "epoch": 0.37997755822545776, "percentage": 38.0, "elapsed_time": "2 days, 15:53:49", "remaining_time": "4 days, 8:14:56", "throughput": 2724.31, "total_tokens": 626670464} {"current_steps": 3472, "total_steps": 9134, "loss": 0.6905, "learning_rate": 3.4194478801780116e-05, "epoch": 0.3800870302963956, "percentage": 38.01, "elapsed_time": "2 days, 15:54:52", "remaining_time": "4 days, 8:13:45", "throughput": 2724.34, "total_tokens": 626848544} {"current_steps": 3473, "total_steps": 9134, "loss": 0.645, "learning_rate": 3.4186482285985915e-05, "epoch": 0.38019650236733354, "percentage": 38.02, "elapsed_time": "2 days, 15:55:57", "remaining_time": "4 days, 8:12:36", "throughput": 2724.31, "total_tokens": 627019232} {"current_steps": 3474, "total_steps": 9134, "loss": 0.6214, "learning_rate": 3.417848468344842e-05, "epoch": 0.3803059744382714, "percentage": 38.03, "elapsed_time": "2 days, 15:57:05", "remaining_time": "4 days, 8:11:34", "throughput": 2724.34, "total_tokens": 627213664} {"current_steps": 3475, "total_steps": 9134, "loss": 0.726, "learning_rate": 3.417048599511373e-05, "epoch": 0.38041544650920933, "percentage": 38.04, "elapsed_time": "2 days, 15:58:09", "remaining_time": "4 days, 8:10:23", "throughput": 2724.31, "total_tokens": 627378752} {"current_steps": 3476, "total_steps": 9134, "loss": 0.5725, "learning_rate": 3.416248622192807e-05, "epoch": 0.38052491858014725, "percentage": 38.06, "elapsed_time": "2 days, 15:59:14", "remaining_time": "4 days, 8:09:15", "throughput": 2724.28, "total_tokens": 627549888} {"current_steps": 3477, "total_steps": 9134, "loss": 0.6593, "learning_rate": 3.415448536483782e-05, "epoch": 0.3806343906510851, "percentage": 38.07, "elapsed_time": "2 days, 16:00:15", "remaining_time": "4 days, 8:08:00", "throughput": 2724.25, "total_tokens": 627709152} {"current_steps": 3478, "total_steps": 9134, "loss": 0.8815, "learning_rate": 3.4146483424789445e-05, "epoch": 0.38074386272202304, "percentage": 38.08, "elapsed_time": "2 days, 16:01:20", "remaining_time": "4 days, 8:06:52", "throughput": 2724.28, "total_tokens": 627892160} {"current_steps": 3479, "total_steps": 9134, "loss": 0.6754, "learning_rate": 3.4138480402729564e-05, "epoch": 0.38085333479296096, "percentage": 38.09, "elapsed_time": "2 days, 16:02:24", "remaining_time": "4 days, 8:05:42", "throughput": 2724.27, "total_tokens": 628064640} {"current_steps": 3480, "total_steps": 9134, "loss": 0.9209, "learning_rate": 3.413047629960492e-05, "epoch": 0.38096280686389883, "percentage": 38.1, "elapsed_time": "2 days, 16:03:33", "remaining_time": "4 days, 8:04:40", "throughput": 2724.28, "total_tokens": 628253696} {"current_steps": 3481, "total_steps": 9134, "loss": 0.7456, "learning_rate": 3.412247111636239e-05, "epoch": 0.38107227893483675, "percentage": 38.11, "elapsed_time": "2 days, 16:04:39", "remaining_time": "4 days, 8:03:33", "throughput": 2724.24, "total_tokens": 628425280} {"current_steps": 3482, "total_steps": 9134, "loss": 0.781, "learning_rate": 3.411446485394896e-05, "epoch": 0.38118175100577467, "percentage": 38.12, "elapsed_time": "2 days, 16:05:45", "remaining_time": "4 days, 8:02:27", "throughput": 2724.25, "total_tokens": 628607616} {"current_steps": 3483, "total_steps": 9134, "loss": 0.5653, "learning_rate": 3.410645751331176e-05, "epoch": 0.38129122307671254, "percentage": 38.13, "elapsed_time": "2 days, 16:06:48", "remaining_time": "4 days, 8:01:15", "throughput": 2724.31, "total_tokens": 628793536} {"current_steps": 3484, "total_steps": 9134, "loss": 0.5763, "learning_rate": 3.4098449095398054e-05, "epoch": 0.38140069514765046, "percentage": 38.14, "elapsed_time": "2 days, 16:07:55", "remaining_time": "4 days, 8:00:11", "throughput": 2724.34, "total_tokens": 628984160} {"current_steps": 3485, "total_steps": 9134, "loss": 0.6494, "learning_rate": 3.409043960115521e-05, "epoch": 0.3815101672185884, "percentage": 38.15, "elapsed_time": "2 days, 16:08:58", "remaining_time": "4 days, 7:58:59", "throughput": 2724.28, "total_tokens": 629142304} {"current_steps": 3486, "total_steps": 9134, "loss": 0.7008, "learning_rate": 3.408242903153074e-05, "epoch": 0.38161963928952625, "percentage": 38.17, "elapsed_time": "2 days, 16:10:04", "remaining_time": "4 days, 7:57:52", "throughput": 2724.32, "total_tokens": 629330016} {"current_steps": 3487, "total_steps": 9134, "loss": 0.7423, "learning_rate": 3.4074417387472274e-05, "epoch": 0.38172911136046417, "percentage": 38.18, "elapsed_time": "2 days, 16:11:09", "remaining_time": "4 days, 7:56:43", "throughput": 2724.38, "total_tokens": 629520864} {"current_steps": 3488, "total_steps": 9134, "loss": 0.5757, "learning_rate": 3.406640466992758e-05, "epoch": 0.3818385834314021, "percentage": 38.19, "elapsed_time": "2 days, 16:12:14", "remaining_time": "4 days, 7:55:36", "throughput": 2724.42, "total_tokens": 629708128} {"current_steps": 3489, "total_steps": 9134, "loss": 0.5804, "learning_rate": 3.405839087984455e-05, "epoch": 0.38194805550233996, "percentage": 38.2, "elapsed_time": "2 days, 16:13:21", "remaining_time": "4 days, 7:54:29", "throughput": 2724.45, "total_tokens": 629896288} {"current_steps": 3490, "total_steps": 9134, "loss": 0.607, "learning_rate": 3.405037601817119e-05, "epoch": 0.3820575275732779, "percentage": 38.21, "elapsed_time": "2 days, 16:14:30", "remaining_time": "4 days, 7:53:27", "throughput": 2724.54, "total_tokens": 630104384} {"current_steps": 3491, "total_steps": 9134, "loss": 0.6528, "learning_rate": 3.4042360085855654e-05, "epoch": 0.38216699964421574, "percentage": 38.22, "elapsed_time": "2 days, 16:15:39", "remaining_time": "4 days, 7:52:26", "throughput": 2724.67, "total_tokens": 630323456} {"current_steps": 3492, "total_steps": 9134, "loss": 0.6488, "learning_rate": 3.40343430838462e-05, "epoch": 0.38227647171515367, "percentage": 38.23, "elapsed_time": "2 days, 16:16:39", "remaining_time": "4 days, 7:51:11", "throughput": 2724.6, "total_tokens": 630471296} {"current_steps": 3493, "total_steps": 9134, "loss": 0.5574, "learning_rate": 3.4026325013091224e-05, "epoch": 0.3823859437860916, "percentage": 38.24, "elapsed_time": "2 days, 16:17:45", "remaining_time": "4 days, 7:50:03", "throughput": 2724.58, "total_tokens": 630644224} {"current_steps": 3494, "total_steps": 9134, "loss": 0.4858, "learning_rate": 3.4018305874539264e-05, "epoch": 0.38249541585702945, "percentage": 38.25, "elapsed_time": "2 days, 16:18:51", "remaining_time": "4 days, 7:48:56", "throughput": 2724.54, "total_tokens": 630816256} {"current_steps": 3495, "total_steps": 9134, "loss": 0.6602, "learning_rate": 3.401028566913896e-05, "epoch": 0.3826048879279674, "percentage": 38.26, "elapsed_time": "2 days, 16:19:56", "remaining_time": "4 days, 7:47:49", "throughput": 2724.57, "total_tokens": 631001728} {"current_steps": 3496, "total_steps": 9134, "loss": 0.7076, "learning_rate": 3.400226439783908e-05, "epoch": 0.3827143599989053, "percentage": 38.27, "elapsed_time": "2 days, 16:21:02", "remaining_time": "4 days, 7:46:41", "throughput": 2724.5, "total_tokens": 631164800} {"current_steps": 3497, "total_steps": 9134, "loss": 0.7095, "learning_rate": 3.399424206158855e-05, "epoch": 0.38282383206984316, "percentage": 38.29, "elapsed_time": "2 days, 16:22:07", "remaining_time": "4 days, 7:45:33", "throughput": 2724.48, "total_tokens": 631336384} {"current_steps": 3498, "total_steps": 9134, "loss": 0.8616, "learning_rate": 3.3986218661336355e-05, "epoch": 0.3829333041407811, "percentage": 38.3, "elapsed_time": "2 days, 16:23:15", "remaining_time": "4 days, 7:44:31", "throughput": 2724.57, "total_tokens": 631544704} {"current_steps": 3499, "total_steps": 9134, "loss": 0.8851, "learning_rate": 3.397819419803168e-05, "epoch": 0.383042776211719, "percentage": 38.31, "elapsed_time": "2 days, 16:24:23", "remaining_time": "4 days, 7:43:26", "throughput": 2724.57, "total_tokens": 631728608} {"current_steps": 3500, "total_steps": 9134, "loss": 0.684, "learning_rate": 3.397016867262379e-05, "epoch": 0.38315224828265687, "percentage": 38.32, "elapsed_time": "2 days, 16:25:28", "remaining_time": "4 days, 7:42:18", "throughput": 2724.55, "total_tokens": 631898624} {"current_steps": 3501, "total_steps": 9134, "loss": 0.8396, "learning_rate": 3.39621420860621e-05, "epoch": 0.3832617203535948, "percentage": 38.33, "elapsed_time": "2 days, 16:26:36", "remaining_time": "4 days, 7:41:14", "throughput": 2724.49, "total_tokens": 632070656} {"current_steps": 3502, "total_steps": 9134, "loss": 0.6993, "learning_rate": 3.395411443929613e-05, "epoch": 0.3833711924245327, "percentage": 38.34, "elapsed_time": "2 days, 16:27:42", "remaining_time": "4 days, 7:40:08", "throughput": 2724.51, "total_tokens": 632255456} {"current_steps": 3503, "total_steps": 9134, "loss": 0.6201, "learning_rate": 3.394608573327554e-05, "epoch": 0.3834806644954706, "percentage": 38.35, "elapsed_time": "2 days, 16:28:48", "remaining_time": "4 days, 7:39:01", "throughput": 2724.47, "total_tokens": 632425696} {"current_steps": 3504, "total_steps": 9134, "loss": 0.7592, "learning_rate": 3.393805596895011e-05, "epoch": 0.3835901365664085, "percentage": 38.36, "elapsed_time": "2 days, 16:29:54", "remaining_time": "4 days, 7:37:54", "throughput": 2724.38, "total_tokens": 632585632} {"current_steps": 3505, "total_steps": 9134, "loss": 0.9398, "learning_rate": 3.3930025147269746e-05, "epoch": 0.3836996086373464, "percentage": 38.37, "elapsed_time": "2 days, 16:31:00", "remaining_time": "4 days, 7:36:48", "throughput": 2724.34, "total_tokens": 632756544} {"current_steps": 3506, "total_steps": 9134, "loss": 0.675, "learning_rate": 3.3921993269184474e-05, "epoch": 0.3838090807082843, "percentage": 38.38, "elapsed_time": "2 days, 16:32:03", "remaining_time": "4 days, 7:35:37", "throughput": 2724.25, "total_tokens": 632908416} {"current_steps": 3507, "total_steps": 9134, "loss": 0.7226, "learning_rate": 3.391396033564446e-05, "epoch": 0.3839185527792222, "percentage": 38.4, "elapsed_time": "2 days, 16:33:11", "remaining_time": "4 days, 7:34:33", "throughput": 2724.3, "total_tokens": 633104640} {"current_steps": 3508, "total_steps": 9134, "loss": 0.726, "learning_rate": 3.390592634759998e-05, "epoch": 0.3840280248501601, "percentage": 38.41, "elapsed_time": "2 days, 16:34:17", "remaining_time": "4 days, 7:33:27", "throughput": 2724.36, "total_tokens": 633298176} {"current_steps": 3509, "total_steps": 9134, "loss": 0.583, "learning_rate": 3.389789130600144e-05, "epoch": 0.384137496921098, "percentage": 38.42, "elapsed_time": "2 days, 16:35:21", "remaining_time": "4 days, 7:32:16", "throughput": 2724.37, "total_tokens": 633474688} {"current_steps": 3510, "total_steps": 9134, "loss": 0.6932, "learning_rate": 3.388985521179937e-05, "epoch": 0.3842469689920359, "percentage": 38.43, "elapsed_time": "2 days, 16:36:25", "remaining_time": "4 days, 7:31:07", "throughput": 2724.3, "total_tokens": 633633504} {"current_steps": 3511, "total_steps": 9134, "loss": 0.7529, "learning_rate": 3.3881818065944416e-05, "epoch": 0.3843564410629738, "percentage": 38.44, "elapsed_time": "2 days, 16:37:33", "remaining_time": "4 days, 7:30:03", "throughput": 2724.31, "total_tokens": 633821664} {"current_steps": 3512, "total_steps": 9134, "loss": 0.5711, "learning_rate": 3.3873779869387356e-05, "epoch": 0.3844659131339117, "percentage": 38.45, "elapsed_time": "2 days, 16:38:39", "remaining_time": "4 days, 7:28:56", "throughput": 2724.27, "total_tokens": 633989440} {"current_steps": 3513, "total_steps": 9134, "loss": 0.7372, "learning_rate": 3.3865740623079116e-05, "epoch": 0.38457538520484963, "percentage": 38.46, "elapsed_time": "2 days, 16:39:48", "remaining_time": "4 days, 7:27:54", "throughput": 2724.34, "total_tokens": 634195744} {"current_steps": 3514, "total_steps": 9134, "loss": 0.5626, "learning_rate": 3.3857700327970696e-05, "epoch": 0.3846848572757875, "percentage": 38.47, "elapsed_time": "2 days, 16:40:54", "remaining_time": "4 days, 7:26:48", "throughput": 2724.4, "total_tokens": 634389056} {"current_steps": 3515, "total_steps": 9134, "loss": 0.7285, "learning_rate": 3.384965898501327e-05, "epoch": 0.3847943293467254, "percentage": 38.48, "elapsed_time": "2 days, 16:42:00", "remaining_time": "4 days, 7:25:41", "throughput": 2724.46, "total_tokens": 634581920} {"current_steps": 3516, "total_steps": 9134, "loss": 0.6266, "learning_rate": 3.384161659515811e-05, "epoch": 0.38490380141766334, "percentage": 38.49, "elapsed_time": "2 days, 16:43:07", "remaining_time": "4 days, 7:24:36", "throughput": 2724.44, "total_tokens": 634760896} {"current_steps": 3517, "total_steps": 9134, "loss": 0.8768, "learning_rate": 3.38335731593566e-05, "epoch": 0.3850132734886012, "percentage": 38.5, "elapsed_time": "2 days, 16:44:10", "remaining_time": "4 days, 7:23:24", "throughput": 2724.45, "total_tokens": 634932704} {"current_steps": 3518, "total_steps": 9134, "loss": 0.5249, "learning_rate": 3.382552867856027e-05, "epoch": 0.3851227455595391, "percentage": 38.52, "elapsed_time": "2 days, 16:45:15", "remaining_time": "4 days, 7:22:16", "throughput": 2724.35, "total_tokens": 635088160} {"current_steps": 3519, "total_steps": 9134, "loss": 0.7001, "learning_rate": 3.381748315372077e-05, "epoch": 0.38523221763047705, "percentage": 38.53, "elapsed_time": "2 days, 16:46:20", "remaining_time": "4 days, 7:21:08", "throughput": 2724.31, "total_tokens": 635257056} {"current_steps": 3520, "total_steps": 9134, "loss": 0.6903, "learning_rate": 3.380943658578987e-05, "epoch": 0.3853416897014149, "percentage": 38.54, "elapsed_time": "2 days, 16:47:26", "remaining_time": "4 days, 7:20:01", "throughput": 2724.33, "total_tokens": 635440064} {"current_steps": 3521, "total_steps": 9134, "loss": 0.691, "learning_rate": 3.380138897571946e-05, "epoch": 0.38545116177235283, "percentage": 38.55, "elapsed_time": "2 days, 16:48:34", "remaining_time": "4 days, 7:18:57", "throughput": 2724.26, "total_tokens": 635608288} {"current_steps": 3522, "total_steps": 9134, "loss": 0.6702, "learning_rate": 3.379334032446157e-05, "epoch": 0.38556063384329076, "percentage": 38.56, "elapsed_time": "2 days, 16:49:39", "remaining_time": "4 days, 7:17:49", "throughput": 2724.21, "total_tokens": 635775168} {"current_steps": 3523, "total_steps": 9134, "loss": 0.7594, "learning_rate": 3.378529063296832e-05, "epoch": 0.3856701059142286, "percentage": 38.57, "elapsed_time": "2 days, 16:50:45", "remaining_time": "4 days, 7:16:43", "throughput": 2724.25, "total_tokens": 635963776} {"current_steps": 3524, "total_steps": 9134, "loss": 0.5231, "learning_rate": 3.377723990219198e-05, "epoch": 0.38577957798516654, "percentage": 38.58, "elapsed_time": "2 days, 16:51:52", "remaining_time": "4 days, 7:15:37", "throughput": 2724.22, "total_tokens": 636139840} {"current_steps": 3525, "total_steps": 9134, "loss": 0.6448, "learning_rate": 3.376918813308495e-05, "epoch": 0.3858890500561044, "percentage": 38.59, "elapsed_time": "2 days, 16:53:00", "remaining_time": "4 days, 7:14:34", "throughput": 2724.11, "total_tokens": 636298656} {"current_steps": 3526, "total_steps": 9134, "loss": 0.5687, "learning_rate": 3.3761135326599716e-05, "epoch": 0.38599852212704233, "percentage": 38.6, "elapsed_time": "2 days, 16:54:03", "remaining_time": "4 days, 7:13:22", "throughput": 2724.01, "total_tokens": 636446496} {"current_steps": 3527, "total_steps": 9134, "loss": 0.648, "learning_rate": 3.375308148368893e-05, "epoch": 0.38610799419798025, "percentage": 38.61, "elapsed_time": "2 days, 16:55:09", "remaining_time": "4 days, 7:12:16", "throughput": 2723.97, "total_tokens": 636618528} {"current_steps": 3528, "total_steps": 9134, "loss": 0.6723, "learning_rate": 3.374502660530534e-05, "epoch": 0.3862174662689181, "percentage": 38.62, "elapsed_time": "2 days, 16:56:15", "remaining_time": "4 days, 7:11:09", "throughput": 2723.97, "total_tokens": 636798176} {"current_steps": 3529, "total_steps": 9134, "loss": 0.6954, "learning_rate": 3.373697069240181e-05, "epoch": 0.38632693833985604, "percentage": 38.64, "elapsed_time": "2 days, 16:57:24", "remaining_time": "4 days, 7:10:08", "throughput": 2724.03, "total_tokens": 636998880} {"current_steps": 3530, "total_steps": 9134, "loss": 0.6488, "learning_rate": 3.3728913745931356e-05, "epoch": 0.38643641041079396, "percentage": 38.65, "elapsed_time": "2 days, 16:58:28", "remaining_time": "4 days, 7:08:57", "throughput": 2724.01, "total_tokens": 637168224} {"current_steps": 3531, "total_steps": 9134, "loss": 0.8162, "learning_rate": 3.372085576684709e-05, "epoch": 0.38654588248173183, "percentage": 38.66, "elapsed_time": "2 days, 16:59:37", "remaining_time": "4 days, 7:07:55", "throughput": 2724.08, "total_tokens": 637372960} {"current_steps": 3532, "total_steps": 9134, "loss": 0.6996, "learning_rate": 3.371279675610226e-05, "epoch": 0.38665535455266975, "percentage": 38.67, "elapsed_time": "2 days, 17:00:39", "remaining_time": "4 days, 7:06:42", "throughput": 2724.04, "total_tokens": 637532224} {"current_steps": 3533, "total_steps": 9134, "loss": 0.6445, "learning_rate": 3.370473671465022e-05, "epoch": 0.38676482662360767, "percentage": 38.68, "elapsed_time": "2 days, 17:01:41", "remaining_time": "4 days, 7:05:29", "throughput": 2724.0, "total_tokens": 637691264} {"current_steps": 3534, "total_steps": 9134, "loss": 0.838, "learning_rate": 3.369667564344449e-05, "epoch": 0.38687429869454554, "percentage": 38.69, "elapsed_time": "2 days, 17:02:41", "remaining_time": "4 days, 7:04:13", "throughput": 2723.92, "total_tokens": 637835744} {"current_steps": 3535, "total_steps": 9134, "loss": 0.8217, "learning_rate": 3.368861354343863e-05, "epoch": 0.38698377076548346, "percentage": 38.7, "elapsed_time": "2 days, 17:03:43", "remaining_time": "4 days, 7:03:00", "throughput": 2723.92, "total_tokens": 638006432} {"current_steps": 3536, "total_steps": 9134, "loss": 0.7862, "learning_rate": 3.3680550415586416e-05, "epoch": 0.3870932428364214, "percentage": 38.71, "elapsed_time": "2 days, 17:04:50", "remaining_time": "4 days, 7:01:56", "throughput": 2723.98, "total_tokens": 638203104} {"current_steps": 3537, "total_steps": 9134, "loss": 0.6576, "learning_rate": 3.367248626084168e-05, "epoch": 0.38720271490735925, "percentage": 38.72, "elapsed_time": "2 days, 17:05:58", "remaining_time": "4 days, 7:00:52", "throughput": 2724.02, "total_tokens": 638397088} {"current_steps": 3538, "total_steps": 9134, "loss": 0.8003, "learning_rate": 3.3664421080158394e-05, "epoch": 0.38731218697829717, "percentage": 38.73, "elapsed_time": "2 days, 17:07:04", "remaining_time": "4 days, 6:59:44", "throughput": 2723.97, "total_tokens": 638563968} {"current_steps": 3539, "total_steps": 9134, "loss": 0.7296, "learning_rate": 3.365635487449065e-05, "epoch": 0.3874216590492351, "percentage": 38.75, "elapsed_time": "2 days, 17:08:10", "remaining_time": "4 days, 6:58:38", "throughput": 2723.97, "total_tokens": 638744288} {"current_steps": 3540, "total_steps": 9134, "loss": 0.7647, "learning_rate": 3.364828764479269e-05, "epoch": 0.38753113112017296, "percentage": 38.76, "elapsed_time": "2 days, 17:09:16", "remaining_time": "4 days, 6:57:32", "throughput": 2723.99, "total_tokens": 638930432} {"current_steps": 3541, "total_steps": 9134, "loss": 0.9648, "learning_rate": 3.3640219392018824e-05, "epoch": 0.3876406031911109, "percentage": 38.77, "elapsed_time": "2 days, 17:10:25", "remaining_time": "4 days, 6:56:30", "throughput": 2724.1, "total_tokens": 639144352} {"current_steps": 3542, "total_steps": 9134, "loss": 0.5847, "learning_rate": 3.3632150117123524e-05, "epoch": 0.38775007526204874, "percentage": 38.78, "elapsed_time": "2 days, 17:11:31", "remaining_time": "4 days, 6:55:24", "throughput": 2724.07, "total_tokens": 639315712} {"current_steps": 3543, "total_steps": 9134, "loss": 0.7576, "learning_rate": 3.362407982106136e-05, "epoch": 0.38785954733298666, "percentage": 38.79, "elapsed_time": "2 days, 17:12:36", "remaining_time": "4 days, 6:54:15", "throughput": 2724.01, "total_tokens": 639479456} {"current_steps": 3544, "total_steps": 9134, "loss": 0.5505, "learning_rate": 3.361600850478704e-05, "epoch": 0.3879690194039246, "percentage": 38.8, "elapsed_time": "2 days, 17:13:42", "remaining_time": "4 days, 6:53:08", "throughput": 2724.01, "total_tokens": 639658208} {"current_steps": 3545, "total_steps": 9134, "loss": 0.7474, "learning_rate": 3.3607936169255396e-05, "epoch": 0.38807849147486245, "percentage": 38.81, "elapsed_time": "2 days, 17:14:49", "remaining_time": "4 days, 6:52:03", "throughput": 2724.03, "total_tokens": 639846368} {"current_steps": 3546, "total_steps": 9134, "loss": 0.6702, "learning_rate": 3.359986281542135e-05, "epoch": 0.3881879635458004, "percentage": 38.82, "elapsed_time": "2 days, 17:15:57", "remaining_time": "4 days, 6:51:00", "throughput": 2724.08, "total_tokens": 640042368} {"current_steps": 3547, "total_steps": 9134, "loss": 0.7807, "learning_rate": 3.359178844423998e-05, "epoch": 0.3882974356167383, "percentage": 38.83, "elapsed_time": "2 days, 17:17:02", "remaining_time": "4 days, 6:49:52", "throughput": 2723.98, "total_tokens": 640197824} {"current_steps": 3548, "total_steps": 9134, "loss": 0.5957, "learning_rate": 3.3583713056666454e-05, "epoch": 0.38840690768767616, "percentage": 38.84, "elapsed_time": "2 days, 17:18:11", "remaining_time": "4 days, 6:48:49", "throughput": 2723.96, "total_tokens": 640378592} {"current_steps": 3549, "total_steps": 9134, "loss": 0.8118, "learning_rate": 3.3575636653656094e-05, "epoch": 0.3885163797586141, "percentage": 38.85, "elapsed_time": "2 days, 17:19:17", "remaining_time": "4 days, 6:47:43", "throughput": 2724.03, "total_tokens": 640575936} {"current_steps": 3550, "total_steps": 9134, "loss": 0.6425, "learning_rate": 3.35675592361643e-05, "epoch": 0.388625851829552, "percentage": 38.87, "elapsed_time": "2 days, 17:20:23", "remaining_time": "4 days, 6:46:37", "throughput": 2724.05, "total_tokens": 640761856} {"current_steps": 3551, "total_steps": 9134, "loss": 0.9478, "learning_rate": 3.3559480805146634e-05, "epoch": 0.38873532390048987, "percentage": 38.88, "elapsed_time": "2 days, 17:21:29", "remaining_time": "4 days, 6:45:30", "throughput": 2724.12, "total_tokens": 640956512} {"current_steps": 3552, "total_steps": 9134, "loss": 0.6906, "learning_rate": 3.355140136155875e-05, "epoch": 0.3888447959714278, "percentage": 38.89, "elapsed_time": "2 days, 17:22:32", "remaining_time": "4 days, 6:44:19", "throughput": 2724.1, "total_tokens": 641124288} {"current_steps": 3553, "total_steps": 9134, "loss": 0.6998, "learning_rate": 3.354332090635643e-05, "epoch": 0.3889542680423657, "percentage": 38.9, "elapsed_time": "2 days, 17:23:41", "remaining_time": "4 days, 6:43:16", "throughput": 2724.09, "total_tokens": 641308416} {"current_steps": 3554, "total_steps": 9134, "loss": 0.6442, "learning_rate": 3.353523944049558e-05, "epoch": 0.3890637401133036, "percentage": 38.91, "elapsed_time": "2 days, 17:24:49", "remaining_time": "4 days, 6:42:13", "throughput": 2724.08, "total_tokens": 641491872} {"current_steps": 3555, "total_steps": 9134, "loss": 0.7195, "learning_rate": 3.352715696493222e-05, "epoch": 0.3891732121842415, "percentage": 38.92, "elapsed_time": "2 days, 17:25:51", "remaining_time": "4 days, 6:41:00", "throughput": 2724.0, "total_tokens": 641643520} {"current_steps": 3556, "total_steps": 9134, "loss": 0.6733, "learning_rate": 3.3519073480622495e-05, "epoch": 0.3892826842551794, "percentage": 38.93, "elapsed_time": "2 days, 17:27:00", "remaining_time": "4 days, 6:39:58", "throughput": 2724.08, "total_tokens": 641850272} {"current_steps": 3557, "total_steps": 9134, "loss": 0.8, "learning_rate": 3.351098898852266e-05, "epoch": 0.3893921563261173, "percentage": 38.94, "elapsed_time": "2 days, 17:28:08", "remaining_time": "4 days, 6:38:54", "throughput": 2724.03, "total_tokens": 642023200} {"current_steps": 3558, "total_steps": 9134, "loss": 0.7061, "learning_rate": 3.35029034895891e-05, "epoch": 0.3895016283970552, "percentage": 38.95, "elapsed_time": "2 days, 17:29:17", "remaining_time": "4 days, 6:37:52", "throughput": 2724.05, "total_tokens": 642213600} {"current_steps": 3559, "total_steps": 9134, "loss": 0.6759, "learning_rate": 3.349481698477831e-05, "epoch": 0.3896111004679931, "percentage": 38.96, "elapsed_time": "2 days, 17:30:22", "remaining_time": "4 days, 6:36:44", "throughput": 2723.98, "total_tokens": 642375328} {"current_steps": 3560, "total_steps": 9134, "loss": 0.7953, "learning_rate": 3.348672947504691e-05, "epoch": 0.389720572538931, "percentage": 38.98, "elapsed_time": "2 days, 17:31:26", "remaining_time": "4 days, 6:35:35", "throughput": 2723.99, "total_tokens": 642554976} {"current_steps": 3561, "total_steps": 9134, "loss": 0.596, "learning_rate": 3.3478640961351635e-05, "epoch": 0.3898300446098689, "percentage": 38.99, "elapsed_time": "2 days, 17:32:33", "remaining_time": "4 days, 6:34:30", "throughput": 2723.98, "total_tokens": 642734176} {"current_steps": 3562, "total_steps": 9134, "loss": 0.696, "learning_rate": 3.3470551444649346e-05, "epoch": 0.3899395166808068, "percentage": 39.0, "elapsed_time": "2 days, 17:33:42", "remaining_time": "4 days, 6:33:28", "throughput": 2723.91, "total_tokens": 642904864} {"current_steps": 3563, "total_steps": 9134, "loss": 0.7262, "learning_rate": 3.346246092589702e-05, "epoch": 0.3900489887517447, "percentage": 39.01, "elapsed_time": "2 days, 17:34:51", "remaining_time": "4 days, 6:32:26", "throughput": 2723.91, "total_tokens": 643093696} {"current_steps": 3564, "total_steps": 9134, "loss": 0.7172, "learning_rate": 3.3454369406051736e-05, "epoch": 0.39015846082268263, "percentage": 39.02, "elapsed_time": "2 days, 17:35:56", "remaining_time": "4 days, 6:31:17", "throughput": 2723.82, "total_tokens": 643247808} {"current_steps": 3565, "total_steps": 9134, "loss": 0.755, "learning_rate": 3.344627688607071e-05, "epoch": 0.3902679328936205, "percentage": 39.03, "elapsed_time": "2 days, 17:37:01", "remaining_time": "4 days, 6:30:09", "throughput": 2723.78, "total_tokens": 643417152} {"current_steps": 3566, "total_steps": 9134, "loss": 0.7633, "learning_rate": 3.343818336691128e-05, "epoch": 0.3903774049645584, "percentage": 39.04, "elapsed_time": "2 days, 17:38:08", "remaining_time": "4 days, 6:29:04", "throughput": 2723.84, "total_tokens": 643612928} {"current_steps": 3567, "total_steps": 9134, "loss": 0.8775, "learning_rate": 3.3430088849530886e-05, "epoch": 0.39048687703549634, "percentage": 39.05, "elapsed_time": "2 days, 17:39:18", "remaining_time": "4 days, 6:28:03", "throughput": 2723.87, "total_tokens": 643809600} {"current_steps": 3568, "total_steps": 9134, "loss": 0.8137, "learning_rate": 3.34219933348871e-05, "epoch": 0.3905963491064342, "percentage": 39.06, "elapsed_time": "2 days, 17:40:22", "remaining_time": "4 days, 6:26:54", "throughput": 2723.91, "total_tokens": 643994400} {"current_steps": 3569, "total_steps": 9134, "loss": 0.5446, "learning_rate": 3.34138968239376e-05, "epoch": 0.3907058211773721, "percentage": 39.07, "elapsed_time": "2 days, 17:41:30", "remaining_time": "4 days, 6:25:49", "throughput": 2723.93, "total_tokens": 644182784} {"current_steps": 3570, "total_steps": 9134, "loss": 0.5222, "learning_rate": 3.3405799317640196e-05, "epoch": 0.39081529324831005, "percentage": 39.08, "elapsed_time": "2 days, 17:42:38", "remaining_time": "4 days, 6:24:46", "throughput": 2724.0, "total_tokens": 644384832} {"current_steps": 3571, "total_steps": 9134, "loss": 0.7357, "learning_rate": 3.3397700816952795e-05, "epoch": 0.3909247653192479, "percentage": 39.1, "elapsed_time": "2 days, 17:43:45", "remaining_time": "4 days, 6:23:41", "throughput": 2723.91, "total_tokens": 644547008} {"current_steps": 3572, "total_steps": 9134, "loss": 0.7655, "learning_rate": 3.3389601322833454e-05, "epoch": 0.39103423739018583, "percentage": 39.11, "elapsed_time": "2 days, 17:44:50", "remaining_time": "4 days, 6:22:33", "throughput": 2723.84, "total_tokens": 644707616} {"current_steps": 3573, "total_steps": 9134, "loss": 0.6157, "learning_rate": 3.3381500836240296e-05, "epoch": 0.39114370946112376, "percentage": 39.12, "elapsed_time": "2 days, 17:45:53", "remaining_time": "4 days, 6:21:22", "throughput": 2723.81, "total_tokens": 644873152} {"current_steps": 3574, "total_steps": 9134, "loss": 0.6822, "learning_rate": 3.337339935813163e-05, "epoch": 0.3912531815320616, "percentage": 39.13, "elapsed_time": "2 days, 17:46:57", "remaining_time": "4 days, 6:20:11", "throughput": 2723.8, "total_tokens": 645043168} {"current_steps": 3575, "total_steps": 9134, "loss": 0.5988, "learning_rate": 3.3365296889465814e-05, "epoch": 0.39136265360299954, "percentage": 39.14, "elapsed_time": "2 days, 17:48:02", "remaining_time": "4 days, 6:19:04", "throughput": 2723.91, "total_tokens": 645246112} {"current_steps": 3576, "total_steps": 9134, "loss": 0.6227, "learning_rate": 3.3357193431201374e-05, "epoch": 0.3914721256739374, "percentage": 39.15, "elapsed_time": "2 days, 17:49:09", "remaining_time": "4 days, 6:17:58", "throughput": 2723.97, "total_tokens": 645443232} {"current_steps": 3577, "total_steps": 9134, "loss": 0.7044, "learning_rate": 3.3349088984296916e-05, "epoch": 0.39158159774487533, "percentage": 39.16, "elapsed_time": "2 days, 17:50:13", "remaining_time": "4 days, 6:16:49", "throughput": 2723.97, "total_tokens": 645619296} {"current_steps": 3578, "total_steps": 9134, "loss": 0.6025, "learning_rate": 3.33409835497112e-05, "epoch": 0.39169106981581325, "percentage": 39.17, "elapsed_time": "2 days, 17:51:21", "remaining_time": "4 days, 6:15:45", "throughput": 2724.0, "total_tokens": 645810816} {"current_steps": 3579, "total_steps": 9134, "loss": 0.5436, "learning_rate": 3.333287712840308e-05, "epoch": 0.3918005418867511, "percentage": 39.18, "elapsed_time": "2 days, 17:52:24", "remaining_time": "4 days, 6:14:34", "throughput": 2723.94, "total_tokens": 645967616} {"current_steps": 3580, "total_steps": 9134, "loss": 0.6143, "learning_rate": 3.3324769721331515e-05, "epoch": 0.39191001395768904, "percentage": 39.19, "elapsed_time": "2 days, 17:53:25", "remaining_time": "4 days, 6:13:19", "throughput": 2723.8, "total_tokens": 646097984} {"current_steps": 3581, "total_steps": 9134, "loss": 0.7269, "learning_rate": 3.331666132945562e-05, "epoch": 0.39201948602862696, "percentage": 39.21, "elapsed_time": "2 days, 17:54:30", "remaining_time": "4 days, 6:12:11", "throughput": 2723.75, "total_tokens": 646266656} {"current_steps": 3582, "total_steps": 9134, "loss": 0.7231, "learning_rate": 3.3308551953734576e-05, "epoch": 0.39212895809956483, "percentage": 39.22, "elapsed_time": "2 days, 17:55:36", "remaining_time": "4 days, 6:11:05", "throughput": 2723.74, "total_tokens": 646443168} {"current_steps": 3583, "total_steps": 9134, "loss": 0.6935, "learning_rate": 3.330044159512773e-05, "epoch": 0.39223843017050275, "percentage": 39.23, "elapsed_time": "2 days, 17:56:42", "remaining_time": "4 days, 6:09:58", "throughput": 2723.8, "total_tokens": 646636928} {"current_steps": 3584, "total_steps": 9134, "loss": 0.6439, "learning_rate": 3.3292330254594504e-05, "epoch": 0.39234790224144067, "percentage": 39.24, "elapsed_time": "2 days, 17:57:44", "remaining_time": "4 days, 6:08:45", "throughput": 2723.79, "total_tokens": 646803360} {"current_steps": 3585, "total_steps": 9134, "loss": 0.6084, "learning_rate": 3.3284217933094465e-05, "epoch": 0.39245737431237854, "percentage": 39.25, "elapsed_time": "2 days, 17:58:51", "remaining_time": "4 days, 6:07:39", "throughput": 2723.86, "total_tokens": 647002272} {"current_steps": 3586, "total_steps": 9134, "loss": 0.7016, "learning_rate": 3.3276104631587274e-05, "epoch": 0.39256684638331646, "percentage": 39.26, "elapsed_time": "2 days, 17:59:56", "remaining_time": "4 days, 6:06:32", "throughput": 2723.9, "total_tokens": 647190432} {"current_steps": 3587, "total_steps": 9134, "loss": 0.7, "learning_rate": 3.326799035103273e-05, "epoch": 0.3926763184542544, "percentage": 39.27, "elapsed_time": "2 days, 18:00:59", "remaining_time": "4 days, 6:05:21", "throughput": 2723.85, "total_tokens": 647349696} {"current_steps": 3588, "total_steps": 9134, "loss": 0.6261, "learning_rate": 3.325987509239074e-05, "epoch": 0.39278579052519225, "percentage": 39.28, "elapsed_time": "2 days, 18:02:08", "remaining_time": "4 days, 6:04:19", "throughput": 2723.89, "total_tokens": 647548160} {"current_steps": 3589, "total_steps": 9134, "loss": 0.6884, "learning_rate": 3.3251758856621303e-05, "epoch": 0.39289526259613017, "percentage": 39.29, "elapsed_time": "2 days, 18:03:16", "remaining_time": "4 days, 6:03:14", "throughput": 2723.87, "total_tokens": 647726016} {"current_steps": 3590, "total_steps": 9134, "loss": 0.5285, "learning_rate": 3.324364164468458e-05, "epoch": 0.3930047346670681, "percentage": 39.3, "elapsed_time": "2 days, 18:04:24", "remaining_time": "4 days, 6:02:11", "throughput": 2723.91, "total_tokens": 647920224} {"current_steps": 3591, "total_steps": 9134, "loss": 0.6309, "learning_rate": 3.3235523457540805e-05, "epoch": 0.39311420673800596, "percentage": 39.31, "elapsed_time": "2 days, 18:05:29", "remaining_time": "4 days, 6:01:02", "throughput": 2723.91, "total_tokens": 648098752} {"current_steps": 3592, "total_steps": 9134, "loss": 0.6196, "learning_rate": 3.322740429615035e-05, "epoch": 0.3932236788089439, "percentage": 39.33, "elapsed_time": "2 days, 18:06:36", "remaining_time": "4 days, 5:59:58", "throughput": 2723.91, "total_tokens": 648280864} {"current_steps": 3593, "total_steps": 9134, "loss": 0.8418, "learning_rate": 3.32192841614737e-05, "epoch": 0.39333315087988174, "percentage": 39.34, "elapsed_time": "2 days, 18:07:42", "remaining_time": "4 days, 5:58:51", "throughput": 2723.93, "total_tokens": 648464768} {"current_steps": 3594, "total_steps": 9134, "loss": 0.5551, "learning_rate": 3.321116305447143e-05, "epoch": 0.39344262295081966, "percentage": 39.35, "elapsed_time": "2 days, 18:08:46", "remaining_time": "4 days, 5:57:42", "throughput": 2723.89, "total_tokens": 648630528} {"current_steps": 3595, "total_steps": 9134, "loss": 0.6282, "learning_rate": 3.3203040976104285e-05, "epoch": 0.3935520950217576, "percentage": 39.36, "elapsed_time": "2 days, 18:09:54", "remaining_time": "4 days, 5:56:38", "throughput": 2723.92, "total_tokens": 648822048} {"current_steps": 3596, "total_steps": 9134, "loss": 0.7658, "learning_rate": 3.319491792733307e-05, "epoch": 0.39366156709269545, "percentage": 39.37, "elapsed_time": "2 days, 18:10:57", "remaining_time": "4 days, 5:55:27", "throughput": 2723.93, "total_tokens": 648998336} {"current_steps": 3597, "total_steps": 9134, "loss": 0.9055, "learning_rate": 3.318679390911873e-05, "epoch": 0.3937710391636334, "percentage": 39.38, "elapsed_time": "2 days, 18:12:06", "remaining_time": "4 days, 5:54:25", "throughput": 2723.99, "total_tokens": 649200608} {"current_steps": 3598, "total_steps": 9134, "loss": 0.6582, "learning_rate": 3.317866892242231e-05, "epoch": 0.3938805112345713, "percentage": 39.39, "elapsed_time": "2 days, 18:13:10", "remaining_time": "4 days, 5:53:15", "throughput": 2723.95, "total_tokens": 649363008} {"current_steps": 3599, "total_steps": 9134, "loss": 0.8219, "learning_rate": 3.3170542968205e-05, "epoch": 0.39398998330550916, "percentage": 39.4, "elapsed_time": "2 days, 18:14:18", "remaining_time": "4 days, 5:52:12", "throughput": 2724.0, "total_tokens": 649561248} {"current_steps": 3600, "total_steps": 9134, "loss": 0.7225, "learning_rate": 3.316241604742807e-05, "epoch": 0.3940994553764471, "percentage": 39.41, "elapsed_time": "2 days, 18:15:21", "remaining_time": "4 days, 5:51:00", "throughput": 2723.93, "total_tokens": 649715136} {"current_steps": 3601, "total_steps": 9134, "loss": 0.8177, "learning_rate": 3.3154288161052936e-05, "epoch": 0.394208927447385, "percentage": 39.42, "elapsed_time": "2 days, 18:16:27", "remaining_time": "4 days, 5:49:53", "throughput": 2723.94, "total_tokens": 649896576} {"current_steps": 3602, "total_steps": 9134, "loss": 0.6565, "learning_rate": 3.3146159310041095e-05, "epoch": 0.39431839951832287, "percentage": 39.44, "elapsed_time": "2 days, 18:17:34", "remaining_time": "4 days, 5:48:48", "throughput": 2723.99, "total_tokens": 650093024} {"current_steps": 3603, "total_steps": 9134, "loss": 0.9172, "learning_rate": 3.3138029495354184e-05, "epoch": 0.3944278715892608, "percentage": 39.45, "elapsed_time": "2 days, 18:18:40", "remaining_time": "4 days, 5:47:41", "throughput": 2724.0, "total_tokens": 650274912} {"current_steps": 3604, "total_steps": 9134, "loss": 0.6353, "learning_rate": 3.3129898717953946e-05, "epoch": 0.3945373436601987, "percentage": 39.46, "elapsed_time": "2 days, 18:19:45", "remaining_time": "4 days, 5:46:33", "throughput": 2724.05, "total_tokens": 650463296} {"current_steps": 3605, "total_steps": 9134, "loss": 0.661, "learning_rate": 3.312176697880222e-05, "epoch": 0.3946468157311366, "percentage": 39.47, "elapsed_time": "2 days, 18:20:52", "remaining_time": "4 days, 5:45:29", "throughput": 2724.0, "total_tokens": 650634208} {"current_steps": 3606, "total_steps": 9134, "loss": 0.6968, "learning_rate": 3.3113634278860994e-05, "epoch": 0.3947562878020745, "percentage": 39.48, "elapsed_time": "2 days, 18:22:01", "remaining_time": "4 days, 5:44:26", "throughput": 2723.99, "total_tokens": 650821024} {"current_steps": 3607, "total_steps": 9134, "loss": 0.8367, "learning_rate": 3.310550061909233e-05, "epoch": 0.3948657598730124, "percentage": 39.49, "elapsed_time": "2 days, 18:23:05", "remaining_time": "4 days, 5:43:17", "throughput": 2723.97, "total_tokens": 650989472} {"current_steps": 3608, "total_steps": 9134, "loss": 0.5892, "learning_rate": 3.3097366000458454e-05, "epoch": 0.3949752319439503, "percentage": 39.5, "elapsed_time": "2 days, 18:24:09", "remaining_time": "4 days, 5:42:08", "throughput": 2723.96, "total_tokens": 651161952} {"current_steps": 3609, "total_steps": 9134, "loss": 0.6177, "learning_rate": 3.308923042392165e-05, "epoch": 0.3950847040148882, "percentage": 39.51, "elapsed_time": "2 days, 18:25:15", "remaining_time": "4 days, 5:41:00", "throughput": 2723.92, "total_tokens": 651331072} {"current_steps": 3610, "total_steps": 9134, "loss": 0.6569, "learning_rate": 3.308109389044436e-05, "epoch": 0.3951941760858261, "percentage": 39.52, "elapsed_time": "2 days, 18:26:21", "remaining_time": "4 days, 5:39:54", "throughput": 2723.87, "total_tokens": 651499296} {"current_steps": 3611, "total_steps": 9134, "loss": 0.5741, "learning_rate": 3.3072956400989103e-05, "epoch": 0.395303648156764, "percentage": 39.53, "elapsed_time": "2 days, 18:27:25", "remaining_time": "4 days, 5:38:44", "throughput": 2723.86, "total_tokens": 651671552} {"current_steps": 3612, "total_steps": 9134, "loss": 0.7297, "learning_rate": 3.306481795651854e-05, "epoch": 0.3954131202277019, "percentage": 39.54, "elapsed_time": "2 days, 18:28:32", "remaining_time": "4 days, 5:37:39", "throughput": 2723.81, "total_tokens": 651842016} {"current_steps": 3613, "total_steps": 9134, "loss": 0.5838, "learning_rate": 3.3056678557995434e-05, "epoch": 0.3955225922986398, "percentage": 39.56, "elapsed_time": "2 days, 18:29:36", "remaining_time": "4 days, 5:36:30", "throughput": 2723.76, "total_tokens": 652005536} {"current_steps": 3614, "total_steps": 9134, "loss": 0.5869, "learning_rate": 3.3048538206382645e-05, "epoch": 0.3956320643695777, "percentage": 39.57, "elapsed_time": "2 days, 18:30:38", "remaining_time": "4 days, 5:35:16", "throughput": 2723.68, "total_tokens": 652154272} {"current_steps": 3615, "total_steps": 9134, "loss": 0.6406, "learning_rate": 3.3040396902643186e-05, "epoch": 0.39574153644051563, "percentage": 39.58, "elapsed_time": "2 days, 18:31:43", "remaining_time": "4 days, 5:34:08", "throughput": 2723.63, "total_tokens": 652318240} {"current_steps": 3616, "total_steps": 9134, "loss": 0.6463, "learning_rate": 3.3032254647740135e-05, "epoch": 0.3958510085114535, "percentage": 39.59, "elapsed_time": "2 days, 18:32:47", "remaining_time": "4 days, 5:32:59", "throughput": 2723.59, "total_tokens": 652484448} {"current_steps": 3617, "total_steps": 9134, "loss": 0.63, "learning_rate": 3.3024111442636716e-05, "epoch": 0.3959604805823914, "percentage": 39.6, "elapsed_time": "2 days, 18:33:53", "remaining_time": "4 days, 5:31:52", "throughput": 2723.52, "total_tokens": 652647968} {"current_steps": 3618, "total_steps": 9134, "loss": 0.7043, "learning_rate": 3.3015967288296256e-05, "epoch": 0.39606995265332934, "percentage": 39.61, "elapsed_time": "2 days, 18:34:55", "remaining_time": "4 days, 5:30:39", "throughput": 2723.48, "total_tokens": 652804992} {"current_steps": 3619, "total_steps": 9134, "loss": 0.6614, "learning_rate": 3.300782218568218e-05, "epoch": 0.3961794247242672, "percentage": 39.62, "elapsed_time": "2 days, 18:36:03", "remaining_time": "4 days, 5:29:36", "throughput": 2723.54, "total_tokens": 653006368} {"current_steps": 3620, "total_steps": 9134, "loss": 0.5085, "learning_rate": 3.299967613575806e-05, "epoch": 0.3962888967952051, "percentage": 39.63, "elapsed_time": "2 days, 18:37:10", "remaining_time": "4 days, 5:28:30", "throughput": 2723.6, "total_tokens": 653202144} {"current_steps": 3621, "total_steps": 9134, "loss": 0.7079, "learning_rate": 3.299152913948754e-05, "epoch": 0.39639836886614305, "percentage": 39.64, "elapsed_time": "2 days, 18:38:14", "remaining_time": "4 days, 5:27:20", "throughput": 2723.57, "total_tokens": 653367904} {"current_steps": 3622, "total_steps": 9134, "loss": 0.6152, "learning_rate": 3.298338119783439e-05, "epoch": 0.3965078409370809, "percentage": 39.65, "elapsed_time": "2 days, 18:39:23", "remaining_time": "4 days, 5:26:19", "throughput": 2723.66, "total_tokens": 653579584} {"current_steps": 3623, "total_steps": 9134, "loss": 0.6164, "learning_rate": 3.297523231176253e-05, "epoch": 0.39661731300801883, "percentage": 39.66, "elapsed_time": "2 days, 18:40:26", "remaining_time": "4 days, 5:25:08", "throughput": 2723.61, "total_tokens": 653740192} {"current_steps": 3624, "total_steps": 9134, "loss": 0.7469, "learning_rate": 3.296708248223592e-05, "epoch": 0.39672678507895676, "percentage": 39.68, "elapsed_time": "2 days, 18:41:33", "remaining_time": "4 days, 5:24:02", "throughput": 2723.6, "total_tokens": 653919168} {"current_steps": 3625, "total_steps": 9134, "loss": 0.7527, "learning_rate": 3.295893171021868e-05, "epoch": 0.3968362571498946, "percentage": 39.69, "elapsed_time": "2 days, 18:42:39", "remaining_time": "4 days, 5:22:55", "throughput": 2723.58, "total_tokens": 654093888} {"current_steps": 3626, "total_steps": 9134, "loss": 0.7998, "learning_rate": 3.295077999667504e-05, "epoch": 0.39694572922083254, "percentage": 39.7, "elapsed_time": "2 days, 18:43:46", "remaining_time": "4 days, 5:21:51", "throughput": 2723.69, "total_tokens": 654303776} {"current_steps": 3627, "total_steps": 9134, "loss": 0.5605, "learning_rate": 3.294262734256933e-05, "epoch": 0.3970552012917704, "percentage": 39.71, "elapsed_time": "2 days, 18:44:50", "remaining_time": "4 days, 5:20:41", "throughput": 2723.67, "total_tokens": 654472000} {"current_steps": 3628, "total_steps": 9134, "loss": 0.5277, "learning_rate": 3.2934473748865976e-05, "epoch": 0.39716467336270833, "percentage": 39.72, "elapsed_time": "2 days, 18:45:54", "remaining_time": "4 days, 5:19:31", "throughput": 2723.63, "total_tokens": 654634400} {"current_steps": 3629, "total_steps": 9134, "loss": 0.7428, "learning_rate": 3.292631921652955e-05, "epoch": 0.39727414543364625, "percentage": 39.73, "elapsed_time": "2 days, 18:47:03", "remaining_time": "4 days, 5:18:29", "throughput": 2723.63, "total_tokens": 654824576} {"current_steps": 3630, "total_steps": 9134, "loss": 0.6288, "learning_rate": 3.2918163746524714e-05, "epoch": 0.3973836175045841, "percentage": 39.74, "elapsed_time": "2 days, 18:48:09", "remaining_time": "4 days, 5:17:23", "throughput": 2723.57, "total_tokens": 654989888} {"current_steps": 3631, "total_steps": 9134, "loss": 0.7729, "learning_rate": 3.291000733981624e-05, "epoch": 0.39749308957552204, "percentage": 39.75, "elapsed_time": "2 days, 18:49:18", "remaining_time": "4 days, 5:16:20", "throughput": 2723.57, "total_tokens": 655178272} {"current_steps": 3632, "total_steps": 9134, "loss": 0.6577, "learning_rate": 3.290184999736903e-05, "epoch": 0.39760256164645996, "percentage": 39.76, "elapsed_time": "2 days, 18:50:23", "remaining_time": "4 days, 5:15:13", "throughput": 2723.65, "total_tokens": 655374944} {"current_steps": 3633, "total_steps": 9134, "loss": 0.8782, "learning_rate": 3.2893691720148064e-05, "epoch": 0.39771203371739783, "percentage": 39.77, "elapsed_time": "2 days, 18:51:30", "remaining_time": "4 days, 5:14:08", "throughput": 2723.66, "total_tokens": 655561312} {"current_steps": 3634, "total_steps": 9134, "loss": 0.7927, "learning_rate": 3.2885532509118446e-05, "epoch": 0.39782150578833575, "percentage": 39.79, "elapsed_time": "2 days, 18:52:39", "remaining_time": "4 days, 5:13:05", "throughput": 2723.71, "total_tokens": 655758656} {"current_steps": 3635, "total_steps": 9134, "loss": 0.6926, "learning_rate": 3.2877372365245426e-05, "epoch": 0.39793097785927367, "percentage": 39.8, "elapsed_time": "2 days, 18:53:44", "remaining_time": "4 days, 5:11:57", "throughput": 2723.73, "total_tokens": 655941888} {"current_steps": 3636, "total_steps": 9134, "loss": 0.7179, "learning_rate": 3.28692112894943e-05, "epoch": 0.39804044993021154, "percentage": 39.81, "elapsed_time": "2 days, 18:54:50", "remaining_time": "4 days, 5:10:50", "throughput": 2723.65, "total_tokens": 656100032} {"current_steps": 3637, "total_steps": 9134, "loss": 0.5905, "learning_rate": 3.286104928283054e-05, "epoch": 0.39814992200114946, "percentage": 39.82, "elapsed_time": "2 days, 18:55:56", "remaining_time": "4 days, 5:09:44", "throughput": 2723.71, "total_tokens": 656296704} {"current_steps": 3638, "total_steps": 9134, "loss": 0.6305, "learning_rate": 3.285288634621966e-05, "epoch": 0.3982593940720874, "percentage": 39.83, "elapsed_time": "2 days, 18:57:00", "remaining_time": "4 days, 5:08:34", "throughput": 2723.71, "total_tokens": 656470528} {"current_steps": 3639, "total_steps": 9134, "loss": 0.8518, "learning_rate": 3.2844722480627346e-05, "epoch": 0.39836886614302525, "percentage": 39.84, "elapsed_time": "2 days, 18:58:05", "remaining_time": "4 days, 5:07:26", "throughput": 2723.66, "total_tokens": 656636960} {"current_steps": 3640, "total_steps": 9134, "loss": 0.7705, "learning_rate": 3.2836557687019356e-05, "epoch": 0.39847833821396317, "percentage": 39.85, "elapsed_time": "2 days, 18:59:09", "remaining_time": "4 days, 5:06:16", "throughput": 2723.68, "total_tokens": 656814368} {"current_steps": 3641, "total_steps": 9134, "loss": 0.7442, "learning_rate": 3.2828391966361574e-05, "epoch": 0.3985878102849011, "percentage": 39.86, "elapsed_time": "2 days, 19:00:16", "remaining_time": "4 days, 5:05:11", "throughput": 2723.71, "total_tokens": 657002080} {"current_steps": 3642, "total_steps": 9134, "loss": 0.7696, "learning_rate": 3.2820225319619985e-05, "epoch": 0.39869728235583896, "percentage": 39.87, "elapsed_time": "2 days, 19:01:20", "remaining_time": "4 days, 5:04:02", "throughput": 2723.74, "total_tokens": 657186656} {"current_steps": 3643, "total_steps": 9134, "loss": 0.6857, "learning_rate": 3.281205774776069e-05, "epoch": 0.3988067544267769, "percentage": 39.88, "elapsed_time": "2 days, 19:02:22", "remaining_time": "4 days, 5:02:49", "throughput": 2723.7, "total_tokens": 657345696} {"current_steps": 3644, "total_steps": 9134, "loss": 0.6552, "learning_rate": 3.280388925174991e-05, "epoch": 0.39891622649771474, "percentage": 39.89, "elapsed_time": "2 days, 19:03:30", "remaining_time": "4 days, 5:01:46", "throughput": 2723.77, "total_tokens": 657547296} {"current_steps": 3645, "total_steps": 9134, "loss": 0.4807, "learning_rate": 3.279571983255394e-05, "epoch": 0.39902569856865266, "percentage": 39.91, "elapsed_time": "2 days, 19:04:32", "remaining_time": "4 days, 5:00:32", "throughput": 2723.69, "total_tokens": 657695584} {"current_steps": 3646, "total_steps": 9134, "loss": 0.5602, "learning_rate": 3.278754949113921e-05, "epoch": 0.3991351706395906, "percentage": 39.92, "elapsed_time": "2 days, 19:05:34", "remaining_time": "4 days, 4:59:20", "throughput": 2723.65, "total_tokens": 657857088} {"current_steps": 3647, "total_steps": 9134, "loss": 0.6172, "learning_rate": 3.277937822847228e-05, "epoch": 0.39924464271052845, "percentage": 39.93, "elapsed_time": "2 days, 19:06:40", "remaining_time": "4 days, 4:58:13", "throughput": 2723.57, "total_tokens": 658014784} {"current_steps": 3648, "total_steps": 9134, "loss": 0.5639, "learning_rate": 3.277120604551976e-05, "epoch": 0.3993541147814664, "percentage": 39.94, "elapsed_time": "2 days, 19:07:38", "remaining_time": "4 days, 4:56:54", "throughput": 2723.42, "total_tokens": 658137984} {"current_steps": 3649, "total_steps": 9134, "loss": 0.8239, "learning_rate": 3.276303294324843e-05, "epoch": 0.3994635868524043, "percentage": 39.95, "elapsed_time": "2 days, 19:08:46", "remaining_time": "4 days, 4:55:50", "throughput": 2723.47, "total_tokens": 658332864} {"current_steps": 3650, "total_steps": 9134, "loss": 0.7238, "learning_rate": 3.275485892262514e-05, "epoch": 0.39957305892334216, "percentage": 39.96, "elapsed_time": "2 days, 19:09:52", "remaining_time": "4 days, 4:54:44", "throughput": 2723.47, "total_tokens": 658513408} {"current_steps": 3651, "total_steps": 9134, "loss": 0.7913, "learning_rate": 3.274668398461686e-05, "epoch": 0.3996825309942801, "percentage": 39.97, "elapsed_time": "2 days, 19:10:59", "remaining_time": "4 days, 4:53:39", "throughput": 2723.45, "total_tokens": 658691712} {"current_steps": 3652, "total_steps": 9134, "loss": 0.8298, "learning_rate": 3.273850813019068e-05, "epoch": 0.399792003065218, "percentage": 39.98, "elapsed_time": "2 days, 19:12:06", "remaining_time": "4 days, 4:52:34", "throughput": 2723.52, "total_tokens": 658890400} {"current_steps": 3653, "total_steps": 9134, "loss": 0.6915, "learning_rate": 3.273033136031378e-05, "epoch": 0.39990147513615587, "percentage": 39.99, "elapsed_time": "2 days, 19:13:13", "remaining_time": "4 days, 4:51:29", "throughput": 2723.5, "total_tokens": 659069376} {"current_steps": 3654, "total_steps": 9134, "loss": 0.852, "learning_rate": 3.272215367595346e-05, "epoch": 0.4000109472070938, "percentage": 40.0, "elapsed_time": "2 days, 19:14:19", "remaining_time": "4 days, 4:50:22", "throughput": 2723.43, "total_tokens": 659232000} {"current_steps": 3655, "total_steps": 9134, "loss": 0.7987, "learning_rate": 3.271397507807712e-05, "epoch": 0.4001204192780317, "percentage": 40.02, "elapsed_time": "2 days, 19:15:23", "remaining_time": "4 days, 4:49:12", "throughput": 2723.49, "total_tokens": 659419264} {"current_steps": 3656, "total_steps": 9134, "loss": 0.7644, "learning_rate": 3.2705795567652276e-05, "epoch": 0.4002298913489696, "percentage": 40.03, "elapsed_time": "2 days, 19:16:31", "remaining_time": "4 days, 4:48:09", "throughput": 2723.44, "total_tokens": 659593536} {"current_steps": 3657, "total_steps": 9134, "loss": 0.8496, "learning_rate": 3.269761514564655e-05, "epoch": 0.4003393634199075, "percentage": 40.04, "elapsed_time": "2 days, 19:17:37", "remaining_time": "4 days, 4:47:03", "throughput": 2723.52, "total_tokens": 659793120} {"current_steps": 3658, "total_steps": 9134, "loss": 0.6602, "learning_rate": 3.268943381302767e-05, "epoch": 0.4004488354908454, "percentage": 40.05, "elapsed_time": "2 days, 19:18:45", "remaining_time": "4 days, 4:45:59", "throughput": 2723.58, "total_tokens": 659992032} {"current_steps": 3659, "total_steps": 9134, "loss": 0.8245, "learning_rate": 3.268125157076346e-05, "epoch": 0.4005583075617833, "percentage": 40.06, "elapsed_time": "2 days, 19:19:49", "remaining_time": "4 days, 4:44:49", "throughput": 2723.6, "total_tokens": 660171680} {"current_steps": 3660, "total_steps": 9134, "loss": 0.8781, "learning_rate": 3.267306841982188e-05, "epoch": 0.4006677796327212, "percentage": 40.07, "elapsed_time": "2 days, 19:20:54", "remaining_time": "4 days, 4:43:41", "throughput": 2723.51, "total_tokens": 660325792} {"current_steps": 3661, "total_steps": 9134, "loss": 0.7475, "learning_rate": 3.266488436117097e-05, "epoch": 0.4007772517036591, "percentage": 40.08, "elapsed_time": "2 days, 19:22:01", "remaining_time": "4 days, 4:42:37", "throughput": 2723.46, "total_tokens": 660498944} {"current_steps": 3662, "total_steps": 9134, "loss": 0.7077, "learning_rate": 3.265669939577889e-05, "epoch": 0.400886723774597, "percentage": 40.09, "elapsed_time": "2 days, 19:23:05", "remaining_time": "4 days, 4:41:27", "throughput": 2723.47, "total_tokens": 660675680} {"current_steps": 3663, "total_steps": 9134, "loss": 0.5512, "learning_rate": 3.264851352461391e-05, "epoch": 0.4009961958455349, "percentage": 40.1, "elapsed_time": "2 days, 19:24:11", "remaining_time": "4 days, 4:40:20", "throughput": 2723.55, "total_tokens": 660871904} {"current_steps": 3664, "total_steps": 9134, "loss": 0.8656, "learning_rate": 3.26403267486444e-05, "epoch": 0.4011056679164728, "percentage": 40.11, "elapsed_time": "2 days, 19:25:14", "remaining_time": "4 days, 4:39:08", "throughput": 2723.53, "total_tokens": 661040352} {"current_steps": 3665, "total_steps": 9134, "loss": 0.7723, "learning_rate": 3.263213906883885e-05, "epoch": 0.4012151399874107, "percentage": 40.12, "elapsed_time": "2 days, 19:26:21", "remaining_time": "4 days, 4:38:03", "throughput": 2723.6, "total_tokens": 661238816} {"current_steps": 3666, "total_steps": 9134, "loss": 0.6963, "learning_rate": 3.262395048616584e-05, "epoch": 0.40132461205834863, "percentage": 40.14, "elapsed_time": "2 days, 19:27:25", "remaining_time": "4 days, 4:36:54", "throughput": 2723.6, "total_tokens": 661412864} {"current_steps": 3667, "total_steps": 9134, "loss": 0.7936, "learning_rate": 3.2615761001594055e-05, "epoch": 0.4014340841292865, "percentage": 40.15, "elapsed_time": "2 days, 19:28:28", "remaining_time": "4 days, 4:35:43", "throughput": 2723.58, "total_tokens": 661580864} {"current_steps": 3668, "total_steps": 9134, "loss": 0.8228, "learning_rate": 3.26075706160923e-05, "epoch": 0.4015435562002244, "percentage": 40.16, "elapsed_time": "2 days, 19:29:36", "remaining_time": "4 days, 4:34:40", "throughput": 2723.61, "total_tokens": 661773952} {"current_steps": 3669, "total_steps": 9134, "loss": 0.7054, "learning_rate": 3.259937933062949e-05, "epoch": 0.40165302827116234, "percentage": 40.17, "elapsed_time": "2 days, 19:30:41", "remaining_time": "4 days, 4:33:31", "throughput": 2723.6, "total_tokens": 661946656} {"current_steps": 3670, "total_steps": 9134, "loss": 0.5957, "learning_rate": 3.2591187146174636e-05, "epoch": 0.4017625003421002, "percentage": 40.18, "elapsed_time": "2 days, 19:31:44", "remaining_time": "4 days, 4:32:21", "throughput": 2723.54, "total_tokens": 662106816} {"current_steps": 3671, "total_steps": 9134, "loss": 0.95, "learning_rate": 3.258299406369685e-05, "epoch": 0.4018719724130381, "percentage": 40.19, "elapsed_time": "2 days, 19:32:52", "remaining_time": "4 days, 4:31:17", "throughput": 2723.53, "total_tokens": 662288032} {"current_steps": 3672, "total_steps": 9134, "loss": 0.7413, "learning_rate": 3.257480008416536e-05, "epoch": 0.40198144448397605, "percentage": 40.2, "elapsed_time": "2 days, 19:34:01", "remaining_time": "4 days, 4:30:14", "throughput": 2723.61, "total_tokens": 662493888} {"current_steps": 3673, "total_steps": 9134, "loss": 0.7711, "learning_rate": 3.25666052085495e-05, "epoch": 0.4020909165549139, "percentage": 40.21, "elapsed_time": "2 days, 19:35:08", "remaining_time": "4 days, 4:29:10", "throughput": 2723.59, "total_tokens": 662673088} {"current_steps": 3674, "total_steps": 9134, "loss": 0.8008, "learning_rate": 3.2558409437818714e-05, "epoch": 0.40220038862585183, "percentage": 40.22, "elapsed_time": "2 days, 19:36:12", "remaining_time": "4 days, 4:28:00", "throughput": 2723.57, "total_tokens": 662841088} {"current_steps": 3675, "total_steps": 9134, "loss": 0.6629, "learning_rate": 3.255021277294253e-05, "epoch": 0.40230986069678976, "percentage": 40.23, "elapsed_time": "2 days, 19:37:16", "remaining_time": "4 days, 4:26:51", "throughput": 2723.53, "total_tokens": 663009088} {"current_steps": 3676, "total_steps": 9134, "loss": 0.801, "learning_rate": 3.254201521489062e-05, "epoch": 0.4024193327677276, "percentage": 40.25, "elapsed_time": "2 days, 19:38:22", "remaining_time": "4 days, 4:25:44", "throughput": 2723.52, "total_tokens": 663183808} {"current_steps": 3677, "total_steps": 9134, "loss": 0.8856, "learning_rate": 3.253381676463273e-05, "epoch": 0.40252880483866554, "percentage": 40.26, "elapsed_time": "2 days, 19:39:29", "remaining_time": "4 days, 4:24:38", "throughput": 2723.58, "total_tokens": 663379584} {"current_steps": 3678, "total_steps": 9134, "loss": 0.7237, "learning_rate": 3.252561742313871e-05, "epoch": 0.4026382769096034, "percentage": 40.27, "elapsed_time": "2 days, 19:40:33", "remaining_time": "4 days, 4:23:29", "throughput": 2723.54, "total_tokens": 663546688} {"current_steps": 3679, "total_steps": 9134, "loss": 0.7983, "learning_rate": 3.2517417191378544e-05, "epoch": 0.40274774898054133, "percentage": 40.28, "elapsed_time": "2 days, 19:41:40", "remaining_time": "4 days, 4:22:24", "throughput": 2723.66, "total_tokens": 663757248} {"current_steps": 3680, "total_steps": 9134, "loss": 0.7509, "learning_rate": 3.250921607032229e-05, "epoch": 0.40285722105147925, "percentage": 40.29, "elapsed_time": "2 days, 19:42:49", "remaining_time": "4 days, 4:21:21", "throughput": 2723.66, "total_tokens": 663943168} {"current_steps": 3681, "total_steps": 9134, "loss": 0.845, "learning_rate": 3.2501014060940135e-05, "epoch": 0.4029666931224171, "percentage": 40.3, "elapsed_time": "2 days, 19:43:55", "remaining_time": "4 days, 4:20:15", "throughput": 2723.7, "total_tokens": 664134912} {"current_steps": 3682, "total_steps": 9134, "loss": 0.661, "learning_rate": 3.249281116420234e-05, "epoch": 0.40307616519335504, "percentage": 40.31, "elapsed_time": "2 days, 19:45:03", "remaining_time": "4 days, 4:19:12", "throughput": 2723.77, "total_tokens": 664336288} {"current_steps": 3683, "total_steps": 9134, "loss": 0.7089, "learning_rate": 3.248460738107932e-05, "epoch": 0.40318563726429296, "percentage": 40.32, "elapsed_time": "2 days, 19:46:05", "remaining_time": "4 days, 4:17:59", "throughput": 2723.71, "total_tokens": 664490176} {"current_steps": 3684, "total_steps": 9134, "loss": 0.6887, "learning_rate": 3.2476402712541556e-05, "epoch": 0.40329510933523083, "percentage": 40.33, "elapsed_time": "2 days, 19:47:12", "remaining_time": "4 days, 4:16:54", "throughput": 2723.72, "total_tokens": 664677440} {"current_steps": 3685, "total_steps": 9134, "loss": 0.7156, "learning_rate": 3.246819715955964e-05, "epoch": 0.40340458140616875, "percentage": 40.34, "elapsed_time": "2 days, 19:48:19", "remaining_time": "4 days, 4:15:49", "throughput": 2723.74, "total_tokens": 664863360} {"current_steps": 3686, "total_steps": 9134, "loss": 0.691, "learning_rate": 3.2459990723104285e-05, "epoch": 0.40351405347710667, "percentage": 40.35, "elapsed_time": "2 days, 19:49:21", "remaining_time": "4 days, 4:14:37", "throughput": 2723.69, "total_tokens": 665021280} {"current_steps": 3687, "total_steps": 9134, "loss": 0.6117, "learning_rate": 3.245178340414628e-05, "epoch": 0.40362352554804454, "percentage": 40.37, "elapsed_time": "2 days, 19:50:29", "remaining_time": "4 days, 4:13:32", "throughput": 2723.76, "total_tokens": 665220864} {"current_steps": 3688, "total_steps": 9134, "loss": 0.6945, "learning_rate": 3.244357520365654e-05, "epoch": 0.40373299761898246, "percentage": 40.38, "elapsed_time": "2 days, 19:51:35", "remaining_time": "4 days, 4:12:26", "throughput": 2723.75, "total_tokens": 665399840} {"current_steps": 3689, "total_steps": 9134, "loss": 0.6683, "learning_rate": 3.243536612260609e-05, "epoch": 0.4038424696899204, "percentage": 40.39, "elapsed_time": "2 days, 19:52:40", "remaining_time": "4 days, 4:11:18", "throughput": 2723.74, "total_tokens": 665576128} {"current_steps": 3690, "total_steps": 9134, "loss": 0.507, "learning_rate": 3.242715616196604e-05, "epoch": 0.40395194176085825, "percentage": 40.4, "elapsed_time": "2 days, 19:53:45", "remaining_time": "4 days, 4:10:10", "throughput": 2723.71, "total_tokens": 665744576} {"current_steps": 3691, "total_steps": 9134, "loss": 0.6367, "learning_rate": 3.241894532270762e-05, "epoch": 0.40406141383179617, "percentage": 40.41, "elapsed_time": "2 days, 19:54:45", "remaining_time": "4 days, 4:08:54", "throughput": 2723.67, "total_tokens": 665898240} {"current_steps": 3692, "total_steps": 9134, "loss": 0.5868, "learning_rate": 3.2410733605802146e-05, "epoch": 0.4041708859027341, "percentage": 40.42, "elapsed_time": "2 days, 19:55:49", "remaining_time": "4 days, 4:07:46", "throughput": 2723.66, "total_tokens": 666071392} {"current_steps": 3693, "total_steps": 9134, "loss": 0.9129, "learning_rate": 3.240252101222105e-05, "epoch": 0.40428035797367196, "percentage": 40.43, "elapsed_time": "2 days, 19:56:52", "remaining_time": "4 days, 4:06:34", "throughput": 2723.61, "total_tokens": 666230208} {"current_steps": 3694, "total_steps": 9134, "loss": 0.8384, "learning_rate": 3.2394307542935876e-05, "epoch": 0.4043898300446099, "percentage": 40.44, "elapsed_time": "2 days, 19:58:01", "remaining_time": "4 days, 4:05:31", "throughput": 2723.71, "total_tokens": 666440768} {"current_steps": 3695, "total_steps": 9134, "loss": 0.6633, "learning_rate": 3.2386093198918246e-05, "epoch": 0.4044993021155478, "percentage": 40.45, "elapsed_time": "2 days, 19:59:04", "remaining_time": "4 days, 4:04:20", "throughput": 2723.67, "total_tokens": 666601376} {"current_steps": 3696, "total_steps": 9134, "loss": 0.7502, "learning_rate": 3.237787798113992e-05, "epoch": 0.40460877418648566, "percentage": 40.46, "elapsed_time": "2 days, 20:00:06", "remaining_time": "4 days, 4:03:08", "throughput": 2723.63, "total_tokens": 666761760} {"current_steps": 3697, "total_steps": 9134, "loss": 0.7542, "learning_rate": 3.236966189057273e-05, "epoch": 0.4047182462574236, "percentage": 40.48, "elapsed_time": "2 days, 20:01:12", "remaining_time": "4 days, 4:02:02", "throughput": 2723.65, "total_tokens": 666946784} {"current_steps": 3698, "total_steps": 9134, "loss": 0.6308, "learning_rate": 3.236144492818862e-05, "epoch": 0.40482771832836145, "percentage": 40.49, "elapsed_time": "2 days, 20:02:17", "remaining_time": "4 days, 4:00:54", "throughput": 2723.58, "total_tokens": 667107168} {"current_steps": 3699, "total_steps": 9134, "loss": 0.8963, "learning_rate": 3.235322709495966e-05, "epoch": 0.4049371903992994, "percentage": 40.5, "elapsed_time": "2 days, 20:03:21", "remaining_time": "4 days, 3:59:44", "throughput": 2723.59, "total_tokens": 667283008} {"current_steps": 3700, "total_steps": 9134, "loss": 0.7218, "learning_rate": 3.234500839185799e-05, "epoch": 0.4050466624702373, "percentage": 40.51, "elapsed_time": "2 days, 20:04:23", "remaining_time": "4 days, 3:58:31", "throughput": 2723.5, "total_tokens": 667429952} {"current_steps": 3701, "total_steps": 9134, "loss": 0.7665, "learning_rate": 3.233678881985586e-05, "epoch": 0.40515613454117516, "percentage": 40.52, "elapsed_time": "2 days, 20:05:31", "remaining_time": "4 days, 3:57:28", "throughput": 2723.57, "total_tokens": 667631776} {"current_steps": 3702, "total_steps": 9134, "loss": 0.9228, "learning_rate": 3.232856837992564e-05, "epoch": 0.4052656066121131, "percentage": 40.53, "elapsed_time": "2 days, 20:06:37", "remaining_time": "4 days, 3:56:21", "throughput": 2723.61, "total_tokens": 667821728} {"current_steps": 3703, "total_steps": 9134, "loss": 0.7327, "learning_rate": 3.232034707303979e-05, "epoch": 0.405375078683051, "percentage": 40.54, "elapsed_time": "2 days, 20:07:43", "remaining_time": "4 days, 3:55:15", "throughput": 2723.59, "total_tokens": 667997120} {"current_steps": 3704, "total_steps": 9134, "loss": 0.6943, "learning_rate": 3.231212490017088e-05, "epoch": 0.40548455075398887, "percentage": 40.55, "elapsed_time": "2 days, 20:08:51", "remaining_time": "4 days, 3:54:12", "throughput": 2723.65, "total_tokens": 668197152} {"current_steps": 3705, "total_steps": 9134, "loss": 0.6198, "learning_rate": 3.230390186229157e-05, "epoch": 0.4055940228249268, "percentage": 40.56, "elapsed_time": "2 days, 20:09:55", "remaining_time": "4 days, 3:53:02", "throughput": 2723.64, "total_tokens": 668370976} {"current_steps": 3706, "total_steps": 9134, "loss": 0.7217, "learning_rate": 3.229567796037463e-05, "epoch": 0.4057034948958647, "percentage": 40.57, "elapsed_time": "2 days, 20:10:58", "remaining_time": "4 days, 3:51:51", "throughput": 2723.67, "total_tokens": 668548832} {"current_steps": 3707, "total_steps": 9134, "loss": 0.5537, "learning_rate": 3.228745319539294e-05, "epoch": 0.4058129669668026, "percentage": 40.58, "elapsed_time": "2 days, 20:12:02", "remaining_time": "4 days, 3:50:41", "throughput": 2723.62, "total_tokens": 668709888} {"current_steps": 3708, "total_steps": 9134, "loss": 0.6726, "learning_rate": 3.227922756831947e-05, "epoch": 0.4059224390377405, "percentage": 40.6, "elapsed_time": "2 days, 20:13:06", "remaining_time": "4 days, 3:49:31", "throughput": 2723.57, "total_tokens": 668870496} {"current_steps": 3709, "total_steps": 9134, "loss": 0.7782, "learning_rate": 3.227100108012728e-05, "epoch": 0.4060319111086784, "percentage": 40.61, "elapsed_time": "2 days, 20:14:12", "remaining_time": "4 days, 3:48:25", "throughput": 2723.61, "total_tokens": 669060224} {"current_steps": 3710, "total_steps": 9134, "loss": 0.5244, "learning_rate": 3.226277373178957e-05, "epoch": 0.4061413831796163, "percentage": 40.62, "elapsed_time": "2 days, 20:15:14", "remaining_time": "4 days, 3:47:13", "throughput": 2723.56, "total_tokens": 669217024} {"current_steps": 3711, "total_steps": 9134, "loss": 0.6058, "learning_rate": 3.2254545524279626e-05, "epoch": 0.4062508552505542, "percentage": 40.63, "elapsed_time": "2 days, 20:16:19", "remaining_time": "4 days, 3:46:04", "throughput": 2723.56, "total_tokens": 669393984} {"current_steps": 3712, "total_steps": 9134, "loss": 0.6531, "learning_rate": 3.22463164585708e-05, "epoch": 0.40636032732149213, "percentage": 40.64, "elapsed_time": "2 days, 20:17:21", "remaining_time": "4 days, 3:44:53", "throughput": 2723.46, "total_tokens": 669539360} {"current_steps": 3713, "total_steps": 9134, "loss": 0.6643, "learning_rate": 3.223808653563659e-05, "epoch": 0.40646979939243, "percentage": 40.65, "elapsed_time": "2 days, 20:18:23", "remaining_time": "4 days, 3:43:40", "throughput": 2723.35, "total_tokens": 669680928} {"current_steps": 3714, "total_steps": 9134, "loss": 0.7938, "learning_rate": 3.222985575645058e-05, "epoch": 0.4065792714633679, "percentage": 40.66, "elapsed_time": "2 days, 20:19:30", "remaining_time": "4 days, 3:42:35", "throughput": 2723.43, "total_tokens": 669882976} {"current_steps": 3715, "total_steps": 9134, "loss": 0.7022, "learning_rate": 3.222162412198646e-05, "epoch": 0.4066887435343058, "percentage": 40.67, "elapsed_time": "2 days, 20:20:34", "remaining_time": "4 days, 3:41:25", "throughput": 2723.44, "total_tokens": 670060608} {"current_steps": 3716, "total_steps": 9134, "loss": 0.6649, "learning_rate": 3.221339163321801e-05, "epoch": 0.4067982156052437, "percentage": 40.68, "elapsed_time": "2 days, 20:21:36", "remaining_time": "4 days, 3:40:12", "throughput": 2723.32, "total_tokens": 670197920} {"current_steps": 3717, "total_steps": 9134, "loss": 0.6229, "learning_rate": 3.220515829111911e-05, "epoch": 0.40690768767618163, "percentage": 40.69, "elapsed_time": "2 days, 20:22:44", "remaining_time": "4 days, 3:39:10", "throughput": 2723.39, "total_tokens": 670403104} {"current_steps": 3718, "total_steps": 9134, "loss": 0.8802, "learning_rate": 3.219692409666377e-05, "epoch": 0.4070171597471195, "percentage": 40.71, "elapsed_time": "2 days, 20:23:53", "remaining_time": "4 days, 3:38:07", "throughput": 2723.48, "total_tokens": 670611200} {"current_steps": 3719, "total_steps": 9134, "loss": 0.6061, "learning_rate": 3.218868905082606e-05, "epoch": 0.4071266318180574, "percentage": 40.72, "elapsed_time": "2 days, 20:25:00", "remaining_time": "4 days, 3:37:02", "throughput": 2723.55, "total_tokens": 670811680} {"current_steps": 3720, "total_steps": 9134, "loss": 0.6817, "learning_rate": 3.218045315458018e-05, "epoch": 0.40723610388899534, "percentage": 40.73, "elapsed_time": "2 days, 20:26:01", "remaining_time": "4 days, 3:35:48", "throughput": 2723.44, "total_tokens": 670949888} {"current_steps": 3721, "total_steps": 9134, "loss": 0.6153, "learning_rate": 3.2172216408900426e-05, "epoch": 0.4073455759599332, "percentage": 40.74, "elapsed_time": "2 days, 20:27:05", "remaining_time": "4 days, 3:34:39", "throughput": 2723.42, "total_tokens": 671121024} {"current_steps": 3722, "total_steps": 9134, "loss": 0.7762, "learning_rate": 3.2163978814761174e-05, "epoch": 0.4074550480308711, "percentage": 40.75, "elapsed_time": "2 days, 20:28:12", "remaining_time": "4 days, 3:33:33", "throughput": 2723.45, "total_tokens": 671307840} {"current_steps": 3723, "total_steps": 9134, "loss": 0.7713, "learning_rate": 3.215574037313692e-05, "epoch": 0.40756452010180905, "percentage": 40.76, "elapsed_time": "2 days, 20:29:17", "remaining_time": "4 days, 3:32:26", "throughput": 2723.47, "total_tokens": 671491968} {"current_steps": 3724, "total_steps": 9134, "loss": 0.6724, "learning_rate": 3.214750108500227e-05, "epoch": 0.4076739921727469, "percentage": 40.77, "elapsed_time": "2 days, 20:30:22", "remaining_time": "4 days, 3:31:18", "throughput": 2723.54, "total_tokens": 671687072} {"current_steps": 3725, "total_steps": 9134, "loss": 0.7907, "learning_rate": 3.21392609513319e-05, "epoch": 0.40778346424368483, "percentage": 40.78, "elapsed_time": "2 days, 20:31:31", "remaining_time": "4 days, 3:30:15", "throughput": 2723.5, "total_tokens": 671864032} {"current_steps": 3726, "total_steps": 9134, "loss": 0.878, "learning_rate": 3.21310199731006e-05, "epoch": 0.40789293631462276, "percentage": 40.79, "elapsed_time": "2 days, 20:32:36", "remaining_time": "4 days, 3:29:07", "throughput": 2723.47, "total_tokens": 672034720} {"current_steps": 3727, "total_steps": 9134, "loss": 0.5762, "learning_rate": 3.212277815128328e-05, "epoch": 0.4080024083855606, "percentage": 40.8, "elapsed_time": "2 days, 20:33:40", "remaining_time": "4 days, 3:27:59", "throughput": 2723.47, "total_tokens": 672210336} {"current_steps": 3728, "total_steps": 9134, "loss": 0.6817, "learning_rate": 3.2114535486854915e-05, "epoch": 0.40811188045649854, "percentage": 40.81, "elapsed_time": "2 days, 20:34:48", "remaining_time": "4 days, 3:26:55", "throughput": 2723.37, "total_tokens": 672370944} {"current_steps": 3729, "total_steps": 9134, "loss": 0.7638, "learning_rate": 3.210629198079061e-05, "epoch": 0.40822135252743647, "percentage": 40.83, "elapsed_time": "2 days, 20:35:54", "remaining_time": "4 days, 3:25:47", "throughput": 2723.31, "total_tokens": 672532672} {"current_steps": 3730, "total_steps": 9134, "loss": 0.6333, "learning_rate": 3.209804763406554e-05, "epoch": 0.40833082459837433, "percentage": 40.84, "elapsed_time": "2 days, 20:36:53", "remaining_time": "4 days, 3:24:30", "throughput": 2723.2, "total_tokens": 672665056} {"current_steps": 3731, "total_steps": 9134, "loss": 0.7198, "learning_rate": 3.2089802447655006e-05, "epoch": 0.40844029666931225, "percentage": 40.85, "elapsed_time": "2 days, 20:37:56", "remaining_time": "4 days, 3:23:21", "throughput": 2723.24, "total_tokens": 672848512} {"current_steps": 3732, "total_steps": 9134, "loss": 0.7495, "learning_rate": 3.20815564225344e-05, "epoch": 0.4085497687402501, "percentage": 40.86, "elapsed_time": "2 days, 20:39:02", "remaining_time": "4 days, 3:22:14", "throughput": 2723.25, "total_tokens": 673031072} {"current_steps": 3733, "total_steps": 9134, "loss": 0.6638, "learning_rate": 3.20733095596792e-05, "epoch": 0.40865924081118804, "percentage": 40.87, "elapsed_time": "2 days, 20:40:08", "remaining_time": "4 days, 3:21:07", "throughput": 2723.23, "total_tokens": 673205568} {"current_steps": 3734, "total_steps": 9134, "loss": 0.809, "learning_rate": 3.2065061860065016e-05, "epoch": 0.40876871288212596, "percentage": 40.88, "elapsed_time": "2 days, 20:41:17", "remaining_time": "4 days, 3:20:05", "throughput": 2723.27, "total_tokens": 673403584} {"current_steps": 3735, "total_steps": 9134, "loss": 0.7813, "learning_rate": 3.20568133246675e-05, "epoch": 0.40887818495306383, "percentage": 40.89, "elapsed_time": "2 days, 20:42:20", "remaining_time": "4 days, 3:18:53", "throughput": 2723.26, "total_tokens": 673571808} {"current_steps": 3736, "total_steps": 9134, "loss": 0.6224, "learning_rate": 3.204856395446247e-05, "epoch": 0.40898765702400175, "percentage": 40.9, "elapsed_time": "2 days, 20:43:24", "remaining_time": "4 days, 3:17:45", "throughput": 2723.23, "total_tokens": 673741152} {"current_steps": 3737, "total_steps": 9134, "loss": 0.6876, "learning_rate": 3.204031375042579e-05, "epoch": 0.40909712909493967, "percentage": 40.91, "elapsed_time": "2 days, 20:44:33", "remaining_time": "4 days, 3:16:43", "throughput": 2723.26, "total_tokens": 673935584} {"current_steps": 3738, "total_steps": 9134, "loss": 0.6662, "learning_rate": 3.2032062713533464e-05, "epoch": 0.40920660116587754, "percentage": 40.92, "elapsed_time": "2 days, 20:45:42", "remaining_time": "4 days, 3:15:41", "throughput": 2723.31, "total_tokens": 674134944} {"current_steps": 3739, "total_steps": 9134, "loss": 0.7518, "learning_rate": 3.2023810844761554e-05, "epoch": 0.40931607323681546, "percentage": 40.93, "elapsed_time": "2 days, 20:46:48", "remaining_time": "4 days, 3:14:33", "throughput": 2723.27, "total_tokens": 674304736} {"current_steps": 3740, "total_steps": 9134, "loss": 0.7462, "learning_rate": 3.201555814508626e-05, "epoch": 0.4094255453077534, "percentage": 40.95, "elapsed_time": "2 days, 20:47:54", "remaining_time": "4 days, 3:13:27", "throughput": 2723.31, "total_tokens": 674494016} {"current_steps": 3741, "total_steps": 9134, "loss": 0.7647, "learning_rate": 3.200730461548384e-05, "epoch": 0.40953501737869125, "percentage": 40.96, "elapsed_time": "2 days, 20:48:57", "remaining_time": "4 days, 3:12:16", "throughput": 2723.26, "total_tokens": 674651488} {"current_steps": 3742, "total_steps": 9134, "loss": 0.6252, "learning_rate": 3.199905025693067e-05, "epoch": 0.40964448944962917, "percentage": 40.97, "elapsed_time": "2 days, 20:49:58", "remaining_time": "4 days, 3:11:03", "throughput": 2723.21, "total_tokens": 674807616} {"current_steps": 3743, "total_steps": 9134, "loss": 0.8545, "learning_rate": 3.199079507040324e-05, "epoch": 0.4097539615205671, "percentage": 40.98, "elapsed_time": "2 days, 20:51:03", "remaining_time": "4 days, 3:09:54", "throughput": 2723.19, "total_tokens": 674978080} {"current_steps": 3744, "total_steps": 9134, "loss": 0.6787, "learning_rate": 3.198253905687813e-05, "epoch": 0.40986343359150496, "percentage": 40.99, "elapsed_time": "2 days, 20:52:09", "remaining_time": "4 days, 3:08:49", "throughput": 2723.25, "total_tokens": 675174528} {"current_steps": 3745, "total_steps": 9134, "loss": 0.8089, "learning_rate": 3.1974282217331985e-05, "epoch": 0.4099729056624429, "percentage": 41.0, "elapsed_time": "2 days, 20:53:16", "remaining_time": "4 days, 3:07:42", "throughput": 2723.24, "total_tokens": 675353280} {"current_steps": 3746, "total_steps": 9134, "loss": 0.8599, "learning_rate": 3.1966024552741586e-05, "epoch": 0.4100823777333808, "percentage": 41.01, "elapsed_time": "2 days, 20:54:21", "remaining_time": "4 days, 3:06:35", "throughput": 2723.23, "total_tokens": 675527552} {"current_steps": 3747, "total_steps": 9134, "loss": 0.5155, "learning_rate": 3.1957766064083804e-05, "epoch": 0.41019184980431866, "percentage": 41.02, "elapsed_time": "2 days, 20:55:24", "remaining_time": "4 days, 3:05:24", "throughput": 2723.17, "total_tokens": 675685248} {"current_steps": 3748, "total_steps": 9134, "loss": 0.7574, "learning_rate": 3.19495067523356e-05, "epoch": 0.4103013218752566, "percentage": 41.03, "elapsed_time": "2 days, 20:56:33", "remaining_time": "4 days, 3:04:22", "throughput": 2723.17, "total_tokens": 675873856} {"current_steps": 3749, "total_steps": 9134, "loss": 0.7892, "learning_rate": 3.194124661847403e-05, "epoch": 0.41041079394619445, "percentage": 41.04, "elapsed_time": "2 days, 20:57:41", "remaining_time": "4 days, 3:03:18", "throughput": 2723.25, "total_tokens": 676078144} {"current_steps": 3750, "total_steps": 9134, "loss": 0.6695, "learning_rate": 3.193298566347625e-05, "epoch": 0.4105202660171324, "percentage": 41.06, "elapsed_time": "2 days, 20:58:48", "remaining_time": "4 days, 3:02:14", "throughput": 2723.25, "total_tokens": 676262272} {"current_steps": 3751, "total_steps": 9134, "loss": 0.7248, "learning_rate": 3.192472388831953e-05, "epoch": 0.4106297380880703, "percentage": 41.07, "elapsed_time": "2 days, 20:59:57", "remaining_time": "4 days, 3:01:11", "throughput": 2723.26, "total_tokens": 676450880} {"current_steps": 3752, "total_steps": 9134, "loss": 0.6391, "learning_rate": 3.19164612939812e-05, "epoch": 0.41073921015900816, "percentage": 41.08, "elapsed_time": "2 days, 21:01:01", "remaining_time": "4 days, 3:00:02", "throughput": 2723.13, "total_tokens": 676593568} {"current_steps": 3753, "total_steps": 9134, "loss": 0.7536, "learning_rate": 3.1908197881438727e-05, "epoch": 0.4108486822299461, "percentage": 41.09, "elapsed_time": "2 days, 21:02:09", "remaining_time": "4 days, 2:58:58", "throughput": 2723.1, "total_tokens": 676772096} {"current_steps": 3754, "total_steps": 9134, "loss": 0.5998, "learning_rate": 3.1899933651669656e-05, "epoch": 0.410958154300884, "percentage": 41.1, "elapsed_time": "2 days, 21:03:15", "remaining_time": "4 days, 2:57:51", "throughput": 2723.11, "total_tokens": 676950848} {"current_steps": 3755, "total_steps": 9134, "loss": 0.6238, "learning_rate": 3.1891668605651614e-05, "epoch": 0.41106762637182187, "percentage": 41.11, "elapsed_time": "2 days, 21:04:16", "remaining_time": "4 days, 2:56:37", "throughput": 2723.02, "total_tokens": 677095104} {"current_steps": 3756, "total_steps": 9134, "loss": 0.6728, "learning_rate": 3.1883402744362355e-05, "epoch": 0.4111770984427598, "percentage": 41.12, "elapsed_time": "2 days, 21:05:20", "remaining_time": "4 days, 2:55:29", "throughput": 2722.99, "total_tokens": 677263328} {"current_steps": 3757, "total_steps": 9134, "loss": 0.5951, "learning_rate": 3.1875136068779706e-05, "epoch": 0.4112865705136977, "percentage": 41.13, "elapsed_time": "2 days, 21:06:25", "remaining_time": "4 days, 2:54:21", "throughput": 2722.91, "total_tokens": 677422368} {"current_steps": 3758, "total_steps": 9134, "loss": 0.8697, "learning_rate": 3.186686857988161e-05, "epoch": 0.4113960425846356, "percentage": 41.14, "elapsed_time": "2 days, 21:07:32", "remaining_time": "4 days, 2:53:16", "throughput": 2722.97, "total_tokens": 677618816} {"current_steps": 3759, "total_steps": 9134, "loss": 0.698, "learning_rate": 3.1858600278646084e-05, "epoch": 0.4115055146555735, "percentage": 41.15, "elapsed_time": "2 days, 21:08:35", "remaining_time": "4 days, 2:52:04", "throughput": 2722.92, "total_tokens": 677778304} {"current_steps": 3760, "total_steps": 9134, "loss": 0.7378, "learning_rate": 3.185033116605126e-05, "epoch": 0.4116149867265114, "percentage": 41.16, "elapsed_time": "2 days, 21:09:40", "remaining_time": "4 days, 2:50:56", "throughput": 2722.88, "total_tokens": 677944736} {"current_steps": 3761, "total_steps": 9134, "loss": 0.5998, "learning_rate": 3.1842061243075353e-05, "epoch": 0.4117244587974493, "percentage": 41.18, "elapsed_time": "2 days, 21:10:46", "remaining_time": "4 days, 2:49:49", "throughput": 2722.95, "total_tokens": 678141408} {"current_steps": 3762, "total_steps": 9134, "loss": 0.7681, "learning_rate": 3.183379051069668e-05, "epoch": 0.4118339308683872, "percentage": 41.19, "elapsed_time": "2 days, 21:11:51", "remaining_time": "4 days, 2:48:42", "throughput": 2722.96, "total_tokens": 678320160} {"current_steps": 3763, "total_steps": 9134, "loss": 0.8954, "learning_rate": 3.182551896989365e-05, "epoch": 0.41194340293932513, "percentage": 41.2, "elapsed_time": "2 days, 21:12:59", "remaining_time": "4 days, 2:47:39", "throughput": 2723.01, "total_tokens": 678518848} {"current_steps": 3764, "total_steps": 9134, "loss": 0.845, "learning_rate": 3.181724662164478e-05, "epoch": 0.412052875010263, "percentage": 41.21, "elapsed_time": "2 days, 21:14:09", "remaining_time": "4 days, 2:46:37", "throughput": 2723.05, "total_tokens": 678717312} {"current_steps": 3765, "total_steps": 9134, "loss": 0.6463, "learning_rate": 3.180897346692867e-05, "epoch": 0.4121623470812009, "percentage": 41.22, "elapsed_time": "2 days, 21:15:15", "remaining_time": "4 days, 2:45:31", "throughput": 2723.11, "total_tokens": 678915104} {"current_steps": 3766, "total_steps": 9134, "loss": 0.6726, "learning_rate": 3.180069950672401e-05, "epoch": 0.4122718191521388, "percentage": 41.23, "elapsed_time": "2 days, 21:16:19", "remaining_time": "4 days, 2:44:21", "throughput": 2723.05, "total_tokens": 679072352} {"current_steps": 3767, "total_steps": 9134, "loss": 0.8163, "learning_rate": 3.17924247420096e-05, "epoch": 0.4123812912230767, "percentage": 41.24, "elapsed_time": "2 days, 21:17:24", "remaining_time": "4 days, 2:43:14", "throughput": 2723.03, "total_tokens": 679246400} {"current_steps": 3768, "total_steps": 9134, "loss": 0.8238, "learning_rate": 3.178414917376433e-05, "epoch": 0.41249076329401463, "percentage": 41.25, "elapsed_time": "2 days, 21:18:30", "remaining_time": "4 days, 2:42:07", "throughput": 2722.95, "total_tokens": 679406112} {"current_steps": 3769, "total_steps": 9134, "loss": 0.6491, "learning_rate": 3.1775872802967175e-05, "epoch": 0.4126002353649525, "percentage": 41.26, "elapsed_time": "2 days, 21:19:32", "remaining_time": "4 days, 2:40:55", "throughput": 2722.89, "total_tokens": 679558656} {"current_steps": 3770, "total_steps": 9134, "loss": 0.6192, "learning_rate": 3.176759563059722e-05, "epoch": 0.4127097074358904, "percentage": 41.27, "elapsed_time": "2 days, 21:20:34", "remaining_time": "4 days, 2:39:43", "throughput": 2722.82, "total_tokens": 679711424} {"current_steps": 3771, "total_steps": 9134, "loss": 0.8721, "learning_rate": 3.175931765763365e-05, "epoch": 0.41281917950682834, "percentage": 41.29, "elapsed_time": "2 days, 21:21:43", "remaining_time": "4 days, 2:38:40", "throughput": 2722.89, "total_tokens": 679914368} {"current_steps": 3772, "total_steps": 9134, "loss": 0.7846, "learning_rate": 3.175103888505572e-05, "epoch": 0.4129286515777662, "percentage": 41.3, "elapsed_time": "2 days, 21:22:47", "remaining_time": "4 days, 2:37:31", "throughput": 2722.9, "total_tokens": 680093344} {"current_steps": 3773, "total_steps": 9134, "loss": 0.7348, "learning_rate": 3.174275931384279e-05, "epoch": 0.4130381236487041, "percentage": 41.31, "elapsed_time": "2 days, 21:23:53", "remaining_time": "4 days, 2:36:25", "throughput": 2722.96, "total_tokens": 680287776} {"current_steps": 3774, "total_steps": 9134, "loss": 0.8077, "learning_rate": 3.173447894497433e-05, "epoch": 0.41314759571964205, "percentage": 41.32, "elapsed_time": "2 days, 21:25:00", "remaining_time": "4 days, 2:35:19", "throughput": 2722.93, "total_tokens": 680461600} {"current_steps": 3775, "total_steps": 9134, "loss": 0.5736, "learning_rate": 3.172619777942988e-05, "epoch": 0.4132570677905799, "percentage": 41.33, "elapsed_time": "2 days, 21:26:05", "remaining_time": "4 days, 2:34:11", "throughput": 2722.98, "total_tokens": 680650208} {"current_steps": 3776, "total_steps": 9134, "loss": 0.8898, "learning_rate": 3.1717915818189095e-05, "epoch": 0.41336653986151783, "percentage": 41.34, "elapsed_time": "2 days, 21:27:14", "remaining_time": "4 days, 2:33:08", "throughput": 2723.02, "total_tokens": 680848000} {"current_steps": 3777, "total_steps": 9134, "loss": 0.6552, "learning_rate": 3.17096330622317e-05, "epoch": 0.41347601193245576, "percentage": 41.35, "elapsed_time": "2 days, 21:28:20", "remaining_time": "4 days, 2:32:03", "throughput": 2722.99, "total_tokens": 681023168} {"current_steps": 3778, "total_steps": 9134, "loss": 0.5491, "learning_rate": 3.170134951253755e-05, "epoch": 0.4135854840033936, "percentage": 41.36, "elapsed_time": "2 days, 21:29:29", "remaining_time": "4 days, 2:31:01", "throughput": 2723.05, "total_tokens": 681224096} {"current_steps": 3779, "total_steps": 9134, "loss": 0.7226, "learning_rate": 3.169306517008656e-05, "epoch": 0.41369495607433154, "percentage": 41.37, "elapsed_time": "2 days, 21:30:32", "remaining_time": "4 days, 2:29:49", "throughput": 2723.0, "total_tokens": 681381120} {"current_steps": 3780, "total_steps": 9134, "loss": 0.7341, "learning_rate": 3.168478003585876e-05, "epoch": 0.41380442814526947, "percentage": 41.38, "elapsed_time": "2 days, 21:31:39", "remaining_time": "4 days, 2:28:44", "throughput": 2723.1, "total_tokens": 681590336} {"current_steps": 3781, "total_steps": 9134, "loss": 0.6995, "learning_rate": 3.167649411083425e-05, "epoch": 0.41391390021620733, "percentage": 41.39, "elapsed_time": "2 days, 21:32:46", "remaining_time": "4 days, 2:27:39", "throughput": 2723.17, "total_tokens": 681790144} {"current_steps": 3782, "total_steps": 9134, "loss": 0.7427, "learning_rate": 3.1668207395993265e-05, "epoch": 0.41402337228714525, "percentage": 41.41, "elapsed_time": "2 days, 21:33:55", "remaining_time": "4 days, 2:26:37", "throughput": 2723.18, "total_tokens": 681982112} {"current_steps": 3783, "total_steps": 9134, "loss": 0.8465, "learning_rate": 3.1659919892316084e-05, "epoch": 0.4141328443580831, "percentage": 41.42, "elapsed_time": "2 days, 21:35:03", "remaining_time": "4 days, 2:25:33", "throughput": 2723.25, "total_tokens": 682182816} {"current_steps": 3784, "total_steps": 9134, "loss": 0.7725, "learning_rate": 3.1651631600783114e-05, "epoch": 0.41424231642902104, "percentage": 41.43, "elapsed_time": "2 days, 21:36:08", "remaining_time": "4 days, 2:24:25", "throughput": 2723.26, "total_tokens": 682361792} {"current_steps": 3785, "total_steps": 9134, "loss": 0.8713, "learning_rate": 3.164334252237484e-05, "epoch": 0.41435178849995896, "percentage": 41.44, "elapsed_time": "2 days, 21:37:12", "remaining_time": "4 days, 2:23:16", "throughput": 2723.3, "total_tokens": 682547712} {"current_steps": 3786, "total_steps": 9134, "loss": 0.6638, "learning_rate": 3.163505265807185e-05, "epoch": 0.41446126057089683, "percentage": 41.45, "elapsed_time": "2 days, 21:38:17", "remaining_time": "4 days, 2:22:09", "throughput": 2723.34, "total_tokens": 682734976} {"current_steps": 3787, "total_steps": 9134, "loss": 0.584, "learning_rate": 3.162676200885481e-05, "epoch": 0.41457073264183475, "percentage": 41.46, "elapsed_time": "2 days, 21:39:23", "remaining_time": "4 days, 2:21:02", "throughput": 2723.31, "total_tokens": 682907680} {"current_steps": 3788, "total_steps": 9134, "loss": 0.7333, "learning_rate": 3.161847057570449e-05, "epoch": 0.41468020471277267, "percentage": 41.47, "elapsed_time": "2 days, 21:40:32", "remaining_time": "4 days, 2:19:59", "throughput": 2723.32, "total_tokens": 683095392} {"current_steps": 3789, "total_steps": 9134, "loss": 0.6066, "learning_rate": 3.161017835960176e-05, "epoch": 0.41478967678371054, "percentage": 41.48, "elapsed_time": "2 days, 21:41:37", "remaining_time": "4 days, 2:18:51", "throughput": 2723.28, "total_tokens": 683264736} {"current_steps": 3790, "total_steps": 9134, "loss": 0.6242, "learning_rate": 3.160188536152756e-05, "epoch": 0.41489914885464846, "percentage": 41.49, "elapsed_time": "2 days, 21:42:43", "remaining_time": "4 days, 2:17:45", "throughput": 2723.27, "total_tokens": 683442592} {"current_steps": 3791, "total_steps": 9134, "loss": 0.7106, "learning_rate": 3.159359158246294e-05, "epoch": 0.4150086209255864, "percentage": 41.5, "elapsed_time": "2 days, 21:43:52", "remaining_time": "4 days, 2:16:42", "throughput": 2723.23, "total_tokens": 683619776} {"current_steps": 3792, "total_steps": 9134, "loss": 0.7449, "learning_rate": 3.158529702338905e-05, "epoch": 0.41511809299652425, "percentage": 41.52, "elapsed_time": "2 days, 21:45:00", "remaining_time": "4 days, 2:15:39", "throughput": 2723.27, "total_tokens": 683815328} {"current_steps": 3793, "total_steps": 9134, "loss": 0.6822, "learning_rate": 3.157700168528711e-05, "epoch": 0.41522756506746217, "percentage": 41.53, "elapsed_time": "2 days, 21:46:05", "remaining_time": "4 days, 2:14:30", "throughput": 2723.26, "total_tokens": 683987136} {"current_steps": 3794, "total_steps": 9134, "loss": 0.7657, "learning_rate": 3.156870556913844e-05, "epoch": 0.4153370371384001, "percentage": 41.54, "elapsed_time": "2 days, 21:47:10", "remaining_time": "4 days, 2:13:23", "throughput": 2723.26, "total_tokens": 684166560} {"current_steps": 3795, "total_steps": 9134, "loss": 0.7369, "learning_rate": 3.156040867592446e-05, "epoch": 0.41544650920933796, "percentage": 41.55, "elapsed_time": "2 days, 21:48:19", "remaining_time": "4 days, 2:12:20", "throughput": 2723.31, "total_tokens": 684366368} {"current_steps": 3796, "total_steps": 9134, "loss": 0.7325, "learning_rate": 3.155211100662668e-05, "epoch": 0.4155559812802759, "percentage": 41.56, "elapsed_time": "2 days, 21:49:25", "remaining_time": "4 days, 2:11:14", "throughput": 2723.36, "total_tokens": 684557888} {"current_steps": 3797, "total_steps": 9134, "loss": 0.6887, "learning_rate": 3.1543812562226685e-05, "epoch": 0.4156654533512138, "percentage": 41.57, "elapsed_time": "2 days, 21:50:34", "remaining_time": "4 days, 2:10:12", "throughput": 2723.35, "total_tokens": 684743808} {"current_steps": 3798, "total_steps": 9134, "loss": 0.7659, "learning_rate": 3.153551334370617e-05, "epoch": 0.41577492542215166, "percentage": 41.58, "elapsed_time": "2 days, 21:51:43", "remaining_time": "4 days, 2:09:10", "throughput": 2723.44, "total_tokens": 684955264} {"current_steps": 3799, "total_steps": 9134, "loss": 0.8113, "learning_rate": 3.152721335204693e-05, "epoch": 0.4158843974930896, "percentage": 41.59, "elapsed_time": "2 days, 21:52:51", "remaining_time": "4 days, 2:08:05", "throughput": 2723.53, "total_tokens": 685160448} {"current_steps": 3800, "total_steps": 9134, "loss": 0.8624, "learning_rate": 3.151891258823082e-05, "epoch": 0.41599386956402745, "percentage": 41.6, "elapsed_time": "2 days, 21:53:57", "remaining_time": "4 days, 2:06:59", "throughput": 2723.58, "total_tokens": 685354880} {"current_steps": 3801, "total_steps": 9134, "loss": 0.6928, "learning_rate": 3.151061105323982e-05, "epoch": 0.4161033416349654, "percentage": 41.61, "elapsed_time": "2 days, 21:55:03", "remaining_time": "4 days, 2:05:52", "throughput": 2723.55, "total_tokens": 685527808} {"current_steps": 3802, "total_steps": 9134, "loss": 0.4996, "learning_rate": 3.1502308748055975e-05, "epoch": 0.4162128137059033, "percentage": 41.62, "elapsed_time": "2 days, 21:56:11", "remaining_time": "4 days, 2:04:49", "throughput": 2723.53, "total_tokens": 685706112} {"current_steps": 3803, "total_steps": 9134, "loss": 0.9452, "learning_rate": 3.1494005673661445e-05, "epoch": 0.41632228577684116, "percentage": 41.64, "elapsed_time": "2 days, 21:57:20", "remaining_time": "4 days, 2:03:46", "throughput": 2723.46, "total_tokens": 685876800} {"current_steps": 3804, "total_steps": 9134, "loss": 0.885, "learning_rate": 3.1485701831038436e-05, "epoch": 0.4164317578477791, "percentage": 41.65, "elapsed_time": "2 days, 21:58:28", "remaining_time": "4 days, 2:02:42", "throughput": 2723.49, "total_tokens": 686070112} {"current_steps": 3805, "total_steps": 9134, "loss": 0.6188, "learning_rate": 3.147739722116932e-05, "epoch": 0.416541229918717, "percentage": 41.66, "elapsed_time": "2 days, 21:59:33", "remaining_time": "4 days, 2:01:35", "throughput": 2723.46, "total_tokens": 686239456} {"current_steps": 3806, "total_steps": 9134, "loss": 0.6699, "learning_rate": 3.1469091845036486e-05, "epoch": 0.41665070198965487, "percentage": 41.67, "elapsed_time": "2 days, 22:00:40", "remaining_time": "4 days, 2:00:30", "throughput": 2723.49, "total_tokens": 686429632} {"current_steps": 3807, "total_steps": 9134, "loss": 0.6324, "learning_rate": 3.146078570362246e-05, "epoch": 0.4167601740605928, "percentage": 41.68, "elapsed_time": "2 days, 22:01:43", "remaining_time": "4 days, 1:59:18", "throughput": 2723.42, "total_tokens": 686583296} {"current_steps": 3808, "total_steps": 9134, "loss": 0.6235, "learning_rate": 3.145247879790983e-05, "epoch": 0.4168696461315307, "percentage": 41.69, "elapsed_time": "2 days, 22:02:49", "remaining_time": "4 days, 1:58:12", "throughput": 2723.44, "total_tokens": 686768544} {"current_steps": 3809, "total_steps": 9134, "loss": 0.6675, "learning_rate": 3.1444171128881294e-05, "epoch": 0.4169791182024686, "percentage": 41.7, "elapsed_time": "2 days, 22:03:53", "remaining_time": "4 days, 1:57:03", "throughput": 2723.41, "total_tokens": 686935424} {"current_steps": 3810, "total_steps": 9134, "loss": 0.7779, "learning_rate": 3.1435862697519636e-05, "epoch": 0.4170885902734065, "percentage": 41.71, "elapsed_time": "2 days, 22:05:00", "remaining_time": "4 days, 1:55:59", "throughput": 2723.44, "total_tokens": 687126272} {"current_steps": 3811, "total_steps": 9134, "loss": 0.949, "learning_rate": 3.142755350480772e-05, "epoch": 0.4171980623443444, "percentage": 41.72, "elapsed_time": "2 days, 22:06:06", "remaining_time": "4 days, 1:54:51", "throughput": 2723.41, "total_tokens": 687296064} {"current_steps": 3812, "total_steps": 9134, "loss": 0.5468, "learning_rate": 3.1419243551728513e-05, "epoch": 0.4173075344152823, "percentage": 41.73, "elapsed_time": "2 days, 22:07:06", "remaining_time": "4 days, 1:53:37", "throughput": 2723.35, "total_tokens": 687445472} {"current_steps": 3813, "total_steps": 9134, "loss": 0.5563, "learning_rate": 3.141093283926506e-05, "epoch": 0.4174170064862202, "percentage": 41.75, "elapsed_time": "2 days, 22:08:12", "remaining_time": "4 days, 1:52:30", "throughput": 2723.3, "total_tokens": 687612352} {"current_steps": 3814, "total_steps": 9134, "loss": 0.6637, "learning_rate": 3.140262136840052e-05, "epoch": 0.41752647855715813, "percentage": 41.76, "elapsed_time": "2 days, 22:09:17", "remaining_time": "4 days, 1:51:23", "throughput": 2723.33, "total_tokens": 687798720} {"current_steps": 3815, "total_steps": 9134, "loss": 0.6875, "learning_rate": 3.1394309140118104e-05, "epoch": 0.417635950628096, "percentage": 41.77, "elapsed_time": "2 days, 22:10:26", "remaining_time": "4 days, 1:50:19", "throughput": 2723.44, "total_tokens": 688012416} {"current_steps": 3816, "total_steps": 9134, "loss": 0.783, "learning_rate": 3.138599615540114e-05, "epoch": 0.4177454226990339, "percentage": 41.78, "elapsed_time": "2 days, 22:11:28", "remaining_time": "4 days, 1:49:07", "throughput": 2723.4, "total_tokens": 688170336} {"current_steps": 3817, "total_steps": 9134, "loss": 0.7636, "learning_rate": 3.137768241523305e-05, "epoch": 0.4178548947699718, "percentage": 41.79, "elapsed_time": "2 days, 22:12:34", "remaining_time": "4 days, 1:48:02", "throughput": 2723.38, "total_tokens": 688346624} {"current_steps": 3818, "total_steps": 9134, "loss": 0.7487, "learning_rate": 3.1369367920597306e-05, "epoch": 0.4179643668409097, "percentage": 41.8, "elapsed_time": "2 days, 22:13:42", "remaining_time": "4 days, 1:46:58", "throughput": 2723.44, "total_tokens": 688548000} {"current_steps": 3819, "total_steps": 9134, "loss": 0.6415, "learning_rate": 3.136105267247752e-05, "epoch": 0.41807383891184763, "percentage": 41.81, "elapsed_time": "2 days, 22:14:42", "remaining_time": "4 days, 1:45:43", "throughput": 2723.41, "total_tokens": 688703232} {"current_steps": 3820, "total_steps": 9134, "loss": 0.6731, "learning_rate": 3.1352736671857366e-05, "epoch": 0.4181833109827855, "percentage": 41.82, "elapsed_time": "2 days, 22:15:52", "remaining_time": "4 days, 1:44:41", "throughput": 2723.45, "total_tokens": 688902816} {"current_steps": 3821, "total_steps": 9134, "loss": 0.7449, "learning_rate": 3.13444199197206e-05, "epoch": 0.4182927830537234, "percentage": 41.83, "elapsed_time": "2 days, 22:16:57", "remaining_time": "4 days, 1:43:34", "throughput": 2723.39, "total_tokens": 689065440} {"current_steps": 3822, "total_steps": 9134, "loss": 0.7958, "learning_rate": 3.13361024170511e-05, "epoch": 0.41840225512466134, "percentage": 41.84, "elapsed_time": "2 days, 22:18:06", "remaining_time": "4 days, 1:42:32", "throughput": 2723.52, "total_tokens": 689287424} {"current_steps": 3823, "total_steps": 9134, "loss": 0.7449, "learning_rate": 3.1327784164832786e-05, "epoch": 0.4185117271955992, "percentage": 41.85, "elapsed_time": "2 days, 22:19:15", "remaining_time": "4 days, 1:41:28", "throughput": 2723.61, "total_tokens": 689496864} {"current_steps": 3824, "total_steps": 9134, "loss": 0.4806, "learning_rate": 3.13194651640497e-05, "epoch": 0.4186211992665371, "percentage": 41.87, "elapsed_time": "2 days, 22:20:22", "remaining_time": "4 days, 1:40:24", "throughput": 2723.65, "total_tokens": 689688160} {"current_steps": 3825, "total_steps": 9134, "loss": 0.7647, "learning_rate": 3.1311145415685975e-05, "epoch": 0.41873067133747505, "percentage": 41.88, "elapsed_time": "2 days, 22:21:23", "remaining_time": "4 days, 1:39:10", "throughput": 2723.58, "total_tokens": 689836672} {"current_steps": 3826, "total_steps": 9134, "loss": 0.6736, "learning_rate": 3.13028249207258e-05, "epoch": 0.4188401434084129, "percentage": 41.89, "elapsed_time": "2 days, 22:22:32", "remaining_time": "4 days, 1:38:07", "throughput": 2723.65, "total_tokens": 690042080} {"current_steps": 3827, "total_steps": 9134, "loss": 0.6007, "learning_rate": 3.1294503680153496e-05, "epoch": 0.41894961547935083, "percentage": 41.9, "elapsed_time": "2 days, 22:23:40", "remaining_time": "4 days, 1:37:05", "throughput": 2723.68, "total_tokens": 690237408} {"current_steps": 3828, "total_steps": 9134, "loss": 0.7314, "learning_rate": 3.128618169495344e-05, "epoch": 0.41905908755028876, "percentage": 41.91, "elapsed_time": "2 days, 22:24:46", "remaining_time": "4 days, 1:35:58", "throughput": 2723.75, "total_tokens": 690433408} {"current_steps": 3829, "total_steps": 9134, "loss": 0.7765, "learning_rate": 3.1277858966110105e-05, "epoch": 0.4191685596212266, "percentage": 41.92, "elapsed_time": "2 days, 22:25:53", "remaining_time": "4 days, 1:34:52", "throughput": 2723.71, "total_tokens": 690605440} {"current_steps": 3830, "total_steps": 9134, "loss": 0.7089, "learning_rate": 3.126953549460805e-05, "epoch": 0.41927803169216454, "percentage": 41.93, "elapsed_time": "2 days, 22:27:01", "remaining_time": "4 days, 1:33:48", "throughput": 2723.77, "total_tokens": 690805920} {"current_steps": 3831, "total_steps": 9134, "loss": 0.7027, "learning_rate": 3.126121128143194e-05, "epoch": 0.41938750376310246, "percentage": 41.94, "elapsed_time": "2 days, 22:28:07", "remaining_time": "4 days, 1:32:42", "throughput": 2723.8, "total_tokens": 690992960} {"current_steps": 3832, "total_steps": 9134, "loss": 0.9494, "learning_rate": 3.1252886327566494e-05, "epoch": 0.41949697583404033, "percentage": 41.95, "elapsed_time": "2 days, 22:29:15", "remaining_time": "4 days, 1:31:39", "throughput": 2723.81, "total_tokens": 691183136} {"current_steps": 3833, "total_steps": 9134, "loss": 0.5754, "learning_rate": 3.124456063399656e-05, "epoch": 0.41960644790497825, "percentage": 41.96, "elapsed_time": "2 days, 22:30:21", "remaining_time": "4 days, 1:30:32", "throughput": 2723.75, "total_tokens": 691346656} {"current_steps": 3834, "total_steps": 9134, "loss": 0.7342, "learning_rate": 3.123623420170703e-05, "epoch": 0.4197159199759161, "percentage": 41.98, "elapsed_time": "2 days, 22:31:27", "remaining_time": "4 days, 1:29:25", "throughput": 2723.75, "total_tokens": 691525184} {"current_steps": 3835, "total_steps": 9134, "loss": 0.8273, "learning_rate": 3.122790703168292e-05, "epoch": 0.41982539204685404, "percentage": 41.99, "elapsed_time": "2 days, 22:32:33", "remaining_time": "4 days, 1:28:19", "throughput": 2723.81, "total_tokens": 691719392} {"current_steps": 3836, "total_steps": 9134, "loss": 0.6077, "learning_rate": 3.1219579124909324e-05, "epoch": 0.41993486411779196, "percentage": 42.0, "elapsed_time": "2 days, 22:33:41", "remaining_time": "4 days, 1:27:16", "throughput": 2723.86, "total_tokens": 691919424} {"current_steps": 3837, "total_steps": 9134, "loss": 0.6405, "learning_rate": 3.121125048237139e-05, "epoch": 0.4200443361887298, "percentage": 42.01, "elapsed_time": "2 days, 22:34:51", "remaining_time": "4 days, 1:26:14", "throughput": 2723.78, "total_tokens": 692089664} {"current_steps": 3838, "total_steps": 9134, "loss": 0.7296, "learning_rate": 3.120292110505441e-05, "epoch": 0.42015380825966775, "percentage": 42.02, "elapsed_time": "2 days, 22:35:57", "remaining_time": "4 days, 1:25:08", "throughput": 2723.8, "total_tokens": 692274464} {"current_steps": 3839, "total_steps": 9134, "loss": 0.8796, "learning_rate": 3.119459099394372e-05, "epoch": 0.42026328033060567, "percentage": 42.03, "elapsed_time": "2 days, 22:37:06", "remaining_time": "4 days, 1:24:05", "throughput": 2723.87, "total_tokens": 692481216} {"current_steps": 3840, "total_steps": 9134, "loss": 0.5522, "learning_rate": 3.1186260150024755e-05, "epoch": 0.42037275240154354, "percentage": 42.04, "elapsed_time": "2 days, 22:38:13", "remaining_time": "4 days, 1:23:00", "throughput": 2723.83, "total_tokens": 692651456} {"current_steps": 3841, "total_steps": 9134, "loss": 0.5941, "learning_rate": 3.117792857428304e-05, "epoch": 0.42048222447248146, "percentage": 42.05, "elapsed_time": "2 days, 22:39:20", "remaining_time": "4 days, 1:21:55", "throughput": 2723.85, "total_tokens": 692840960} {"current_steps": 3842, "total_steps": 9134, "loss": 0.5999, "learning_rate": 3.116959626770418e-05, "epoch": 0.4205916965434194, "percentage": 42.06, "elapsed_time": "2 days, 22:40:26", "remaining_time": "4 days, 1:20:49", "throughput": 2723.82, "total_tokens": 693013664} {"current_steps": 3843, "total_steps": 9134, "loss": 0.7621, "learning_rate": 3.1161263231273884e-05, "epoch": 0.42070116861435725, "percentage": 42.07, "elapsed_time": "2 days, 22:41:36", "remaining_time": "4 days, 1:19:47", "throughput": 2723.83, "total_tokens": 693204960} {"current_steps": 3844, "total_steps": 9134, "loss": 0.7009, "learning_rate": 3.115292946597793e-05, "epoch": 0.42081064068529517, "percentage": 42.08, "elapsed_time": "2 days, 22:42:39", "remaining_time": "4 days, 1:18:37", "throughput": 2723.81, "total_tokens": 693371392} {"current_steps": 3845, "total_steps": 9134, "loss": 0.6409, "learning_rate": 3.1144594972802165e-05, "epoch": 0.4209201127562331, "percentage": 42.1, "elapsed_time": "2 days, 22:43:42", "remaining_time": "4 days, 1:17:27", "throughput": 2723.81, "total_tokens": 693544096} {"current_steps": 3846, "total_steps": 9134, "loss": 0.9093, "learning_rate": 3.1136259752732576e-05, "epoch": 0.42102958482717096, "percentage": 42.11, "elapsed_time": "2 days, 22:44:50", "remaining_time": "4 days, 1:16:22", "throughput": 2723.83, "total_tokens": 693732704} {"current_steps": 3847, "total_steps": 9134, "loss": 0.6878, "learning_rate": 3.112792380675519e-05, "epoch": 0.4211390568981089, "percentage": 42.12, "elapsed_time": "2 days, 22:45:50", "remaining_time": "4 days, 1:15:08", "throughput": 2723.72, "total_tokens": 693868000} {"current_steps": 3848, "total_steps": 9134, "loss": 0.5781, "learning_rate": 3.111958713585612e-05, "epoch": 0.4212485289690468, "percentage": 42.13, "elapsed_time": "2 days, 22:46:55", "remaining_time": "4 days, 1:14:00", "throughput": 2723.74, "total_tokens": 694052800} {"current_steps": 3849, "total_steps": 9134, "loss": 0.6043, "learning_rate": 3.1111249741021606e-05, "epoch": 0.42135800103998466, "percentage": 42.14, "elapsed_time": "2 days, 22:48:01", "remaining_time": "4 days, 1:12:53", "throughput": 2723.77, "total_tokens": 694238272} {"current_steps": 3850, "total_steps": 9134, "loss": 0.5407, "learning_rate": 3.110291162323792e-05, "epoch": 0.4214674731109226, "percentage": 42.15, "elapsed_time": "2 days, 22:49:05", "remaining_time": "4 days, 1:11:44", "throughput": 2723.78, "total_tokens": 694416128} {"current_steps": 3851, "total_steps": 9134, "loss": 0.678, "learning_rate": 3.109457278349145e-05, "epoch": 0.42157694518186045, "percentage": 42.16, "elapsed_time": "2 days, 22:50:11", "remaining_time": "4 days, 1:10:37", "throughput": 2723.86, "total_tokens": 694615040} {"current_steps": 3852, "total_steps": 9134, "loss": 0.6687, "learning_rate": 3.108623322276868e-05, "epoch": 0.4216864172527984, "percentage": 42.17, "elapsed_time": "2 days, 22:51:17", "remaining_time": "4 days, 1:09:31", "throughput": 2723.88, "total_tokens": 694802080} {"current_steps": 3853, "total_steps": 9134, "loss": 0.657, "learning_rate": 3.1077892942056153e-05, "epoch": 0.4217958893237363, "percentage": 42.18, "elapsed_time": "2 days, 22:52:21", "remaining_time": "4 days, 1:08:21", "throughput": 2723.84, "total_tokens": 694962912} {"current_steps": 3854, "total_steps": 9134, "loss": 0.7479, "learning_rate": 3.106955194234051e-05, "epoch": 0.42190536139467416, "percentage": 42.19, "elapsed_time": "2 days, 22:53:25", "remaining_time": "4 days, 1:07:12", "throughput": 2723.85, "total_tokens": 695140544} {"current_steps": 3855, "total_steps": 9134, "loss": 0.6215, "learning_rate": 3.106121022460847e-05, "epoch": 0.4220148334656121, "percentage": 42.2, "elapsed_time": "2 days, 22:54:28", "remaining_time": "4 days, 1:06:02", "throughput": 2723.84, "total_tokens": 695310336} {"current_steps": 3856, "total_steps": 9134, "loss": 0.7586, "learning_rate": 3.105286778984686e-05, "epoch": 0.42212430553655, "percentage": 42.22, "elapsed_time": "2 days, 22:55:34", "remaining_time": "4 days, 1:04:55", "throughput": 2723.9, "total_tokens": 695505664} {"current_steps": 3857, "total_steps": 9134, "loss": 0.8825, "learning_rate": 3.104452463904255e-05, "epoch": 0.42223377760748787, "percentage": 42.23, "elapsed_time": "2 days, 22:56:41", "remaining_time": "4 days, 1:03:50", "throughput": 2723.95, "total_tokens": 695699424} {"current_steps": 3858, "total_steps": 9134, "loss": 0.676, "learning_rate": 3.1036180773182535e-05, "epoch": 0.4223432496784258, "percentage": 42.24, "elapsed_time": "2 days, 22:57:46", "remaining_time": "4 days, 1:02:42", "throughput": 2724.01, "total_tokens": 695893632} {"current_steps": 3859, "total_steps": 9134, "loss": 0.6713, "learning_rate": 3.1027836193253874e-05, "epoch": 0.4224527217493637, "percentage": 42.25, "elapsed_time": "2 days, 22:58:51", "remaining_time": "4 days, 1:01:35", "throughput": 2724.02, "total_tokens": 696073504} {"current_steps": 3860, "total_steps": 9134, "loss": 0.7296, "learning_rate": 3.1019490900243716e-05, "epoch": 0.4225621938203016, "percentage": 42.26, "elapsed_time": "2 days, 22:59:59", "remaining_time": "4 days, 1:00:31", "throughput": 2724.06, "total_tokens": 696268832} {"current_steps": 3861, "total_steps": 9134, "loss": 0.8261, "learning_rate": 3.101114489513929e-05, "epoch": 0.4226716658912395, "percentage": 42.27, "elapsed_time": "2 days, 23:01:06", "remaining_time": "4 days, 0:59:25", "throughput": 2723.99, "total_tokens": 696430784} {"current_steps": 3862, "total_steps": 9134, "loss": 0.7216, "learning_rate": 3.100279817892792e-05, "epoch": 0.4227811379621774, "percentage": 42.28, "elapsed_time": "2 days, 23:02:11", "remaining_time": "4 days, 0:58:17", "throughput": 2723.97, "total_tokens": 696604160} {"current_steps": 3863, "total_steps": 9134, "loss": 0.7855, "learning_rate": 3.099445075259698e-05, "epoch": 0.4228906100331153, "percentage": 42.29, "elapsed_time": "2 days, 23:03:16", "remaining_time": "4 days, 0:57:10", "throughput": 2723.95, "total_tokens": 696777984} {"current_steps": 3864, "total_steps": 9134, "loss": 0.7956, "learning_rate": 3.098610261713399e-05, "epoch": 0.4230000821040532, "percentage": 42.3, "elapsed_time": "2 days, 23:04:24", "remaining_time": "4 days, 0:56:05", "throughput": 2724.01, "total_tokens": 696976448} {"current_steps": 3865, "total_steps": 9134, "loss": 0.7307, "learning_rate": 3.0977753773526505e-05, "epoch": 0.42310955417499113, "percentage": 42.31, "elapsed_time": "2 days, 23:05:27", "remaining_time": "4 days, 0:54:55", "throughput": 2723.99, "total_tokens": 697142880} {"current_steps": 3866, "total_steps": 9134, "loss": 0.9007, "learning_rate": 3.096940422276218e-05, "epoch": 0.423219026245929, "percentage": 42.33, "elapsed_time": "2 days, 23:06:36", "remaining_time": "4 days, 0:53:53", "throughput": 2724.14, "total_tokens": 697370464} {"current_steps": 3867, "total_steps": 9134, "loss": 0.6706, "learning_rate": 3.096105396582874e-05, "epoch": 0.4233284983168669, "percentage": 42.34, "elapsed_time": "2 days, 23:07:36", "remaining_time": "4 days, 0:52:39", "throughput": 2724.03, "total_tokens": 697506880} {"current_steps": 3868, "total_steps": 9134, "loss": 0.8648, "learning_rate": 3.095270300371401e-05, "epoch": 0.4234379703878048, "percentage": 42.35, "elapsed_time": "2 days, 23:08:38", "remaining_time": "4 days, 0:51:27", "throughput": 2724.03, "total_tokens": 697676672} {"current_steps": 3869, "total_steps": 9134, "loss": 0.899, "learning_rate": 3.0944351337405906e-05, "epoch": 0.4235474424587427, "percentage": 42.36, "elapsed_time": "2 days, 23:09:42", "remaining_time": "4 days, 0:50:17", "throughput": 2724.04, "total_tokens": 697852064} {"current_steps": 3870, "total_steps": 9134, "loss": 0.7229, "learning_rate": 3.09359989678924e-05, "epoch": 0.42365691452968063, "percentage": 42.37, "elapsed_time": "2 days, 23:10:48", "remaining_time": "4 days, 0:49:11", "throughput": 2724.01, "total_tokens": 698024992} {"current_steps": 3871, "total_steps": 9134, "loss": 0.797, "learning_rate": 3.092764589616155e-05, "epoch": 0.4237663866006185, "percentage": 42.38, "elapsed_time": "2 days, 23:11:57", "remaining_time": "4 days, 0:48:08", "throughput": 2724.07, "total_tokens": 698227264} {"current_steps": 3872, "total_steps": 9134, "loss": 0.7225, "learning_rate": 3.0919292123201524e-05, "epoch": 0.4238758586715564, "percentage": 42.39, "elapsed_time": "2 days, 23:13:06", "remaining_time": "4 days, 0:47:05", "throughput": 2724.13, "total_tokens": 698429312} {"current_steps": 3873, "total_steps": 9134, "loss": 0.9548, "learning_rate": 3.0910937650000565e-05, "epoch": 0.42398533074249434, "percentage": 42.4, "elapsed_time": "2 days, 23:14:11", "remaining_time": "4 days, 0:45:58", "throughput": 2724.16, "total_tokens": 698615904} {"current_steps": 3874, "total_steps": 9134, "loss": 0.7437, "learning_rate": 3.090258247754698e-05, "epoch": 0.4240948028134322, "percentage": 42.41, "elapsed_time": "2 days, 23:15:16", "remaining_time": "4 days, 0:44:50", "throughput": 2724.01, "total_tokens": 698752992} {"current_steps": 3875, "total_steps": 9134, "loss": 0.6731, "learning_rate": 3.0894226606829166e-05, "epoch": 0.4242042748843701, "percentage": 42.42, "elapsed_time": "2 days, 23:16:22", "remaining_time": "4 days, 0:43:43", "throughput": 2724.05, "total_tokens": 698941824} {"current_steps": 3876, "total_steps": 9134, "loss": 0.783, "learning_rate": 3.088587003883562e-05, "epoch": 0.42431374695530805, "percentage": 42.43, "elapsed_time": "2 days, 23:17:25", "remaining_time": "4 days, 0:42:32", "throughput": 2724.0, "total_tokens": 699101088} {"current_steps": 3877, "total_steps": 9134, "loss": 0.6962, "learning_rate": 3.08775127745549e-05, "epoch": 0.4244232190262459, "percentage": 42.45, "elapsed_time": "2 days, 23:18:33", "remaining_time": "4 days, 0:41:29", "throughput": 2724.0, "total_tokens": 699287680} {"current_steps": 3878, "total_steps": 9134, "loss": 0.7134, "learning_rate": 3.086915481497565e-05, "epoch": 0.42453269109718383, "percentage": 42.46, "elapsed_time": "2 days, 23:19:40", "remaining_time": "4 days, 0:40:23", "throughput": 2724.01, "total_tokens": 699472480} {"current_steps": 3879, "total_steps": 9134, "loss": 0.9097, "learning_rate": 3.08607961610866e-05, "epoch": 0.42464216316812176, "percentage": 42.47, "elapsed_time": "2 days, 23:20:49", "remaining_time": "4 days, 0:39:21", "throughput": 2724.02, "total_tokens": 699663776} {"current_steps": 3880, "total_steps": 9134, "loss": 0.7816, "learning_rate": 3.0852436813876576e-05, "epoch": 0.4247516352390596, "percentage": 42.48, "elapsed_time": "2 days, 23:21:56", "remaining_time": "4 days, 0:38:16", "throughput": 2724.09, "total_tokens": 699862016} {"current_steps": 3881, "total_steps": 9134, "loss": 0.5213, "learning_rate": 3.084407677433447e-05, "epoch": 0.42486110730999754, "percentage": 42.49, "elapsed_time": "2 days, 23:23:02", "remaining_time": "4 days, 0:37:10", "throughput": 2724.08, "total_tokens": 700039872} {"current_steps": 3882, "total_steps": 9134, "loss": 0.8626, "learning_rate": 3.083571604344925e-05, "epoch": 0.42497057938093546, "percentage": 42.5, "elapsed_time": "2 days, 23:24:10", "remaining_time": "4 days, 0:36:05", "throughput": 2724.05, "total_tokens": 700217952} {"current_steps": 3883, "total_steps": 9134, "loss": 0.6128, "learning_rate": 3.0827354622209976e-05, "epoch": 0.42508005145187333, "percentage": 42.51, "elapsed_time": "2 days, 23:25:12", "remaining_time": "4 days, 0:34:54", "throughput": 2724.0, "total_tokens": 700375648} {"current_steps": 3884, "total_steps": 9134, "loss": 0.8852, "learning_rate": 3.081899251160578e-05, "epoch": 0.42518952352281125, "percentage": 42.52, "elapsed_time": "2 days, 23:26:16", "remaining_time": "4 days, 0:33:44", "throughput": 2724.01, "total_tokens": 700551936} {"current_steps": 3885, "total_steps": 9134, "loss": 0.9995, "learning_rate": 3.081062971262591e-05, "epoch": 0.4252989955937491, "percentage": 42.53, "elapsed_time": "2 days, 23:27:24", "remaining_time": "4 days, 0:32:41", "throughput": 2724.02, "total_tokens": 700739200} {"current_steps": 3886, "total_steps": 9134, "loss": 0.765, "learning_rate": 3.080226622625964e-05, "epoch": 0.42540846766468704, "percentage": 42.54, "elapsed_time": "2 days, 23:28:33", "remaining_time": "4 days, 0:31:39", "throughput": 2724.02, "total_tokens": 700926912} {"current_steps": 3887, "total_steps": 9134, "loss": 0.5215, "learning_rate": 3.0793902053496374e-05, "epoch": 0.42551793973562496, "percentage": 42.56, "elapsed_time": "2 days, 23:29:38", "remaining_time": "4 days, 0:30:31", "throughput": 2724.03, "total_tokens": 701108576} {"current_steps": 3888, "total_steps": 9134, "loss": 0.8893, "learning_rate": 3.0785537195325574e-05, "epoch": 0.4256274118065628, "percentage": 42.57, "elapsed_time": "2 days, 23:30:46", "remaining_time": "4 days, 0:29:27", "throughput": 2724.11, "total_tokens": 701314208} {"current_steps": 3889, "total_steps": 9134, "loss": 0.7126, "learning_rate": 3.0777171652736784e-05, "epoch": 0.42573688387750075, "percentage": 42.58, "elapsed_time": "2 days, 23:31:52", "remaining_time": "4 days, 0:28:21", "throughput": 2724.12, "total_tokens": 701495872} {"current_steps": 3890, "total_steps": 9134, "loss": 0.5699, "learning_rate": 3.076880542671963e-05, "epoch": 0.42584635594843867, "percentage": 42.59, "elapsed_time": "2 days, 23:33:01", "remaining_time": "4 days, 0:27:18", "throughput": 2724.2, "total_tokens": 701705088} {"current_steps": 3891, "total_steps": 9134, "loss": 0.7596, "learning_rate": 3.0760438518263826e-05, "epoch": 0.42595582801937654, "percentage": 42.6, "elapsed_time": "2 days, 23:34:05", "remaining_time": "4 days, 0:26:09", "throughput": 2724.18, "total_tokens": 701872416} {"current_steps": 3892, "total_steps": 9134, "loss": 0.7499, "learning_rate": 3.0752070928359147e-05, "epoch": 0.42606530009031446, "percentage": 42.61, "elapsed_time": "2 days, 23:35:11", "remaining_time": "4 days, 0:25:02", "throughput": 2724.14, "total_tokens": 702043104} {"current_steps": 3893, "total_steps": 9134, "loss": 0.7803, "learning_rate": 3.0743702657995475e-05, "epoch": 0.4261747721612524, "percentage": 42.62, "elapsed_time": "2 days, 23:36:14", "remaining_time": "4 days, 0:23:52", "throughput": 2724.15, "total_tokens": 702218272} {"current_steps": 3894, "total_steps": 9134, "loss": 0.462, "learning_rate": 3.0735333708162763e-05, "epoch": 0.42628424423219025, "percentage": 42.63, "elapsed_time": "2 days, 23:37:19", "remaining_time": "4 days, 0:22:44", "throughput": 2724.2, "total_tokens": 702406432} {"current_steps": 3895, "total_steps": 9134, "loss": 0.568, "learning_rate": 3.0726964079851037e-05, "epoch": 0.42639371630312817, "percentage": 42.64, "elapsed_time": "2 days, 23:38:24", "remaining_time": "4 days, 0:21:36", "throughput": 2724.23, "total_tokens": 702590112} {"current_steps": 3896, "total_steps": 9134, "loss": 0.8496, "learning_rate": 3.071859377405041e-05, "epoch": 0.4265031883740661, "percentage": 42.65, "elapsed_time": "2 days, 23:39:32", "remaining_time": "4 days, 0:20:32", "throughput": 2724.3, "total_tokens": 702793280} {"current_steps": 3897, "total_steps": 9134, "loss": 0.8331, "learning_rate": 3.071022279175107e-05, "epoch": 0.42661266044500396, "percentage": 42.66, "elapsed_time": "2 days, 23:40:38", "remaining_time": "4 days, 0:19:26", "throughput": 2724.33, "total_tokens": 702982560} {"current_steps": 3898, "total_steps": 9134, "loss": 0.6637, "learning_rate": 3.070185113394329e-05, "epoch": 0.4267221325159419, "percentage": 42.68, "elapsed_time": "2 days, 23:41:45", "remaining_time": "4 days, 0:18:21", "throughput": 2724.3, "total_tokens": 703158400} {"current_steps": 3899, "total_steps": 9134, "loss": 0.5959, "learning_rate": 3.069347880161741e-05, "epoch": 0.4268316045868798, "percentage": 42.69, "elapsed_time": "2 days, 23:42:51", "remaining_time": "4 days, 0:17:13", "throughput": 2724.32, "total_tokens": 703340288} {"current_steps": 3900, "total_steps": 9134, "loss": 0.6411, "learning_rate": 3.068510579576389e-05, "epoch": 0.42694107665781766, "percentage": 42.7, "elapsed_time": "2 days, 23:43:55", "remaining_time": "4 days, 0:16:05", "throughput": 2724.32, "total_tokens": 703516576} {"current_steps": 3901, "total_steps": 9134, "loss": 0.6541, "learning_rate": 3.067673211737321e-05, "epoch": 0.4270505487287556, "percentage": 42.71, "elapsed_time": "2 days, 23:44:56", "remaining_time": "4 days, 0:14:51", "throughput": 2724.23, "total_tokens": 703659488} {"current_steps": 3902, "total_steps": 9134, "loss": 0.7273, "learning_rate": 3.066835776743598e-05, "epoch": 0.42716002079969345, "percentage": 42.72, "elapsed_time": "2 days, 23:46:03", "remaining_time": "4 days, 0:13:47", "throughput": 2724.28, "total_tokens": 703854368} {"current_steps": 3903, "total_steps": 9134, "loss": 0.5986, "learning_rate": 3.0659982746942864e-05, "epoch": 0.4272694928706314, "percentage": 42.73, "elapsed_time": "2 days, 23:47:08", "remaining_time": "4 days, 0:12:39", "throughput": 2724.28, "total_tokens": 704032672} {"current_steps": 3904, "total_steps": 9134, "loss": 0.7118, "learning_rate": 3.065160705688461e-05, "epoch": 0.4273789649415693, "percentage": 42.74, "elapsed_time": "2 days, 23:48:14", "remaining_time": "4 days, 0:11:32", "throughput": 2724.27, "total_tokens": 704210080} {"current_steps": 3905, "total_steps": 9134, "loss": 0.7934, "learning_rate": 3.064323069825203e-05, "epoch": 0.42748843701250716, "percentage": 42.75, "elapsed_time": "2 days, 23:49:21", "remaining_time": "4 days, 0:10:27", "throughput": 2724.26, "total_tokens": 704389728} {"current_steps": 3906, "total_steps": 9134, "loss": 0.764, "learning_rate": 3.0634853672036054e-05, "epoch": 0.4275979090834451, "percentage": 42.76, "elapsed_time": "2 days, 23:50:30", "remaining_time": "4 days, 0:09:24", "throughput": 2724.33, "total_tokens": 704595360} {"current_steps": 3907, "total_steps": 9134, "loss": 0.7848, "learning_rate": 3.0626475979227665e-05, "epoch": 0.427707381154383, "percentage": 42.77, "elapsed_time": "2 days, 23:51:37", "remaining_time": "4 days, 0:08:19", "throughput": 2724.35, "total_tokens": 704781504} {"current_steps": 3908, "total_steps": 9134, "loss": 0.923, "learning_rate": 3.061809762081792e-05, "epoch": 0.42781685322532087, "percentage": 42.79, "elapsed_time": "2 days, 23:52:45", "remaining_time": "4 days, 0:07:15", "throughput": 2724.45, "total_tokens": 704993184} {"current_steps": 3909, "total_steps": 9134, "loss": 0.7028, "learning_rate": 3.060971859779797e-05, "epoch": 0.4279263252962588, "percentage": 42.8, "elapsed_time": "2 days, 23:53:50", "remaining_time": "4 days, 0:06:08", "throughput": 2724.51, "total_tokens": 705187168} {"current_steps": 3910, "total_steps": 9134, "loss": 0.8451, "learning_rate": 3.060133891115903e-05, "epoch": 0.4280357973671967, "percentage": 42.81, "elapsed_time": "2 days, 23:55:00", "remaining_time": "4 days, 0:05:06", "throughput": 2724.54, "total_tokens": 705384960} {"current_steps": 3911, "total_steps": 9134, "loss": 0.5343, "learning_rate": 3.059295856189241e-05, "epoch": 0.4281452694381346, "percentage": 42.82, "elapsed_time": "2 days, 23:56:07", "remaining_time": "4 days, 0:04:01", "throughput": 2724.56, "total_tokens": 705570432} {"current_steps": 3912, "total_steps": 9134, "loss": 0.9712, "learning_rate": 3.058457755098948e-05, "epoch": 0.4282547415090725, "percentage": 42.83, "elapsed_time": "2 days, 23:57:16", "remaining_time": "4 days, 0:02:58", "throughput": 2724.57, "total_tokens": 705762176} {"current_steps": 3913, "total_steps": 9134, "loss": 0.5657, "learning_rate": 3.05761958794417e-05, "epoch": 0.4283642135800104, "percentage": 42.84, "elapsed_time": "2 days, 23:58:22", "remaining_time": "4 days, 0:01:52", "throughput": 2724.55, "total_tokens": 705937120} {"current_steps": 3914, "total_steps": 9134, "loss": 0.6916, "learning_rate": 3.056781354824061e-05, "epoch": 0.4284736856509483, "percentage": 42.85, "elapsed_time": "2 days, 23:59:25", "remaining_time": "4 days, 0:00:42", "throughput": 2724.49, "total_tokens": 706093920} {"current_steps": 3915, "total_steps": 9134, "loss": 0.6702, "learning_rate": 3.055943055837782e-05, "epoch": 0.4285831577218862, "percentage": 42.86, "elapsed_time": "3 days, 0:00:30", "remaining_time": "3 days, 23:59:33", "throughput": 2724.55, "total_tokens": 706283872} {"current_steps": 3916, "total_steps": 9134, "loss": 0.7949, "learning_rate": 3.055104691084502e-05, "epoch": 0.42869262979282413, "percentage": 42.87, "elapsed_time": "3 days, 0:01:37", "remaining_time": "3 days, 23:58:29", "throughput": 2724.59, "total_tokens": 706478752} {"current_steps": 3917, "total_steps": 9134, "loss": 0.7404, "learning_rate": 3.054266260663399e-05, "epoch": 0.428802101863762, "percentage": 42.88, "elapsed_time": "3 days, 0:02:39", "remaining_time": "3 days, 23:57:16", "throughput": 2724.57, "total_tokens": 706641152} {"current_steps": 3918, "total_steps": 9134, "loss": 0.5111, "learning_rate": 3.0534277646736564e-05, "epoch": 0.4289115739346999, "percentage": 42.89, "elapsed_time": "3 days, 0:03:44", "remaining_time": "3 days, 23:56:09", "throughput": 2724.56, "total_tokens": 706818336} {"current_steps": 3919, "total_steps": 9134, "loss": 0.7979, "learning_rate": 3.052589203214467e-05, "epoch": 0.4290210460056378, "percentage": 42.91, "elapsed_time": "3 days, 0:04:50", "remaining_time": "3 days, 23:55:02", "throughput": 2724.55, "total_tokens": 706994624} {"current_steps": 3920, "total_steps": 9134, "loss": 0.7122, "learning_rate": 3.0517505763850318e-05, "epoch": 0.4291305180765757, "percentage": 42.92, "elapsed_time": "3 days, 0:05:52", "remaining_time": "3 days, 23:53:51", "throughput": 2724.46, "total_tokens": 707141568} {"current_steps": 3921, "total_steps": 9134, "loss": 0.5327, "learning_rate": 3.050911884284558e-05, "epoch": 0.42923999014751363, "percentage": 42.93, "elapsed_time": "3 days, 0:06:54", "remaining_time": "3 days, 23:52:39", "throughput": 2724.38, "total_tokens": 707289632} {"current_steps": 3922, "total_steps": 9134, "loss": 0.4822, "learning_rate": 3.050073127012261e-05, "epoch": 0.4293494622184515, "percentage": 42.94, "elapsed_time": "3 days, 0:07:59", "remaining_time": "3 days, 23:51:32", "throughput": 2724.4, "total_tokens": 707471968} {"current_steps": 3923, "total_steps": 9134, "loss": 0.7077, "learning_rate": 3.0492343046673654e-05, "epoch": 0.4294589342893894, "percentage": 42.95, "elapsed_time": "3 days, 0:09:06", "remaining_time": "3 days, 23:50:26", "throughput": 2724.44, "total_tokens": 707663936} {"current_steps": 3924, "total_steps": 9134, "loss": 0.6574, "learning_rate": 3.0483954173491015e-05, "epoch": 0.42956840636032734, "percentage": 42.96, "elapsed_time": "3 days, 0:10:12", "remaining_time": "3 days, 23:49:19", "throughput": 2724.49, "total_tokens": 707855904} {"current_steps": 3925, "total_steps": 9134, "loss": 0.6901, "learning_rate": 3.047556465156708e-05, "epoch": 0.4296778784312652, "percentage": 42.97, "elapsed_time": "3 days, 0:11:17", "remaining_time": "3 days, 23:48:12", "throughput": 2724.48, "total_tokens": 708031744} {"current_steps": 3926, "total_steps": 9134, "loss": 0.612, "learning_rate": 3.04671744818943e-05, "epoch": 0.4297873505022031, "percentage": 42.98, "elapsed_time": "3 days, 0:12:18", "remaining_time": "3 days, 23:46:58", "throughput": 2724.37, "total_tokens": 708167264} {"current_steps": 3927, "total_steps": 9134, "loss": 0.7541, "learning_rate": 3.045878366546524e-05, "epoch": 0.42989682257314105, "percentage": 42.99, "elapsed_time": "3 days, 0:13:24", "remaining_time": "3 days, 23:45:52", "throughput": 2724.45, "total_tokens": 708370208} {"current_steps": 3928, "total_steps": 9134, "loss": 0.7001, "learning_rate": 3.045039220327251e-05, "epoch": 0.4300062946440789, "percentage": 43.0, "elapsed_time": "3 days, 0:14:31", "remaining_time": "3 days, 23:44:46", "throughput": 2724.38, "total_tokens": 708533504} {"current_steps": 3929, "total_steps": 9134, "loss": 0.7834, "learning_rate": 3.0442000096308802e-05, "epoch": 0.43011576671501683, "percentage": 43.02, "elapsed_time": "3 days, 0:15:40", "remaining_time": "3 days, 23:43:44", "throughput": 2724.45, "total_tokens": 708739360} {"current_steps": 3930, "total_steps": 9134, "loss": 0.6669, "learning_rate": 3.043360734556689e-05, "epoch": 0.43022523878595476, "percentage": 43.03, "elapsed_time": "3 days, 0:16:49", "remaining_time": "3 days, 23:42:42", "throughput": 2724.51, "total_tokens": 708942304} {"current_steps": 3931, "total_steps": 9134, "loss": 0.6135, "learning_rate": 3.0425213952039612e-05, "epoch": 0.4303347108568926, "percentage": 43.04, "elapsed_time": "3 days, 0:17:52", "remaining_time": "3 days, 23:41:31", "throughput": 2724.45, "total_tokens": 709099776} {"current_steps": 3932, "total_steps": 9134, "loss": 0.8763, "learning_rate": 3.0416819916719895e-05, "epoch": 0.43044418292783054, "percentage": 43.05, "elapsed_time": "3 days, 0:18:58", "remaining_time": "3 days, 23:40:25", "throughput": 2724.51, "total_tokens": 709296672} {"current_steps": 3933, "total_steps": 9134, "loss": 0.5249, "learning_rate": 3.040842524060073e-05, "epoch": 0.43055365499876846, "percentage": 43.06, "elapsed_time": "3 days, 0:20:07", "remaining_time": "3 days, 23:39:23", "throughput": 2724.52, "total_tokens": 709486176} {"current_steps": 3934, "total_steps": 9134, "loss": 0.6727, "learning_rate": 3.0400029924675206e-05, "epoch": 0.43066312706970633, "percentage": 43.07, "elapsed_time": "3 days, 0:21:14", "remaining_time": "3 days, 23:38:18", "throughput": 2724.57, "total_tokens": 709683072} {"current_steps": 3935, "total_steps": 9134, "loss": 0.5945, "learning_rate": 3.0391633969936468e-05, "epoch": 0.43077259914064425, "percentage": 43.08, "elapsed_time": "3 days, 0:22:19", "remaining_time": "3 days, 23:37:09", "throughput": 2724.59, "total_tokens": 709862048} {"current_steps": 3936, "total_steps": 9134, "loss": 0.6451, "learning_rate": 3.0383237377377734e-05, "epoch": 0.4308820712115821, "percentage": 43.09, "elapsed_time": "3 days, 0:23:26", "remaining_time": "3 days, 23:36:04", "throughput": 2724.56, "total_tokens": 710036320} {"current_steps": 3937, "total_steps": 9134, "loss": 0.8141, "learning_rate": 3.03748401479923e-05, "epoch": 0.43099154328252004, "percentage": 43.1, "elapsed_time": "3 days, 0:24:27", "remaining_time": "3 days, 23:34:51", "throughput": 2724.47, "total_tokens": 710179232} {"current_steps": 3938, "total_steps": 9134, "loss": 0.9026, "learning_rate": 3.0366442282773567e-05, "epoch": 0.43110101535345796, "percentage": 43.11, "elapsed_time": "3 days, 0:25:33", "remaining_time": "3 days, 23:33:45", "throughput": 2724.58, "total_tokens": 710389568} {"current_steps": 3939, "total_steps": 9134, "loss": 0.5485, "learning_rate": 3.035804378271496e-05, "epoch": 0.4312104874243958, "percentage": 43.12, "elapsed_time": "3 days, 0:26:38", "remaining_time": "3 days, 23:32:36", "throughput": 2724.5, "total_tokens": 710545024} {"current_steps": 3940, "total_steps": 9134, "loss": 0.8002, "learning_rate": 3.034964464881002e-05, "epoch": 0.43131995949533375, "percentage": 43.14, "elapsed_time": "3 days, 0:27:42", "remaining_time": "3 days, 23:31:28", "throughput": 2724.53, "total_tokens": 710726688} {"current_steps": 3941, "total_steps": 9134, "loss": 0.656, "learning_rate": 3.0341244882052346e-05, "epoch": 0.43142943156627167, "percentage": 43.15, "elapsed_time": "3 days, 0:28:42", "remaining_time": "3 days, 23:30:14", "throughput": 2724.48, "total_tokens": 710879904} {"current_steps": 3942, "total_steps": 9134, "loss": 0.7227, "learning_rate": 3.0332844483435614e-05, "epoch": 0.43153890363720954, "percentage": 43.16, "elapsed_time": "3 days, 0:29:50", "remaining_time": "3 days, 23:29:09", "throughput": 2724.48, "total_tokens": 711061344} {"current_steps": 3943, "total_steps": 9134, "loss": 0.977, "learning_rate": 3.0324443453953578e-05, "epoch": 0.43164837570814746, "percentage": 43.17, "elapsed_time": "3 days, 0:30:58", "remaining_time": "3 days, 23:28:06", "throughput": 2724.44, "total_tokens": 711240096} {"current_steps": 3944, "total_steps": 9134, "loss": 0.9692, "learning_rate": 3.0316041794600054e-05, "epoch": 0.4317578477790854, "percentage": 43.18, "elapsed_time": "3 days, 0:32:04", "remaining_time": "3 days, 23:26:59", "throughput": 2724.47, "total_tokens": 711425120} {"current_steps": 3945, "total_steps": 9134, "loss": 0.6132, "learning_rate": 3.030763950636895e-05, "epoch": 0.43186731985002325, "percentage": 43.19, "elapsed_time": "3 days, 0:33:11", "remaining_time": "3 days, 23:25:55", "throughput": 2724.42, "total_tokens": 711595584} {"current_steps": 3946, "total_steps": 9134, "loss": 0.8728, "learning_rate": 3.0299236590254236e-05, "epoch": 0.43197679192096117, "percentage": 43.2, "elapsed_time": "3 days, 0:34:15", "remaining_time": "3 days, 23:24:45", "throughput": 2724.43, "total_tokens": 711773216} {"current_steps": 3947, "total_steps": 9134, "loss": 0.6938, "learning_rate": 3.0290833047249966e-05, "epoch": 0.4320862639918991, "percentage": 43.21, "elapsed_time": "3 days, 0:35:21", "remaining_time": "3 days, 23:23:39", "throughput": 2724.47, "total_tokens": 711964288} {"current_steps": 3948, "total_steps": 9134, "loss": 0.4894, "learning_rate": 3.0282428878350256e-05, "epoch": 0.43219573606283695, "percentage": 43.22, "elapsed_time": "3 days, 0:36:28", "remaining_time": "3 days, 23:22:33", "throughput": 2724.5, "total_tokens": 712151776} {"current_steps": 3949, "total_steps": 9134, "loss": 0.6961, "learning_rate": 3.0274024084549312e-05, "epoch": 0.4323052081337749, "percentage": 43.23, "elapsed_time": "3 days, 0:37:31", "remaining_time": "3 days, 23:21:23", "throughput": 2724.52, "total_tokens": 712328736} {"current_steps": 3950, "total_steps": 9134, "loss": 0.8065, "learning_rate": 3.0265618666841405e-05, "epoch": 0.4324146802047128, "percentage": 43.25, "elapsed_time": "3 days, 0:38:39", "remaining_time": "3 days, 23:20:18", "throughput": 2724.48, "total_tokens": 712503008} {"current_steps": 3951, "total_steps": 9134, "loss": 0.6454, "learning_rate": 3.0257212626220872e-05, "epoch": 0.43252415227565066, "percentage": 43.26, "elapsed_time": "3 days, 0:39:46", "remaining_time": "3 days, 23:19:14", "throughput": 2724.5, "total_tokens": 712692512} {"current_steps": 3952, "total_steps": 9134, "loss": 0.5226, "learning_rate": 3.0248805963682135e-05, "epoch": 0.4326336243465886, "percentage": 43.27, "elapsed_time": "3 days, 0:40:43", "remaining_time": "3 days, 23:17:56", "throughput": 2724.38, "total_tokens": 712815488} {"current_steps": 3953, "total_steps": 9134, "loss": 0.7462, "learning_rate": 3.0240398680219685e-05, "epoch": 0.43274309641752645, "percentage": 43.28, "elapsed_time": "3 days, 0:41:51", "remaining_time": "3 days, 23:16:52", "throughput": 2724.5, "total_tokens": 713035232} {"current_steps": 3954, "total_steps": 9134, "loss": 0.5986, "learning_rate": 3.0231990776828096e-05, "epoch": 0.4328525684884644, "percentage": 43.29, "elapsed_time": "3 days, 0:42:55", "remaining_time": "3 days, 23:15:43", "throughput": 2724.55, "total_tokens": 713219808} {"current_steps": 3955, "total_steps": 9134, "loss": 0.5568, "learning_rate": 3.0223582254501993e-05, "epoch": 0.4329620405594023, "percentage": 43.3, "elapsed_time": "3 days, 0:43:53", "remaining_time": "3 days, 23:14:26", "throughput": 2724.45, "total_tokens": 713352192} {"current_steps": 3956, "total_steps": 9134, "loss": 0.704, "learning_rate": 3.02151731142361e-05, "epoch": 0.43307151263034016, "percentage": 43.31, "elapsed_time": "3 days, 0:44:59", "remaining_time": "3 days, 23:13:19", "throughput": 2724.41, "total_tokens": 713520416} {"current_steps": 3957, "total_steps": 9134, "loss": 0.7014, "learning_rate": 3.0206763357025196e-05, "epoch": 0.4331809847012781, "percentage": 43.32, "elapsed_time": "3 days, 0:46:02", "remaining_time": "3 days, 23:12:09", "throughput": 2724.41, "total_tokens": 713694240} {"current_steps": 3958, "total_steps": 9134, "loss": 0.8019, "learning_rate": 3.0198352983864138e-05, "epoch": 0.433290456772216, "percentage": 43.33, "elapsed_time": "3 days, 0:47:07", "remaining_time": "3 days, 23:11:02", "throughput": 2724.43, "total_tokens": 713876576} {"current_steps": 3959, "total_steps": 9134, "loss": 0.7661, "learning_rate": 3.0189941995747863e-05, "epoch": 0.43339992884315387, "percentage": 43.34, "elapsed_time": "3 days, 0:48:13", "remaining_time": "3 days, 23:09:54", "throughput": 2724.45, "total_tokens": 714059360} {"current_steps": 3960, "total_steps": 9134, "loss": 0.7001, "learning_rate": 3.0181530393671364e-05, "epoch": 0.4335094009140918, "percentage": 43.35, "elapsed_time": "3 days, 0:49:21", "remaining_time": "3 days, 23:08:51", "throughput": 2724.52, "total_tokens": 714263648} {"current_steps": 3961, "total_steps": 9134, "loss": 0.7705, "learning_rate": 3.0173118178629728e-05, "epoch": 0.4336188729850297, "percentage": 43.37, "elapsed_time": "3 days, 0:50:26", "remaining_time": "3 days, 23:07:43", "throughput": 2724.53, "total_tokens": 714441952} {"current_steps": 3962, "total_steps": 9134, "loss": 0.8372, "learning_rate": 3.0164705351618104e-05, "epoch": 0.4337283450559676, "percentage": 43.38, "elapsed_time": "3 days, 0:51:33", "remaining_time": "3 days, 23:06:38", "throughput": 2724.6, "total_tokens": 714646688} {"current_steps": 3963, "total_steps": 9134, "loss": 0.9654, "learning_rate": 3.0156291913631712e-05, "epoch": 0.4338378171269055, "percentage": 43.39, "elapsed_time": "3 days, 0:52:43", "remaining_time": "3 days, 23:05:37", "throughput": 2724.67, "total_tokens": 714853216} {"current_steps": 3964, "total_steps": 9134, "loss": 0.8553, "learning_rate": 3.0147877865665843e-05, "epoch": 0.4339472891978434, "percentage": 43.4, "elapsed_time": "3 days, 0:53:52", "remaining_time": "3 days, 23:04:34", "throughput": 2724.7, "total_tokens": 715050336} {"current_steps": 3965, "total_steps": 9134, "loss": 0.5535, "learning_rate": 3.013946320871586e-05, "epoch": 0.4340567612687813, "percentage": 43.41, "elapsed_time": "3 days, 0:54:59", "remaining_time": "3 days, 23:03:28", "throughput": 2724.72, "total_tokens": 715235808} {"current_steps": 3966, "total_steps": 9134, "loss": 0.6924, "learning_rate": 3.0131047943777207e-05, "epoch": 0.4341662333397192, "percentage": 43.42, "elapsed_time": "3 days, 0:56:08", "remaining_time": "3 days, 23:02:26", "throughput": 2724.73, "total_tokens": 715426656} {"current_steps": 3967, "total_steps": 9134, "loss": 0.6858, "learning_rate": 3.012263207184539e-05, "epoch": 0.43427570541065713, "percentage": 43.43, "elapsed_time": "3 days, 0:57:11", "remaining_time": "3 days, 23:01:15", "throughput": 2724.77, "total_tokens": 715608320} {"current_steps": 3968, "total_steps": 9134, "loss": 0.5542, "learning_rate": 3.011421559391599e-05, "epoch": 0.434385177481595, "percentage": 43.44, "elapsed_time": "3 days, 0:58:18", "remaining_time": "3 days, 23:00:10", "throughput": 2724.75, "total_tokens": 715787744} {"current_steps": 3969, "total_steps": 9134, "loss": 0.8148, "learning_rate": 3.010579851098466e-05, "epoch": 0.4344946495525329, "percentage": 43.45, "elapsed_time": "3 days, 0:59:27", "remaining_time": "3 days, 22:59:08", "throughput": 2724.8, "total_tokens": 715988448} {"current_steps": 3970, "total_steps": 9134, "loss": 0.5349, "learning_rate": 3.0097380824047132e-05, "epoch": 0.4346041216234708, "percentage": 43.46, "elapsed_time": "3 days, 1:00:33", "remaining_time": "3 days, 22:58:01", "throughput": 2724.8, "total_tokens": 716166528} {"current_steps": 3971, "total_steps": 9134, "loss": 0.614, "learning_rate": 3.0088962534099195e-05, "epoch": 0.4347135936944087, "percentage": 43.47, "elapsed_time": "3 days, 1:01:36", "remaining_time": "3 days, 22:56:51", "throughput": 2724.77, "total_tokens": 716331840} {"current_steps": 3972, "total_steps": 9134, "loss": 0.5818, "learning_rate": 3.0080543642136723e-05, "epoch": 0.43482306576534663, "percentage": 43.49, "elapsed_time": "3 days, 1:02:43", "remaining_time": "3 days, 22:55:46", "throughput": 2724.78, "total_tokens": 716518432} {"current_steps": 3973, "total_steps": 9134, "loss": 0.6332, "learning_rate": 3.007212414915565e-05, "epoch": 0.4349325378362845, "percentage": 43.5, "elapsed_time": "3 days, 1:03:46", "remaining_time": "3 days, 22:54:36", "throughput": 2724.76, "total_tokens": 716684416} {"current_steps": 3974, "total_steps": 9134, "loss": 0.7219, "learning_rate": 3.0063704056151975e-05, "epoch": 0.4350420099072224, "percentage": 43.51, "elapsed_time": "3 days, 1:04:55", "remaining_time": "3 days, 22:53:33", "throughput": 2724.83, "total_tokens": 716889824} {"current_steps": 3975, "total_steps": 9134, "loss": 0.6136, "learning_rate": 3.00552833641218e-05, "epoch": 0.43515148197816034, "percentage": 43.52, "elapsed_time": "3 days, 1:06:01", "remaining_time": "3 days, 22:52:27", "throughput": 2724.87, "total_tokens": 717082016} {"current_steps": 3976, "total_steps": 9134, "loss": 0.5752, "learning_rate": 3.0046862074061266e-05, "epoch": 0.4352609540490982, "percentage": 43.53, "elapsed_time": "3 days, 1:07:09", "remaining_time": "3 days, 22:51:23", "throughput": 2724.85, "total_tokens": 717262560} {"current_steps": 3977, "total_steps": 9134, "loss": 0.734, "learning_rate": 3.00384401869666e-05, "epoch": 0.4353704261200361, "percentage": 43.54, "elapsed_time": "3 days, 1:08:15", "remaining_time": "3 days, 22:50:17", "throughput": 2724.85, "total_tokens": 717441984} {"current_steps": 3978, "total_steps": 9134, "loss": 0.5059, "learning_rate": 3.003001770383409e-05, "epoch": 0.43547989819097405, "percentage": 43.55, "elapsed_time": "3 days, 1:09:21", "remaining_time": "3 days, 22:49:11", "throughput": 2724.85, "total_tokens": 717621856} {"current_steps": 3979, "total_steps": 9134, "loss": 0.7149, "learning_rate": 3.0021594625660095e-05, "epoch": 0.4355893702619119, "percentage": 43.56, "elapsed_time": "3 days, 1:10:29", "remaining_time": "3 days, 22:48:06", "throughput": 2724.9, "total_tokens": 717817408} {"current_steps": 3980, "total_steps": 9134, "loss": 0.8263, "learning_rate": 3.0013170953441062e-05, "epoch": 0.43569884233284983, "percentage": 43.57, "elapsed_time": "3 days, 1:11:37", "remaining_time": "3 days, 22:47:02", "throughput": 2724.86, "total_tokens": 717993024} {"current_steps": 3981, "total_steps": 9134, "loss": 0.7118, "learning_rate": 3.000474668817348e-05, "epoch": 0.43580831440378776, "percentage": 43.58, "elapsed_time": "3 days, 1:12:44", "remaining_time": "3 days, 22:45:57", "throughput": 2724.88, "total_tokens": 718182752} {"current_steps": 3982, "total_steps": 9134, "loss": 0.5441, "learning_rate": 2.999632183085394e-05, "epoch": 0.4359177864747256, "percentage": 43.6, "elapsed_time": "3 days, 1:13:47", "remaining_time": "3 days, 22:44:47", "throughput": 2724.92, "total_tokens": 718364640} {"current_steps": 3983, "total_steps": 9134, "loss": 0.659, "learning_rate": 2.998789638247908e-05, "epoch": 0.43602725854566354, "percentage": 43.61, "elapsed_time": "3 days, 1:14:56", "remaining_time": "3 days, 22:43:45", "throughput": 2725.02, "total_tokens": 718579904} {"current_steps": 3984, "total_steps": 9134, "loss": 0.5388, "learning_rate": 2.9979470344045614e-05, "epoch": 0.43613673061660146, "percentage": 43.62, "elapsed_time": "3 days, 1:16:04", "remaining_time": "3 days, 22:42:40", "throughput": 2725.02, "total_tokens": 718762912} {"current_steps": 3985, "total_steps": 9134, "loss": 0.6563, "learning_rate": 2.9971043716550316e-05, "epoch": 0.43624620268753933, "percentage": 43.63, "elapsed_time": "3 days, 1:17:09", "remaining_time": "3 days, 22:41:33", "throughput": 2724.96, "total_tokens": 718926432} {"current_steps": 3986, "total_steps": 9134, "loss": 0.7023, "learning_rate": 2.9962616500990058e-05, "epoch": 0.43635567475847725, "percentage": 43.64, "elapsed_time": "3 days, 1:18:17", "remaining_time": "3 days, 22:40:29", "throughput": 2725.01, "total_tokens": 719123552} {"current_steps": 3987, "total_steps": 9134, "loss": 0.8936, "learning_rate": 2.995418869836175e-05, "epoch": 0.4364651468294151, "percentage": 43.65, "elapsed_time": "3 days, 1:19:22", "remaining_time": "3 days, 22:39:21", "throughput": 2725.06, "total_tokens": 719313952} {"current_steps": 3988, "total_steps": 9134, "loss": 0.7088, "learning_rate": 2.9945760309662395e-05, "epoch": 0.43657461890035304, "percentage": 43.66, "elapsed_time": "3 days, 1:20:27", "remaining_time": "3 days, 22:38:14", "throughput": 2725.04, "total_tokens": 719485760} {"current_steps": 3989, "total_steps": 9134, "loss": 0.8447, "learning_rate": 2.9937331335889045e-05, "epoch": 0.43668409097129096, "percentage": 43.67, "elapsed_time": "3 days, 1:21:34", "remaining_time": "3 days, 22:37:07", "throughput": 2725.1, "total_tokens": 719684000} {"current_steps": 3990, "total_steps": 9134, "loss": 0.752, "learning_rate": 2.9928901778038837e-05, "epoch": 0.4367935630422288, "percentage": 43.68, "elapsed_time": "3 days, 1:22:43", "remaining_time": "3 days, 22:36:05", "throughput": 2725.2, "total_tokens": 719898368} {"current_steps": 3991, "total_steps": 9134, "loss": 0.8068, "learning_rate": 2.9920471637108977e-05, "epoch": 0.43690303511316675, "percentage": 43.69, "elapsed_time": "3 days, 1:23:50", "remaining_time": "3 days, 22:35:01", "throughput": 2725.24, "total_tokens": 720093472} {"current_steps": 3992, "total_steps": 9134, "loss": 0.9269, "learning_rate": 2.9912040914096724e-05, "epoch": 0.43701250718410467, "percentage": 43.7, "elapsed_time": "3 days, 1:24:57", "remaining_time": "3 days, 22:33:55", "throughput": 2725.26, "total_tokens": 720280064} {"current_steps": 3993, "total_steps": 9134, "loss": 0.7803, "learning_rate": 2.990360960999942e-05, "epoch": 0.43712197925504254, "percentage": 43.72, "elapsed_time": "3 days, 1:26:05", "remaining_time": "3 days, 22:32:51", "throughput": 2725.27, "total_tokens": 720468896} {"current_steps": 3994, "total_steps": 9134, "loss": 0.7404, "learning_rate": 2.989517772581447e-05, "epoch": 0.43723145132598046, "percentage": 43.73, "elapsed_time": "3 days, 1:27:12", "remaining_time": "3 days, 22:31:45", "throughput": 2725.31, "total_tokens": 720658400} {"current_steps": 3995, "total_steps": 9134, "loss": 1.0339, "learning_rate": 2.9886745262539362e-05, "epoch": 0.4373409233969184, "percentage": 43.74, "elapsed_time": "3 days, 1:28:21", "remaining_time": "3 days, 22:30:43", "throughput": 2725.36, "total_tokens": 720862016} {"current_steps": 3996, "total_steps": 9134, "loss": 0.9618, "learning_rate": 2.9878312221171627e-05, "epoch": 0.43745039546785625, "percentage": 43.75, "elapsed_time": "3 days, 1:29:26", "remaining_time": "3 days, 22:29:35", "throughput": 2725.39, "total_tokens": 721046592} {"current_steps": 3997, "total_steps": 9134, "loss": 0.6566, "learning_rate": 2.9869878602708885e-05, "epoch": 0.43755986753879417, "percentage": 43.76, "elapsed_time": "3 days, 1:30:29", "remaining_time": "3 days, 22:28:24", "throughput": 2725.34, "total_tokens": 721203168} {"current_steps": 3998, "total_steps": 9134, "loss": 0.6509, "learning_rate": 2.9861444408148815e-05, "epoch": 0.4376693396097321, "percentage": 43.77, "elapsed_time": "3 days, 1:31:31", "remaining_time": "3 days, 22:27:14", "throughput": 2725.28, "total_tokens": 721359296} {"current_steps": 3999, "total_steps": 9134, "loss": 0.6289, "learning_rate": 2.985300963848916e-05, "epoch": 0.43777881168066995, "percentage": 43.78, "elapsed_time": "3 days, 1:32:37", "remaining_time": "3 days, 22:26:06", "throughput": 2725.21, "total_tokens": 721518560} {"current_steps": 4000, "total_steps": 9134, "loss": 0.8155, "learning_rate": 2.984457429472774e-05, "epoch": 0.4378882837516079, "percentage": 43.79, "elapsed_time": "3 days, 1:33:41", "remaining_time": "3 days, 22:24:58", "throughput": 2725.18, "total_tokens": 721687008} {"current_steps": 4001, "total_steps": 9134, "loss": 0.5141, "learning_rate": 2.9836138377862442e-05, "epoch": 0.4379977558225458, "percentage": 43.8, "elapsed_time": "3 days, 1:37:03", "remaining_time": "3 days, 22:26:46", "throughput": 2723.71, "total_tokens": 721846048} {"current_steps": 4002, "total_steps": 9134, "loss": 0.5326, "learning_rate": 2.9827701888891223e-05, "epoch": 0.43810722789348366, "percentage": 43.81, "elapsed_time": "3 days, 1:38:10", "remaining_time": "3 days, 22:25:41", "throughput": 2723.67, "total_tokens": 722020096} {"current_steps": 4003, "total_steps": 9134, "loss": 0.6692, "learning_rate": 2.98192648288121e-05, "epoch": 0.4382166999644216, "percentage": 43.83, "elapsed_time": "3 days, 1:39:17", "remaining_time": "3 days, 22:24:35", "throughput": 2723.67, "total_tokens": 722201984} {"current_steps": 4004, "total_steps": 9134, "loss": 0.7519, "learning_rate": 2.9810827198623158e-05, "epoch": 0.43832617203535945, "percentage": 43.84, "elapsed_time": "3 days, 1:40:21", "remaining_time": "3 days, 22:23:27", "throughput": 2723.65, "total_tokens": 722371776} {"current_steps": 4005, "total_steps": 9134, "loss": 0.6478, "learning_rate": 2.980238899932256e-05, "epoch": 0.4384356441062974, "percentage": 43.85, "elapsed_time": "3 days, 1:41:24", "remaining_time": "3 days, 22:22:16", "throughput": 2723.6, "total_tokens": 722530368} {"current_steps": 4006, "total_steps": 9134, "loss": 0.8284, "learning_rate": 2.9793950231908523e-05, "epoch": 0.4385451161772353, "percentage": 43.86, "elapsed_time": "3 days, 1:42:27", "remaining_time": "3 days, 22:21:06", "throughput": 2723.6, "total_tokens": 722701728} {"current_steps": 4007, "total_steps": 9134, "loss": 0.7222, "learning_rate": 2.9785510897379337e-05, "epoch": 0.43865458824817316, "percentage": 43.87, "elapsed_time": "3 days, 1:43:35", "remaining_time": "3 days, 22:20:01", "throughput": 2723.56, "total_tokens": 722875776} {"current_steps": 4008, "total_steps": 9134, "loss": 0.8009, "learning_rate": 2.9777070996733354e-05, "epoch": 0.4387640603191111, "percentage": 43.88, "elapsed_time": "3 days, 1:44:43", "remaining_time": "3 days, 22:18:58", "throughput": 2723.59, "total_tokens": 723069312} {"current_steps": 4009, "total_steps": 9134, "loss": 0.7669, "learning_rate": 2.976863053096901e-05, "epoch": 0.438873532390049, "percentage": 43.89, "elapsed_time": "3 days, 1:45:50", "remaining_time": "3 days, 22:17:53", "throughput": 2723.61, "total_tokens": 723256128} {"current_steps": 4010, "total_steps": 9134, "loss": 0.9514, "learning_rate": 2.976018950108479e-05, "epoch": 0.43898300446098687, "percentage": 43.9, "elapsed_time": "3 days, 1:47:00", "remaining_time": "3 days, 22:16:50", "throughput": 2723.68, "total_tokens": 723463104} {"current_steps": 4011, "total_steps": 9134, "loss": 0.7664, "learning_rate": 2.9751747908079246e-05, "epoch": 0.4390924765319248, "percentage": 43.91, "elapsed_time": "3 days, 1:48:07", "remaining_time": "3 days, 22:15:46", "throughput": 2723.7, "total_tokens": 723652832} {"current_steps": 4012, "total_steps": 9134, "loss": 0.8466, "learning_rate": 2.9743305752951016e-05, "epoch": 0.4392019486028627, "percentage": 43.92, "elapsed_time": "3 days, 1:49:13", "remaining_time": "3 days, 22:14:39", "throughput": 2723.67, "total_tokens": 723823744} {"current_steps": 4013, "total_steps": 9134, "loss": 0.6108, "learning_rate": 2.9734863036698784e-05, "epoch": 0.4393114206738006, "percentage": 43.93, "elapsed_time": "3 days, 1:50:21", "remaining_time": "3 days, 22:13:35", "throughput": 2723.69, "total_tokens": 724015040} {"current_steps": 4014, "total_steps": 9134, "loss": 0.6806, "learning_rate": 2.97264197603213e-05, "epoch": 0.4394208927447385, "percentage": 43.95, "elapsed_time": "3 days, 1:51:31", "remaining_time": "3 days, 22:12:33", "throughput": 2723.73, "total_tokens": 724216192} {"current_steps": 4015, "total_steps": 9134, "loss": 0.8554, "learning_rate": 2.97179759248174e-05, "epoch": 0.4395303648156764, "percentage": 43.96, "elapsed_time": "3 days, 1:52:37", "remaining_time": "3 days, 22:11:27", "throughput": 2723.79, "total_tokens": 724410176} {"current_steps": 4016, "total_steps": 9134, "loss": 0.7449, "learning_rate": 2.9709531531185964e-05, "epoch": 0.4396398368866143, "percentage": 43.97, "elapsed_time": "3 days, 1:53:45", "remaining_time": "3 days, 22:10:23", "throughput": 2723.86, "total_tokens": 724615136} {"current_steps": 4017, "total_steps": 9134, "loss": 0.7408, "learning_rate": 2.9701086580425954e-05, "epoch": 0.4397493089575522, "percentage": 43.98, "elapsed_time": "3 days, 1:54:50", "remaining_time": "3 days, 22:09:15", "throughput": 2723.83, "total_tokens": 724784704} {"current_steps": 4018, "total_steps": 9134, "loss": 0.6664, "learning_rate": 2.969264107353638e-05, "epoch": 0.43985878102849013, "percentage": 43.99, "elapsed_time": "3 days, 1:55:55", "remaining_time": "3 days, 22:08:08", "throughput": 2723.82, "total_tokens": 724959200} {"current_steps": 4019, "total_steps": 9134, "loss": 0.5817, "learning_rate": 2.9684195011516347e-05, "epoch": 0.439968253099428, "percentage": 44.0, "elapsed_time": "3 days, 1:57:04", "remaining_time": "3 days, 22:07:05", "throughput": 2723.84, "total_tokens": 725153408} {"current_steps": 4020, "total_steps": 9134, "loss": 0.7197, "learning_rate": 2.9675748395365e-05, "epoch": 0.4400777251703659, "percentage": 44.01, "elapsed_time": "3 days, 1:58:08", "remaining_time": "3 days, 22:05:56", "throughput": 2723.8, "total_tokens": 725315584} {"current_steps": 4021, "total_steps": 9134, "loss": 0.6023, "learning_rate": 2.9667301226081546e-05, "epoch": 0.4401871972413038, "percentage": 44.02, "elapsed_time": "3 days, 1:59:11", "remaining_time": "3 days, 22:04:46", "throughput": 2723.75, "total_tokens": 725476864} {"current_steps": 4022, "total_steps": 9134, "loss": 0.5936, "learning_rate": 2.9658853504665286e-05, "epoch": 0.4402966693122417, "percentage": 44.03, "elapsed_time": "3 days, 2:00:17", "remaining_time": "3 days, 22:03:39", "throughput": 2723.77, "total_tokens": 725659648} {"current_steps": 4023, "total_steps": 9134, "loss": 0.5967, "learning_rate": 2.965040523211556e-05, "epoch": 0.44040614138317963, "percentage": 44.04, "elapsed_time": "3 days, 2:01:26", "remaining_time": "3 days, 22:02:36", "throughput": 2723.9, "total_tokens": 725884544} {"current_steps": 4024, "total_steps": 9134, "loss": 0.7454, "learning_rate": 2.964195640943178e-05, "epoch": 0.4405156134541175, "percentage": 44.06, "elapsed_time": "3 days, 2:02:30", "remaining_time": "3 days, 22:01:27", "throughput": 2723.84, "total_tokens": 726042016} {"current_steps": 4025, "total_steps": 9134, "loss": 0.8161, "learning_rate": 2.9633507037613446e-05, "epoch": 0.4406250855250554, "percentage": 44.07, "elapsed_time": "3 days, 2:03:39", "remaining_time": "3 days, 22:00:24", "throughput": 2723.86, "total_tokens": 726232416} {"current_steps": 4026, "total_steps": 9134, "loss": 0.7472, "learning_rate": 2.9625057117660077e-05, "epoch": 0.44073455759599334, "percentage": 44.08, "elapsed_time": "3 days, 2:04:48", "remaining_time": "3 days, 21:59:21", "throughput": 2723.92, "total_tokens": 726436480} {"current_steps": 4027, "total_steps": 9134, "loss": 0.659, "learning_rate": 2.9616606650571292e-05, "epoch": 0.4408440296669312, "percentage": 44.09, "elapsed_time": "3 days, 2:05:56", "remaining_time": "3 days, 21:58:17", "throughput": 2723.91, "total_tokens": 726621504} {"current_steps": 4028, "total_steps": 9134, "loss": 0.6183, "learning_rate": 2.960815563734677e-05, "epoch": 0.4409535017378691, "percentage": 44.1, "elapsed_time": "3 days, 2:06:59", "remaining_time": "3 days, 21:57:07", "throughput": 2723.9, "total_tokens": 726790624} {"current_steps": 4029, "total_steps": 9134, "loss": 0.7642, "learning_rate": 2.959970407898624e-05, "epoch": 0.44106297380880705, "percentage": 44.11, "elapsed_time": "3 days, 2:08:03", "remaining_time": "3 days, 21:55:57", "throughput": 2723.87, "total_tokens": 726954816} {"current_steps": 4030, "total_steps": 9134, "loss": 0.6425, "learning_rate": 2.9591251976489514e-05, "epoch": 0.4411724458797449, "percentage": 44.12, "elapsed_time": "3 days, 2:09:07", "remaining_time": "3 days, 21:54:49", "throughput": 2723.85, "total_tokens": 727126176} {"current_steps": 4031, "total_steps": 9134, "loss": 0.53, "learning_rate": 2.9582799330856458e-05, "epoch": 0.44128191795068283, "percentage": 44.13, "elapsed_time": "3 days, 2:10:13", "remaining_time": "3 days, 21:53:42", "throughput": 2723.88, "total_tokens": 727312544} {"current_steps": 4032, "total_steps": 9134, "loss": 0.6328, "learning_rate": 2.9574346143086994e-05, "epoch": 0.44139139002162076, "percentage": 44.14, "elapsed_time": "3 days, 2:11:16", "remaining_time": "3 days, 21:52:32", "throughput": 2723.83, "total_tokens": 727469792} {"current_steps": 4033, "total_steps": 9134, "loss": 0.8226, "learning_rate": 2.9565892414181133e-05, "epoch": 0.4415008620925586, "percentage": 44.15, "elapsed_time": "3 days, 2:12:22", "remaining_time": "3 days, 21:51:25", "throughput": 2723.78, "total_tokens": 727636224} {"current_steps": 4034, "total_steps": 9134, "loss": 0.7232, "learning_rate": 2.9557438145138933e-05, "epoch": 0.44161033416349654, "percentage": 44.16, "elapsed_time": "3 days, 2:13:31", "remaining_time": "3 days, 21:50:23", "throughput": 2723.86, "total_tokens": 727848128} {"current_steps": 4035, "total_steps": 9134, "loss": 0.601, "learning_rate": 2.9548983336960502e-05, "epoch": 0.44171980623443446, "percentage": 44.18, "elapsed_time": "3 days, 2:14:37", "remaining_time": "3 days, 21:49:17", "throughput": 2723.83, "total_tokens": 728020608} {"current_steps": 4036, "total_steps": 9134, "loss": 0.7301, "learning_rate": 2.9540527990646045e-05, "epoch": 0.44182927830537233, "percentage": 44.19, "elapsed_time": "3 days, 2:15:46", "remaining_time": "3 days, 21:48:14", "throughput": 2723.86, "total_tokens": 728214592} {"current_steps": 4037, "total_steps": 9134, "loss": 0.7351, "learning_rate": 2.953207210719581e-05, "epoch": 0.44193875037631025, "percentage": 44.2, "elapsed_time": "3 days, 2:16:54", "remaining_time": "3 days, 21:47:09", "throughput": 2723.89, "total_tokens": 728406560} {"current_steps": 4038, "total_steps": 9134, "loss": 0.8148, "learning_rate": 2.9523615687610102e-05, "epoch": 0.4420482224472481, "percentage": 44.21, "elapsed_time": "3 days, 2:17:57", "remaining_time": "3 days, 21:45:59", "throughput": 2723.85, "total_tokens": 728570080} {"current_steps": 4039, "total_steps": 9134, "loss": 0.7182, "learning_rate": 2.9515158732889305e-05, "epoch": 0.44215769451818604, "percentage": 44.22, "elapsed_time": "3 days, 2:19:00", "remaining_time": "3 days, 21:44:49", "throughput": 2723.81, "total_tokens": 728728672} {"current_steps": 4040, "total_steps": 9134, "loss": 0.6441, "learning_rate": 2.9506701244033864e-05, "epoch": 0.44226716658912396, "percentage": 44.23, "elapsed_time": "3 days, 2:20:06", "remaining_time": "3 days, 21:43:42", "throughput": 2723.85, "total_tokens": 728919296} {"current_steps": 4041, "total_steps": 9134, "loss": 0.6377, "learning_rate": 2.9498243222044282e-05, "epoch": 0.4423766386600618, "percentage": 44.24, "elapsed_time": "3 days, 2:21:10", "remaining_time": "3 days, 21:42:34", "throughput": 2723.83, "total_tokens": 729089312} {"current_steps": 4042, "total_steps": 9134, "loss": 0.619, "learning_rate": 2.9489784667921122e-05, "epoch": 0.44248611073099975, "percentage": 44.25, "elapsed_time": "3 days, 2:22:18", "remaining_time": "3 days, 21:41:29", "throughput": 2723.84, "total_tokens": 729277696} {"current_steps": 4043, "total_steps": 9134, "loss": 0.7955, "learning_rate": 2.9481325582665013e-05, "epoch": 0.44259558280193767, "percentage": 44.26, "elapsed_time": "3 days, 2:23:25", "remaining_time": "3 days, 21:40:23", "throughput": 2723.81, "total_tokens": 729449280} {"current_steps": 4044, "total_steps": 9134, "loss": 0.5415, "learning_rate": 2.9472865967276668e-05, "epoch": 0.44270505487287554, "percentage": 44.27, "elapsed_time": "3 days, 2:24:30", "remaining_time": "3 days, 21:39:16", "throughput": 2723.78, "total_tokens": 729620416} {"current_steps": 4045, "total_steps": 9134, "loss": 0.8005, "learning_rate": 2.9464405822756823e-05, "epoch": 0.44281452694381346, "percentage": 44.29, "elapsed_time": "3 days, 2:25:39", "remaining_time": "3 days, 21:38:13", "throughput": 2723.77, "total_tokens": 729805216} {"current_steps": 4046, "total_steps": 9134, "loss": 1.1538, "learning_rate": 2.9455945150106314e-05, "epoch": 0.4429239990147514, "percentage": 44.3, "elapsed_time": "3 days, 2:26:46", "remaining_time": "3 days, 21:37:08", "throughput": 2723.88, "total_tokens": 730016896} {"current_steps": 4047, "total_steps": 9134, "loss": 0.7595, "learning_rate": 2.9447483950326e-05, "epoch": 0.44303347108568925, "percentage": 44.31, "elapsed_time": "3 days, 2:27:48", "remaining_time": "3 days, 21:35:56", "throughput": 2723.82, "total_tokens": 730171456} {"current_steps": 4048, "total_steps": 9134, "loss": 0.7009, "learning_rate": 2.9439022224416833e-05, "epoch": 0.44314294315662717, "percentage": 44.32, "elapsed_time": "3 days, 2:28:51", "remaining_time": "3 days, 21:34:46", "throughput": 2723.82, "total_tokens": 730342144} {"current_steps": 4049, "total_steps": 9134, "loss": 0.5701, "learning_rate": 2.9430559973379834e-05, "epoch": 0.4432524152275651, "percentage": 44.33, "elapsed_time": "3 days, 2:29:57", "remaining_time": "3 days, 21:33:40", "throughput": 2723.7, "total_tokens": 730490656} {"current_steps": 4050, "total_steps": 9134, "loss": 0.642, "learning_rate": 2.942209719821606e-05, "epoch": 0.44336188729850295, "percentage": 44.34, "elapsed_time": "3 days, 2:31:00", "remaining_time": "3 days, 21:32:30", "throughput": 2723.63, "total_tokens": 730642304} {"current_steps": 4051, "total_steps": 9134, "loss": 0.6884, "learning_rate": 2.9413633899926634e-05, "epoch": 0.4434713593694409, "percentage": 44.35, "elapsed_time": "3 days, 2:32:10", "remaining_time": "3 days, 21:31:27", "throughput": 2723.71, "total_tokens": 730853312} {"current_steps": 4052, "total_steps": 9134, "loss": 0.619, "learning_rate": 2.940517007951276e-05, "epoch": 0.4435808314403788, "percentage": 44.36, "elapsed_time": "3 days, 2:33:08", "remaining_time": "3 days, 21:30:11", "throughput": 2723.6, "total_tokens": 730983008} {"current_steps": 4053, "total_steps": 9134, "loss": 0.6903, "learning_rate": 2.9396705737975683e-05, "epoch": 0.44369030351131666, "percentage": 44.37, "elapsed_time": "3 days, 2:34:17", "remaining_time": "3 days, 21:29:09", "throughput": 2723.67, "total_tokens": 731190432} {"current_steps": 4054, "total_steps": 9134, "loss": 0.4793, "learning_rate": 2.9388240876316727e-05, "epoch": 0.4437997755822546, "percentage": 44.38, "elapsed_time": "3 days, 2:35:18", "remaining_time": "3 days, 21:27:56", "throughput": 2723.6, "total_tokens": 731336480} {"current_steps": 4055, "total_steps": 9134, "loss": 0.8048, "learning_rate": 2.9379775495537254e-05, "epoch": 0.4439092476531925, "percentage": 44.39, "elapsed_time": "3 days, 2:36:25", "remaining_time": "3 days, 21:26:50", "throughput": 2723.57, "total_tokens": 731510528} {"current_steps": 4056, "total_steps": 9134, "loss": 0.5982, "learning_rate": 2.9371309596638725e-05, "epoch": 0.4440187197241304, "percentage": 44.41, "elapsed_time": "3 days, 2:37:32", "remaining_time": "3 days, 21:25:45", "throughput": 2723.6, "total_tokens": 731703392} {"current_steps": 4057, "total_steps": 9134, "loss": 0.9146, "learning_rate": 2.9362843180622624e-05, "epoch": 0.4441281917950683, "percentage": 44.42, "elapsed_time": "3 days, 2:38:41", "remaining_time": "3 days, 21:24:42", "throughput": 2723.67, "total_tokens": 731908576} {"current_steps": 4058, "total_steps": 9134, "loss": 0.5755, "learning_rate": 2.935437624849051e-05, "epoch": 0.44423766386600616, "percentage": 44.43, "elapsed_time": "3 days, 2:39:47", "remaining_time": "3 days, 21:23:36", "throughput": 2723.6, "total_tokens": 732071200} {"current_steps": 4059, "total_steps": 9134, "loss": 0.5786, "learning_rate": 2.9345908801244015e-05, "epoch": 0.4443471359369441, "percentage": 44.44, "elapsed_time": "3 days, 2:40:55", "remaining_time": "3 days, 21:22:32", "throughput": 2723.61, "total_tokens": 732257120} {"current_steps": 4060, "total_steps": 9134, "loss": 0.5651, "learning_rate": 2.9337440839884817e-05, "epoch": 0.444456608007882, "percentage": 44.45, "elapsed_time": "3 days, 2:42:01", "remaining_time": "3 days, 21:21:25", "throughput": 2723.62, "total_tokens": 732438336} {"current_steps": 4061, "total_steps": 9134, "loss": 0.7945, "learning_rate": 2.932897236541466e-05, "epoch": 0.44456608007881987, "percentage": 44.46, "elapsed_time": "3 days, 2:43:10", "remaining_time": "3 days, 21:20:22", "throughput": 2723.72, "total_tokens": 732654048} {"current_steps": 4062, "total_steps": 9134, "loss": 0.5544, "learning_rate": 2.932050337883534e-05, "epoch": 0.4446755521497578, "percentage": 44.47, "elapsed_time": "3 days, 2:44:08", "remaining_time": "3 days, 21:19:06", "throughput": 2723.61, "total_tokens": 732783296} {"current_steps": 4063, "total_steps": 9134, "loss": 0.9232, "learning_rate": 2.9312033881148738e-05, "epoch": 0.4447850242206957, "percentage": 44.48, "elapsed_time": "3 days, 2:45:17", "remaining_time": "3 days, 21:18:03", "throughput": 2723.62, "total_tokens": 732972352} {"current_steps": 4064, "total_steps": 9134, "loss": 0.6307, "learning_rate": 2.9303563873356767e-05, "epoch": 0.4448944962916336, "percentage": 44.49, "elapsed_time": "3 days, 2:46:21", "remaining_time": "3 days, 21:16:54", "throughput": 2723.65, "total_tokens": 733154240} {"current_steps": 4065, "total_steps": 9134, "loss": 0.9087, "learning_rate": 2.9295093356461416e-05, "epoch": 0.4450039683625715, "percentage": 44.5, "elapsed_time": "3 days, 2:47:27", "remaining_time": "3 days, 21:15:47", "throughput": 2723.64, "total_tokens": 733333664} {"current_steps": 4066, "total_steps": 9134, "loss": 0.8427, "learning_rate": 2.9286622331464736e-05, "epoch": 0.4451134404335094, "percentage": 44.51, "elapsed_time": "3 days, 2:48:34", "remaining_time": "3 days, 21:14:43", "throughput": 2723.69, "total_tokens": 733531456} {"current_steps": 4067, "total_steps": 9134, "loss": 0.7133, "learning_rate": 2.9278150799368825e-05, "epoch": 0.4452229125044473, "percentage": 44.53, "elapsed_time": "3 days, 2:49:44", "remaining_time": "3 days, 21:13:41", "throughput": 2723.8, "total_tokens": 733751200} {"current_steps": 4068, "total_steps": 9134, "loss": 0.7294, "learning_rate": 2.9269678761175857e-05, "epoch": 0.4453323845753852, "percentage": 44.54, "elapsed_time": "3 days, 2:50:54", "remaining_time": "3 days, 21:12:39", "throughput": 2723.77, "total_tokens": 733933088} {"current_steps": 4069, "total_steps": 9134, "loss": 0.7485, "learning_rate": 2.9261206217888048e-05, "epoch": 0.44544185664632313, "percentage": 44.55, "elapsed_time": "3 days, 2:51:57", "remaining_time": "3 days, 21:11:29", "throughput": 2723.76, "total_tokens": 734102656} {"current_steps": 4070, "total_steps": 9134, "loss": 0.7672, "learning_rate": 2.925273317050769e-05, "epoch": 0.445551328717261, "percentage": 44.56, "elapsed_time": "3 days, 2:53:04", "remaining_time": "3 days, 21:10:24", "throughput": 2723.75, "total_tokens": 734280960} {"current_steps": 4071, "total_steps": 9134, "loss": 0.772, "learning_rate": 2.9244259620037135e-05, "epoch": 0.4456608007881989, "percentage": 44.57, "elapsed_time": "3 days, 2:54:12", "remaining_time": "3 days, 21:09:19", "throughput": 2723.73, "total_tokens": 734458592} {"current_steps": 4072, "total_steps": 9134, "loss": 0.7832, "learning_rate": 2.9235785567478774e-05, "epoch": 0.44577027285913684, "percentage": 44.58, "elapsed_time": "3 days, 2:55:15", "remaining_time": "3 days, 21:08:09", "throughput": 2723.75, "total_tokens": 734637792} {"current_steps": 4073, "total_steps": 9134, "loss": 0.7481, "learning_rate": 2.9227311013835084e-05, "epoch": 0.4458797449300747, "percentage": 44.59, "elapsed_time": "3 days, 2:56:19", "remaining_time": "3 days, 21:07:00", "throughput": 2723.76, "total_tokens": 734814304} {"current_steps": 4074, "total_steps": 9134, "loss": 0.5067, "learning_rate": 2.921883596010857e-05, "epoch": 0.44598921700101263, "percentage": 44.6, "elapsed_time": "3 days, 2:57:25", "remaining_time": "3 days, 21:05:53", "throughput": 2723.71, "total_tokens": 734980288} {"current_steps": 4075, "total_steps": 9134, "loss": 0.6887, "learning_rate": 2.921036040730184e-05, "epoch": 0.4460986890719505, "percentage": 44.61, "elapsed_time": "3 days, 2:58:30", "remaining_time": "3 days, 21:04:46", "throughput": 2723.77, "total_tokens": 735175392} {"current_steps": 4076, "total_steps": 9134, "loss": 0.6144, "learning_rate": 2.9201884356417514e-05, "epoch": 0.4462081611428884, "percentage": 44.62, "elapsed_time": "3 days, 2:59:34", "remaining_time": "3 days, 21:03:37", "throughput": 2723.73, "total_tokens": 735339584} {"current_steps": 4077, "total_steps": 9134, "loss": 0.7013, "learning_rate": 2.9193407808458308e-05, "epoch": 0.44631763321382634, "percentage": 44.64, "elapsed_time": "3 days, 3:00:39", "remaining_time": "3 days, 21:02:30", "throughput": 2723.72, "total_tokens": 735512960} {"current_steps": 4078, "total_steps": 9134, "loss": 0.8481, "learning_rate": 2.918493076442697e-05, "epoch": 0.4464271052847642, "percentage": 44.65, "elapsed_time": "3 days, 3:01:46", "remaining_time": "3 days, 21:01:24", "throughput": 2723.67, "total_tokens": 735680288} {"current_steps": 4079, "total_steps": 9134, "loss": 0.6095, "learning_rate": 2.9176453225326328e-05, "epoch": 0.4465365773557021, "percentage": 44.66, "elapsed_time": "3 days, 3:02:50", "remaining_time": "3 days, 21:00:14", "throughput": 2723.64, "total_tokens": 735845152} {"current_steps": 4080, "total_steps": 9134, "loss": 0.7467, "learning_rate": 2.9167975192159247e-05, "epoch": 0.44664604942664005, "percentage": 44.67, "elapsed_time": "3 days, 3:03:58", "remaining_time": "3 days, 20:59:11", "throughput": 2723.71, "total_tokens": 736051232} {"current_steps": 4081, "total_steps": 9134, "loss": 0.9203, "learning_rate": 2.9159496665928677e-05, "epoch": 0.4467555214975779, "percentage": 44.68, "elapsed_time": "3 days, 3:05:06", "remaining_time": "3 days, 20:58:07", "throughput": 2723.75, "total_tokens": 736245888} {"current_steps": 4082, "total_steps": 9134, "loss": 0.8306, "learning_rate": 2.915101764763759e-05, "epoch": 0.44686499356851583, "percentage": 44.69, "elapsed_time": "3 days, 3:06:07", "remaining_time": "3 days, 20:56:54", "throughput": 2723.64, "total_tokens": 736385216} {"current_steps": 4083, "total_steps": 9134, "loss": 0.7493, "learning_rate": 2.914253813828906e-05, "epoch": 0.44697446563945376, "percentage": 44.7, "elapsed_time": "3 days, 3:07:15", "remaining_time": "3 days, 20:55:50", "throughput": 2723.7, "total_tokens": 736585248} {"current_steps": 4084, "total_steps": 9134, "loss": 0.7806, "learning_rate": 2.9134058138886188e-05, "epoch": 0.4470839377103916, "percentage": 44.71, "elapsed_time": "3 days, 3:08:24", "remaining_time": "3 days, 20:54:48", "throughput": 2723.72, "total_tokens": 736779008} {"current_steps": 4085, "total_steps": 9134, "loss": 0.5471, "learning_rate": 2.9125577650432133e-05, "epoch": 0.44719340978132954, "percentage": 44.72, "elapsed_time": "3 days, 3:09:28", "remaining_time": "3 days, 20:53:39", "throughput": 2723.73, "total_tokens": 736956416} {"current_steps": 4086, "total_steps": 9134, "loss": 0.7088, "learning_rate": 2.9117096673930138e-05, "epoch": 0.44730288185226746, "percentage": 44.73, "elapsed_time": "3 days, 3:10:36", "remaining_time": "3 days, 20:52:34", "throughput": 2723.69, "total_tokens": 737128672} {"current_steps": 4087, "total_steps": 9134, "loss": 0.6709, "learning_rate": 2.910861521038347e-05, "epoch": 0.44741235392320533, "percentage": 44.74, "elapsed_time": "3 days, 3:11:40", "remaining_time": "3 days, 20:51:25", "throughput": 2723.71, "total_tokens": 737310560} {"current_steps": 4088, "total_steps": 9134, "loss": 0.6609, "learning_rate": 2.9100133260795488e-05, "epoch": 0.44752182599414325, "percentage": 44.76, "elapsed_time": "3 days, 3:12:47", "remaining_time": "3 days, 20:50:20", "throughput": 2723.7, "total_tokens": 737491776} {"current_steps": 4089, "total_steps": 9134, "loss": 0.5555, "learning_rate": 2.9091650826169565e-05, "epoch": 0.4476312980650812, "percentage": 44.77, "elapsed_time": "3 days, 3:13:46", "remaining_time": "3 days, 20:49:05", "throughput": 2723.65, "total_tokens": 737637600} {"current_steps": 4090, "total_steps": 9134, "loss": 0.6714, "learning_rate": 2.9083167907509178e-05, "epoch": 0.44774077013601904, "percentage": 44.78, "elapsed_time": "3 days, 3:14:51", "remaining_time": "3 days, 20:47:57", "throughput": 2723.66, "total_tokens": 737818592} {"current_steps": 4091, "total_steps": 9134, "loss": 0.7428, "learning_rate": 2.9074684505817835e-05, "epoch": 0.44785024220695696, "percentage": 44.79, "elapsed_time": "3 days, 3:15:58", "remaining_time": "3 days, 20:46:51", "throughput": 2723.69, "total_tokens": 738006528} {"current_steps": 4092, "total_steps": 9134, "loss": 0.8535, "learning_rate": 2.9066200622099106e-05, "epoch": 0.4479597142778948, "percentage": 44.8, "elapsed_time": "3 days, 3:17:06", "remaining_time": "3 days, 20:45:47", "throughput": 2723.77, "total_tokens": 738213728} {"current_steps": 4093, "total_steps": 9134, "loss": 0.7829, "learning_rate": 2.9057716257356614e-05, "epoch": 0.44806918634883275, "percentage": 44.81, "elapsed_time": "3 days, 3:18:15", "remaining_time": "3 days, 20:44:45", "throughput": 2723.82, "total_tokens": 738416896} {"current_steps": 4094, "total_steps": 9134, "loss": 0.6918, "learning_rate": 2.9049231412594046e-05, "epoch": 0.44817865841977067, "percentage": 44.82, "elapsed_time": "3 days, 3:19:24", "remaining_time": "3 days, 20:43:43", "throughput": 2723.88, "total_tokens": 738621408} {"current_steps": 4095, "total_steps": 9134, "loss": 0.638, "learning_rate": 2.9040746088815142e-05, "epoch": 0.44828813049070854, "percentage": 44.83, "elapsed_time": "3 days, 3:20:31", "remaining_time": "3 days, 20:42:37", "throughput": 2723.86, "total_tokens": 738798368} {"current_steps": 4096, "total_steps": 9134, "loss": 0.8713, "learning_rate": 2.9032260287023698e-05, "epoch": 0.44839760256164646, "percentage": 44.84, "elapsed_time": "3 days, 3:21:40", "remaining_time": "3 days, 20:41:33", "throughput": 2723.87, "total_tokens": 738984960} {"current_steps": 4097, "total_steps": 9134, "loss": 0.7486, "learning_rate": 2.902377400822357e-05, "epoch": 0.4485070746325844, "percentage": 44.85, "elapsed_time": "3 days, 3:22:46", "remaining_time": "3 days, 20:40:28", "throughput": 2723.93, "total_tokens": 739185216} {"current_steps": 4098, "total_steps": 9134, "loss": 0.7816, "learning_rate": 2.9015287253418672e-05, "epoch": 0.44861654670352225, "percentage": 44.87, "elapsed_time": "3 days, 3:23:51", "remaining_time": "3 days, 20:39:19", "throughput": 2723.87, "total_tokens": 739343360} {"current_steps": 4099, "total_steps": 9134, "loss": 0.6913, "learning_rate": 2.900680002361297e-05, "epoch": 0.44872601877446017, "percentage": 44.88, "elapsed_time": "3 days, 3:24:52", "remaining_time": "3 days, 20:38:07", "throughput": 2723.79, "total_tokens": 739489856} {"current_steps": 4100, "total_steps": 9134, "loss": 0.5013, "learning_rate": 2.8998312319810482e-05, "epoch": 0.4488354908453981, "percentage": 44.89, "elapsed_time": "3 days, 3:25:57", "remaining_time": "3 days, 20:36:59", "throughput": 2723.78, "total_tokens": 739663008} {"current_steps": 4101, "total_steps": 9134, "loss": 0.7365, "learning_rate": 2.8989824143015286e-05, "epoch": 0.44894496291633595, "percentage": 44.9, "elapsed_time": "3 days, 3:27:03", "remaining_time": "3 days, 20:35:52", "throughput": 2723.79, "total_tokens": 739844672} {"current_steps": 4102, "total_steps": 9134, "loss": 0.7275, "learning_rate": 2.8981335494231533e-05, "epoch": 0.4490544349872739, "percentage": 44.91, "elapsed_time": "3 days, 3:28:10", "remaining_time": "3 days, 20:34:48", "throughput": 2723.85, "total_tokens": 740044256} {"current_steps": 4103, "total_steps": 9134, "loss": 0.899, "learning_rate": 2.8972846374463387e-05, "epoch": 0.4491639070582118, "percentage": 44.92, "elapsed_time": "3 days, 3:29:15", "remaining_time": "3 days, 20:33:40", "throughput": 2723.84, "total_tokens": 740218976} {"current_steps": 4104, "total_steps": 9134, "loss": 0.6348, "learning_rate": 2.896435678471512e-05, "epoch": 0.44927337912914966, "percentage": 44.93, "elapsed_time": "3 days, 3:30:24", "remaining_time": "3 days, 20:32:37", "throughput": 2723.91, "total_tokens": 740425056} {"current_steps": 4105, "total_steps": 9134, "loss": 0.7896, "learning_rate": 2.895586672599102e-05, "epoch": 0.4493828512000876, "percentage": 44.94, "elapsed_time": "3 days, 3:31:30", "remaining_time": "3 days, 20:31:30", "throughput": 2723.92, "total_tokens": 740608288} {"current_steps": 4106, "total_steps": 9134, "loss": 0.7365, "learning_rate": 2.894737619929545e-05, "epoch": 0.4494923232710255, "percentage": 44.95, "elapsed_time": "3 days, 3:32:36", "remaining_time": "3 days, 20:30:24", "throughput": 2723.96, "total_tokens": 740798240} {"current_steps": 4107, "total_steps": 9134, "loss": 0.9102, "learning_rate": 2.893888520563282e-05, "epoch": 0.4496017953419634, "percentage": 44.96, "elapsed_time": "3 days, 3:33:43", "remaining_time": "3 days, 20:29:18", "throughput": 2723.94, "total_tokens": 740975424} {"current_steps": 4108, "total_steps": 9134, "loss": 0.6858, "learning_rate": 2.8930393746007606e-05, "epoch": 0.4497112674129013, "percentage": 44.97, "elapsed_time": "3 days, 3:34:44", "remaining_time": "3 days, 20:28:06", "throughput": 2723.85, "total_tokens": 741119232} {"current_steps": 4109, "total_steps": 9134, "loss": 0.6842, "learning_rate": 2.8921901821424313e-05, "epoch": 0.44982073948383916, "percentage": 44.99, "elapsed_time": "3 days, 3:35:50", "remaining_time": "3 days, 20:26:59", "throughput": 2723.86, "total_tokens": 741298656} {"current_steps": 4110, "total_steps": 9134, "loss": 0.8468, "learning_rate": 2.8913409432887546e-05, "epoch": 0.4499302115547771, "percentage": 45.0, "elapsed_time": "3 days, 3:36:57", "remaining_time": "3 days, 20:25:53", "throughput": 2723.9, "total_tokens": 741493088} {"current_steps": 4111, "total_steps": 9134, "loss": 0.7091, "learning_rate": 2.8904916581401913e-05, "epoch": 0.450039683625715, "percentage": 45.01, "elapsed_time": "3 days, 3:38:02", "remaining_time": "3 days, 20:24:46", "throughput": 2723.92, "total_tokens": 741676992} {"current_steps": 4112, "total_steps": 9134, "loss": 0.7575, "learning_rate": 2.8896423267972123e-05, "epoch": 0.45014915569665287, "percentage": 45.02, "elapsed_time": "3 days, 3:39:08", "remaining_time": "3 days, 20:23:40", "throughput": 2723.96, "total_tokens": 741867168} {"current_steps": 4113, "total_steps": 9134, "loss": 0.7856, "learning_rate": 2.8887929493602905e-05, "epoch": 0.4502586277675908, "percentage": 45.03, "elapsed_time": "3 days, 3:40:15", "remaining_time": "3 days, 20:22:34", "throughput": 2723.93, "total_tokens": 742041664} {"current_steps": 4114, "total_steps": 9134, "loss": 0.7802, "learning_rate": 2.8879435259299065e-05, "epoch": 0.4503680998385287, "percentage": 45.04, "elapsed_time": "3 days, 3:41:24", "remaining_time": "3 days, 20:21:32", "throughput": 2724.03, "total_tokens": 742257600} {"current_steps": 4115, "total_steps": 9134, "loss": 0.6139, "learning_rate": 2.8870940566065442e-05, "epoch": 0.4504775719094666, "percentage": 45.05, "elapsed_time": "3 days, 3:42:31", "remaining_time": "3 days, 20:20:26", "throughput": 2723.97, "total_tokens": 742423136} {"current_steps": 4116, "total_steps": 9134, "loss": 0.6623, "learning_rate": 2.8862445414906953e-05, "epoch": 0.4505870439804045, "percentage": 45.06, "elapsed_time": "3 days, 3:43:35", "remaining_time": "3 days, 20:19:17", "throughput": 2723.98, "total_tokens": 742599648} {"current_steps": 4117, "total_steps": 9134, "loss": 0.8687, "learning_rate": 2.8853949806828558e-05, "epoch": 0.4506965160513424, "percentage": 45.07, "elapsed_time": "3 days, 3:44:43", "remaining_time": "3 days, 20:18:14", "throughput": 2724.05, "total_tokens": 742803488} {"current_steps": 4118, "total_steps": 9134, "loss": 0.6805, "learning_rate": 2.884545374283526e-05, "epoch": 0.4508059881222803, "percentage": 45.08, "elapsed_time": "3 days, 3:45:52", "remaining_time": "3 days, 20:17:11", "throughput": 2724.09, "total_tokens": 743003968} {"current_steps": 4119, "total_steps": 9134, "loss": 0.7523, "learning_rate": 2.8836957223932137e-05, "epoch": 0.4509154601932182, "percentage": 45.1, "elapsed_time": "3 days, 3:46:59", "remaining_time": "3 days, 20:16:05", "throughput": 2724.04, "total_tokens": 743171744} {"current_steps": 4120, "total_steps": 9134, "loss": 0.7095, "learning_rate": 2.8828460251124317e-05, "epoch": 0.45102493226415613, "percentage": 45.11, "elapsed_time": "3 days, 3:48:07", "remaining_time": "3 days, 20:15:01", "throughput": 2724.08, "total_tokens": 743366624} {"current_steps": 4121, "total_steps": 9134, "loss": 0.7463, "learning_rate": 2.881996282541697e-05, "epoch": 0.451134404335094, "percentage": 45.12, "elapsed_time": "3 days, 3:49:14", "remaining_time": "3 days, 20:13:56", "throughput": 2724.05, "total_tokens": 743542688} {"current_steps": 4122, "total_steps": 9134, "loss": 0.5331, "learning_rate": 2.8811464947815314e-05, "epoch": 0.4512438764060319, "percentage": 45.13, "elapsed_time": "3 days, 3:50:18", "remaining_time": "3 days, 20:12:47", "throughput": 2724.01, "total_tokens": 743706208} {"current_steps": 4123, "total_steps": 9134, "loss": 0.794, "learning_rate": 2.8802966619324645e-05, "epoch": 0.45135334847696984, "percentage": 45.14, "elapsed_time": "3 days, 3:51:27", "remaining_time": "3 days, 20:11:44", "throughput": 2724.14, "total_tokens": 743927968} {"current_steps": 4124, "total_steps": 9134, "loss": 0.6574, "learning_rate": 2.8794467840950295e-05, "epoch": 0.4514628205479077, "percentage": 45.15, "elapsed_time": "3 days, 3:52:33", "remaining_time": "3 days, 20:10:37", "throughput": 2724.14, "total_tokens": 744106720} {"current_steps": 4125, "total_steps": 9134, "loss": 0.5533, "learning_rate": 2.8785968613697655e-05, "epoch": 0.4515722926188456, "percentage": 45.16, "elapsed_time": "3 days, 3:53:40", "remaining_time": "3 days, 20:09:32", "throughput": 2724.19, "total_tokens": 744302496} {"current_steps": 4126, "total_steps": 9134, "loss": 0.8233, "learning_rate": 2.877746893857216e-05, "epoch": 0.4516817646897835, "percentage": 45.17, "elapsed_time": "3 days, 3:54:44", "remaining_time": "3 days, 20:08:23", "throughput": 2724.24, "total_tokens": 744490432} {"current_steps": 4127, "total_steps": 9134, "loss": 0.7654, "learning_rate": 2.8768968816579312e-05, "epoch": 0.4517912367607214, "percentage": 45.18, "elapsed_time": "3 days, 3:55:49", "remaining_time": "3 days, 20:07:16", "throughput": 2724.22, "total_tokens": 744665152} {"current_steps": 4128, "total_steps": 9134, "loss": 0.6564, "learning_rate": 2.8760468248724665e-05, "epoch": 0.45190070883165934, "percentage": 45.19, "elapsed_time": "3 days, 3:56:57", "remaining_time": "3 days, 20:06:11", "throughput": 2724.23, "total_tokens": 744849728} {"current_steps": 4129, "total_steps": 9134, "loss": 0.5281, "learning_rate": 2.875196723601381e-05, "epoch": 0.4520101809025972, "percentage": 45.2, "elapsed_time": "3 days, 3:58:01", "remaining_time": "3 days, 20:05:02", "throughput": 2724.24, "total_tokens": 745029600} {"current_steps": 4130, "total_steps": 9134, "loss": 0.6389, "learning_rate": 2.8743465779452394e-05, "epoch": 0.4521196529735351, "percentage": 45.22, "elapsed_time": "3 days, 3:59:09", "remaining_time": "3 days, 20:03:59", "throughput": 2724.2, "total_tokens": 745204096} {"current_steps": 4131, "total_steps": 9134, "loss": 0.5771, "learning_rate": 2.8734963880046145e-05, "epoch": 0.45222912504447305, "percentage": 45.23, "elapsed_time": "3 days, 4:00:16", "remaining_time": "3 days, 20:02:53", "throughput": 2724.15, "total_tokens": 745374336} {"current_steps": 4132, "total_steps": 9134, "loss": 0.5602, "learning_rate": 2.8726461538800802e-05, "epoch": 0.4523385971154109, "percentage": 45.24, "elapsed_time": "3 days, 4:01:14", "remaining_time": "3 days, 20:01:37", "throughput": 2724.07, "total_tokens": 745508288} {"current_steps": 4133, "total_steps": 9134, "loss": 0.5364, "learning_rate": 2.871795875672219e-05, "epoch": 0.45244806918634883, "percentage": 45.25, "elapsed_time": "3 days, 4:02:22", "remaining_time": "3 days, 20:00:33", "throughput": 2724.11, "total_tokens": 745704512} {"current_steps": 4134, "total_steps": 9134, "loss": 0.6495, "learning_rate": 2.870945553481616e-05, "epoch": 0.45255754125728676, "percentage": 45.26, "elapsed_time": "3 days, 4:03:28", "remaining_time": "3 days, 19:59:26", "throughput": 2724.05, "total_tokens": 745868032} {"current_steps": 4135, "total_steps": 9134, "loss": 0.5812, "learning_rate": 2.8700951874088634e-05, "epoch": 0.4526670133282246, "percentage": 45.27, "elapsed_time": "3 days, 4:04:36", "remaining_time": "3 days, 19:58:22", "throughput": 2724.0, "total_tokens": 746040960} {"current_steps": 4136, "total_steps": 9134, "loss": 0.7929, "learning_rate": 2.869244777554557e-05, "epoch": 0.45277648539916254, "percentage": 45.28, "elapsed_time": "3 days, 4:05:46", "remaining_time": "3 days, 19:57:20", "throughput": 2724.06, "total_tokens": 746244576} {"current_steps": 4137, "total_steps": 9134, "loss": 0.6314, "learning_rate": 2.8683943240192997e-05, "epoch": 0.45288595747010046, "percentage": 45.29, "elapsed_time": "3 days, 4:06:55", "remaining_time": "3 days, 19:56:17", "throughput": 2724.05, "total_tokens": 746431840} {"current_steps": 4138, "total_steps": 9134, "loss": 0.8459, "learning_rate": 2.867543826903698e-05, "epoch": 0.45299542954103833, "percentage": 45.3, "elapsed_time": "3 days, 4:07:57", "remaining_time": "3 days, 19:55:06", "throughput": 2724.01, "total_tokens": 746588416} {"current_steps": 4139, "total_steps": 9134, "loss": 0.8173, "learning_rate": 2.866693286308364e-05, "epoch": 0.45310490161197625, "percentage": 45.31, "elapsed_time": "3 days, 4:09:05", "remaining_time": "3 days, 19:54:02", "throughput": 2723.98, "total_tokens": 746765152} {"current_steps": 4140, "total_steps": 9134, "loss": 0.755, "learning_rate": 2.8658427023339156e-05, "epoch": 0.4532143736829142, "percentage": 45.33, "elapsed_time": "3 days, 4:10:12", "remaining_time": "3 days, 19:52:56", "throughput": 2723.99, "total_tokens": 746951072} {"current_steps": 4141, "total_steps": 9134, "loss": 1.021, "learning_rate": 2.864992075080975e-05, "epoch": 0.45332384575385204, "percentage": 45.34, "elapsed_time": "3 days, 4:11:21", "remaining_time": "3 days, 19:51:54", "throughput": 2724.05, "total_tokens": 747156480} {"current_steps": 4142, "total_steps": 9134, "loss": 0.7432, "learning_rate": 2.8641414046501697e-05, "epoch": 0.45343331782478996, "percentage": 45.35, "elapsed_time": "3 days, 4:12:27", "remaining_time": "3 days, 19:50:47", "throughput": 2724.04, "total_tokens": 747331648} {"current_steps": 4143, "total_steps": 9134, "loss": 0.7253, "learning_rate": 2.8632906911421313e-05, "epoch": 0.4535427898957278, "percentage": 45.36, "elapsed_time": "3 days, 4:13:31", "remaining_time": "3 days, 19:49:39", "throughput": 2724.02, "total_tokens": 747502560} {"current_steps": 4144, "total_steps": 9134, "loss": 0.7932, "learning_rate": 2.8624399346575e-05, "epoch": 0.45365226196666575, "percentage": 45.37, "elapsed_time": "3 days, 4:14:40", "remaining_time": "3 days, 19:48:35", "throughput": 2724.09, "total_tokens": 747707296} {"current_steps": 4145, "total_steps": 9134, "loss": 0.5306, "learning_rate": 2.861589135296917e-05, "epoch": 0.45376173403760367, "percentage": 45.38, "elapsed_time": "3 days, 4:15:40", "remaining_time": "3 days, 19:47:22", "throughput": 2724.04, "total_tokens": 747858944} {"current_steps": 4146, "total_steps": 9134, "loss": 0.6339, "learning_rate": 2.8607382931610306e-05, "epoch": 0.45387120610854154, "percentage": 45.39, "elapsed_time": "3 days, 4:16:47", "remaining_time": "3 days, 19:46:16", "throughput": 2724.09, "total_tokens": 748054496} {"current_steps": 4147, "total_steps": 9134, "loss": 0.949, "learning_rate": 2.8598874083504933e-05, "epoch": 0.45398067817947946, "percentage": 45.4, "elapsed_time": "3 days, 4:17:55", "remaining_time": "3 days, 19:45:12", "throughput": 2724.17, "total_tokens": 748261248} {"current_steps": 4148, "total_steps": 9134, "loss": 0.7696, "learning_rate": 2.8590364809659632e-05, "epoch": 0.4540901502504174, "percentage": 45.41, "elapsed_time": "3 days, 4:18:56", "remaining_time": "3 days, 19:44:00", "throughput": 2724.15, "total_tokens": 748423424} {"current_steps": 4149, "total_steps": 9134, "loss": 0.7185, "learning_rate": 2.858185511108104e-05, "epoch": 0.45419962232135525, "percentage": 45.42, "elapsed_time": "3 days, 4:20:04", "remaining_time": "3 days, 19:42:55", "throughput": 2724.16, "total_tokens": 748609792} {"current_steps": 4150, "total_steps": 9134, "loss": 0.822, "learning_rate": 2.8573344988775834e-05, "epoch": 0.45430909439229317, "percentage": 45.43, "elapsed_time": "3 days, 4:21:13", "remaining_time": "3 days, 19:41:52", "throughput": 2724.17, "total_tokens": 748801760} {"current_steps": 4151, "total_steps": 9134, "loss": 0.5067, "learning_rate": 2.8564834443750753e-05, "epoch": 0.4544185664632311, "percentage": 45.45, "elapsed_time": "3 days, 4:22:17", "remaining_time": "3 days, 19:40:44", "throughput": 2724.14, "total_tokens": 748969536} {"current_steps": 4152, "total_steps": 9134, "loss": 0.6684, "learning_rate": 2.8556323477012577e-05, "epoch": 0.45452803853416895, "percentage": 45.46, "elapsed_time": "3 days, 4:23:22", "remaining_time": "3 days, 19:39:36", "throughput": 2724.12, "total_tokens": 749141344} {"current_steps": 4153, "total_steps": 9134, "loss": 0.6541, "learning_rate": 2.8547812089568128e-05, "epoch": 0.4546375106051069, "percentage": 45.47, "elapsed_time": "3 days, 4:24:31", "remaining_time": "3 days, 19:38:33", "throughput": 2724.17, "total_tokens": 749343168} {"current_steps": 4154, "total_steps": 9134, "loss": 0.8786, "learning_rate": 2.8539300282424288e-05, "epoch": 0.4547469826760448, "percentage": 45.48, "elapsed_time": "3 days, 4:25:36", "remaining_time": "3 days, 19:37:26", "throughput": 2724.15, "total_tokens": 749514304} {"current_steps": 4155, "total_steps": 9134, "loss": 0.5559, "learning_rate": 2.8530788056587993e-05, "epoch": 0.45485645474698266, "percentage": 45.49, "elapsed_time": "3 days, 4:26:41", "remaining_time": "3 days, 19:36:18", "throughput": 2724.15, "total_tokens": 749690592} {"current_steps": 4156, "total_steps": 9134, "loss": 0.8524, "learning_rate": 2.852227541306622e-05, "epoch": 0.4549659268179206, "percentage": 45.5, "elapsed_time": "3 days, 4:27:49", "remaining_time": "3 days, 19:35:14", "throughput": 2724.18, "total_tokens": 749885248} {"current_steps": 4157, "total_steps": 9134, "loss": 1.0456, "learning_rate": 2.851376235286599e-05, "epoch": 0.4550753988888585, "percentage": 45.51, "elapsed_time": "3 days, 4:28:57", "remaining_time": "3 days, 19:34:09", "throughput": 2724.19, "total_tokens": 750072736} {"current_steps": 4158, "total_steps": 9134, "loss": 0.7398, "learning_rate": 2.85052488769944e-05, "epoch": 0.4551848709597964, "percentage": 45.52, "elapsed_time": "3 days, 4:30:01", "remaining_time": "3 days, 19:33:00", "throughput": 2724.21, "total_tokens": 750250816} {"current_steps": 4159, "total_steps": 9134, "loss": 0.9143, "learning_rate": 2.849673498645857e-05, "epoch": 0.4552943430307343, "percentage": 45.53, "elapsed_time": "3 days, 4:31:07", "remaining_time": "3 days, 19:31:54", "throughput": 2724.24, "total_tokens": 750441664} {"current_steps": 4160, "total_steps": 9134, "loss": 0.4653, "learning_rate": 2.848822068226567e-05, "epoch": 0.45540381510167216, "percentage": 45.54, "elapsed_time": "3 days, 4:32:11", "remaining_time": "3 days, 19:30:45", "throughput": 2724.18, "total_tokens": 750596672} {"current_steps": 4161, "total_steps": 9134, "loss": 0.5955, "learning_rate": 2.8479705965422937e-05, "epoch": 0.4555132871726101, "percentage": 45.56, "elapsed_time": "3 days, 4:33:16", "remaining_time": "3 days, 19:29:38", "throughput": 2724.05, "total_tokens": 750740480} {"current_steps": 4162, "total_steps": 9134, "loss": 0.7815, "learning_rate": 2.8471190836937638e-05, "epoch": 0.455622759243548, "percentage": 45.57, "elapsed_time": "3 days, 4:34:22", "remaining_time": "3 days, 19:28:31", "throughput": 2724.07, "total_tokens": 750924384} {"current_steps": 4163, "total_steps": 9134, "loss": 0.5404, "learning_rate": 2.84626752978171e-05, "epoch": 0.45573223131448587, "percentage": 45.58, "elapsed_time": "3 days, 4:35:25", "remaining_time": "3 days, 19:27:21", "throughput": 2724.1, "total_tokens": 751105376} {"current_steps": 4164, "total_steps": 9134, "loss": 0.7871, "learning_rate": 2.845415934906869e-05, "epoch": 0.4558417033854238, "percentage": 45.59, "elapsed_time": "3 days, 4:36:30", "remaining_time": "3 days, 19:26:13", "throughput": 2724.11, "total_tokens": 751283680} {"current_steps": 4165, "total_steps": 9134, "loss": 0.6632, "learning_rate": 2.8445642991699835e-05, "epoch": 0.4559511754563617, "percentage": 45.6, "elapsed_time": "3 days, 4:37:35", "remaining_time": "3 days, 19:25:05", "throughput": 2724.07, "total_tokens": 751448992} {"current_steps": 4166, "total_steps": 9134, "loss": 0.8513, "learning_rate": 2.8437126226718e-05, "epoch": 0.4560606475272996, "percentage": 45.61, "elapsed_time": "3 days, 4:38:43", "remaining_time": "3 days, 19:24:01", "throughput": 2724.1, "total_tokens": 751643648} {"current_steps": 4167, "total_steps": 9134, "loss": 0.9216, "learning_rate": 2.8428609055130707e-05, "epoch": 0.4561701195982375, "percentage": 45.62, "elapsed_time": "3 days, 4:39:48", "remaining_time": "3 days, 19:22:54", "throughput": 2724.16, "total_tokens": 751836736} {"current_steps": 4168, "total_steps": 9134, "loss": 0.6976, "learning_rate": 2.8420091477945514e-05, "epoch": 0.4562795916691754, "percentage": 45.63, "elapsed_time": "3 days, 4:40:52", "remaining_time": "3 days, 19:21:45", "throughput": 2724.14, "total_tokens": 752004736} {"current_steps": 4169, "total_steps": 9134, "loss": 0.7811, "learning_rate": 2.8411573496170034e-05, "epoch": 0.4563890637401133, "percentage": 45.64, "elapsed_time": "3 days, 4:41:59", "remaining_time": "3 days, 19:20:40", "throughput": 2724.22, "total_tokens": 752211712} {"current_steps": 4170, "total_steps": 9134, "loss": 0.796, "learning_rate": 2.840305511081194e-05, "epoch": 0.4564985358110512, "percentage": 45.65, "elapsed_time": "3 days, 4:43:05", "remaining_time": "3 days, 19:19:33", "throughput": 2724.22, "total_tokens": 752391136} {"current_steps": 4171, "total_steps": 9134, "loss": 0.5451, "learning_rate": 2.8394536322878916e-05, "epoch": 0.45660800788198913, "percentage": 45.66, "elapsed_time": "3 days, 4:44:09", "remaining_time": "3 days, 19:18:24", "throughput": 2724.14, "total_tokens": 752544128} {"current_steps": 4172, "total_steps": 9134, "loss": 0.8127, "learning_rate": 2.838601713337875e-05, "epoch": 0.456717479952927, "percentage": 45.68, "elapsed_time": "3 days, 4:45:18", "remaining_time": "3 days, 19:17:20", "throughput": 2724.2, "total_tokens": 752744160} {"current_steps": 4173, "total_steps": 9134, "loss": 0.8205, "learning_rate": 2.8377497543319227e-05, "epoch": 0.4568269520238649, "percentage": 45.69, "elapsed_time": "3 days, 4:46:24", "remaining_time": "3 days, 19:16:14", "throughput": 2724.13, "total_tokens": 752907008} {"current_steps": 4174, "total_steps": 9134, "loss": 0.8, "learning_rate": 2.8368977553708198e-05, "epoch": 0.45693642409480284, "percentage": 45.7, "elapsed_time": "3 days, 4:47:29", "remaining_time": "3 days, 19:15:07", "throughput": 2724.17, "total_tokens": 753096288} {"current_steps": 4175, "total_steps": 9134, "loss": 0.739, "learning_rate": 2.836045716555357e-05, "epoch": 0.4570458961657407, "percentage": 45.71, "elapsed_time": "3 days, 4:48:35", "remaining_time": "3 days, 19:14:01", "throughput": 2724.15, "total_tokens": 753271456} {"current_steps": 4176, "total_steps": 9134, "loss": 0.4571, "learning_rate": 2.835193637986328e-05, "epoch": 0.4571553682366786, "percentage": 45.72, "elapsed_time": "3 days, 4:49:44", "remaining_time": "3 days, 19:12:57", "throughput": 2724.23, "total_tokens": 753479776} {"current_steps": 4177, "total_steps": 9134, "loss": 0.5259, "learning_rate": 2.8343415197645317e-05, "epoch": 0.4572648403076165, "percentage": 45.73, "elapsed_time": "3 days, 4:50:51", "remaining_time": "3 days, 19:11:52", "throughput": 2724.22, "total_tokens": 753660320} {"current_steps": 4178, "total_steps": 9134, "loss": 0.5846, "learning_rate": 2.8334893619907737e-05, "epoch": 0.4573743123785544, "percentage": 45.74, "elapsed_time": "3 days, 4:52:00", "remaining_time": "3 days, 19:10:49", "throughput": 2724.16, "total_tokens": 753830784} {"current_steps": 4179, "total_steps": 9134, "loss": 0.8426, "learning_rate": 2.8326371647658618e-05, "epoch": 0.45748378444949234, "percentage": 45.75, "elapsed_time": "3 days, 4:53:09", "remaining_time": "3 days, 19:09:46", "throughput": 2724.16, "total_tokens": 754016480} {"current_steps": 4180, "total_steps": 9134, "loss": 0.6645, "learning_rate": 2.831784928190609e-05, "epoch": 0.4575932565204302, "percentage": 45.76, "elapsed_time": "3 days, 4:54:12", "remaining_time": "3 days, 19:08:36", "throughput": 2724.17, "total_tokens": 754192768} {"current_steps": 4181, "total_steps": 9134, "loss": 0.5332, "learning_rate": 2.8309326523658324e-05, "epoch": 0.4577027285913681, "percentage": 45.77, "elapsed_time": "3 days, 4:55:18", "remaining_time": "3 days, 19:07:30", "throughput": 2724.18, "total_tokens": 754377120} {"current_steps": 4182, "total_steps": 9134, "loss": 0.7576, "learning_rate": 2.830080337392357e-05, "epoch": 0.45781220066230605, "percentage": 45.78, "elapsed_time": "3 days, 4:56:27", "remaining_time": "3 days, 19:06:26", "throughput": 2724.22, "total_tokens": 754573568} {"current_steps": 4183, "total_steps": 9134, "loss": 0.9079, "learning_rate": 2.8292279833710084e-05, "epoch": 0.4579216727332439, "percentage": 45.8, "elapsed_time": "3 days, 4:57:34", "remaining_time": "3 days, 19:05:21", "throughput": 2724.28, "total_tokens": 754772256} {"current_steps": 4184, "total_steps": 9134, "loss": 0.5969, "learning_rate": 2.828375590402618e-05, "epoch": 0.45803114480418183, "percentage": 45.81, "elapsed_time": "3 days, 4:58:39", "remaining_time": "3 days, 19:04:14", "throughput": 2724.25, "total_tokens": 754943840} {"current_steps": 4185, "total_steps": 9134, "loss": 0.7089, "learning_rate": 2.8275231585880236e-05, "epoch": 0.45814061687511975, "percentage": 45.82, "elapsed_time": "3 days, 4:59:47", "remaining_time": "3 days, 19:03:10", "throughput": 2724.21, "total_tokens": 755118112} {"current_steps": 4186, "total_steps": 9134, "loss": 0.7822, "learning_rate": 2.826670688028066e-05, "epoch": 0.4582500889460576, "percentage": 45.83, "elapsed_time": "3 days, 5:00:54", "remaining_time": "3 days, 19:02:04", "throughput": 2724.15, "total_tokens": 755281632} {"current_steps": 4187, "total_steps": 9134, "loss": 0.8449, "learning_rate": 2.8258181788235906e-05, "epoch": 0.45835956101699554, "percentage": 45.84, "elapsed_time": "3 days, 5:01:57", "remaining_time": "3 days, 19:00:54", "throughput": 2724.15, "total_tokens": 755453888} {"current_steps": 4188, "total_steps": 9134, "loss": 0.7468, "learning_rate": 2.824965631075447e-05, "epoch": 0.45846903308793346, "percentage": 45.85, "elapsed_time": "3 days, 5:03:04", "remaining_time": "3 days, 18:59:48", "throughput": 2724.09, "total_tokens": 755618976} {"current_steps": 4189, "total_steps": 9134, "loss": 0.5656, "learning_rate": 2.8241130448844905e-05, "epoch": 0.45857850515887133, "percentage": 45.86, "elapsed_time": "3 days, 5:04:09", "remaining_time": "3 days, 18:58:41", "throughput": 2724.11, "total_tokens": 755802432} {"current_steps": 4190, "total_steps": 9134, "loss": 0.7551, "learning_rate": 2.82326042035158e-05, "epoch": 0.45868797722980925, "percentage": 45.87, "elapsed_time": "3 days, 5:05:08", "remaining_time": "3 days, 18:57:26", "throughput": 2724.0, "total_tokens": 755932352} {"current_steps": 4191, "total_steps": 9134, "loss": 0.6234, "learning_rate": 2.8224077575775803e-05, "epoch": 0.4587974493007472, "percentage": 45.88, "elapsed_time": "3 days, 5:06:16", "remaining_time": "3 days, 18:56:22", "throughput": 2724.04, "total_tokens": 756128352} {"current_steps": 4192, "total_steps": 9134, "loss": 0.8083, "learning_rate": 2.8215550566633588e-05, "epoch": 0.45890692137168504, "percentage": 45.89, "elapsed_time": "3 days, 5:07:19", "remaining_time": "3 days, 18:55:12", "throughput": 2724.02, "total_tokens": 756295680} {"current_steps": 4193, "total_steps": 9134, "loss": 0.7964, "learning_rate": 2.820702317709789e-05, "epoch": 0.45901639344262296, "percentage": 45.91, "elapsed_time": "3 days, 5:08:21", "remaining_time": "3 days, 18:54:01", "throughput": 2723.95, "total_tokens": 756443968} {"current_steps": 4194, "total_steps": 9134, "loss": 0.5165, "learning_rate": 2.8198495408177484e-05, "epoch": 0.4591258655135608, "percentage": 45.92, "elapsed_time": "3 days, 5:09:24", "remaining_time": "3 days, 18:52:50", "throughput": 2723.88, "total_tokens": 756595840} {"current_steps": 4195, "total_steps": 9134, "loss": 0.6723, "learning_rate": 2.8189967260881183e-05, "epoch": 0.45923533758449875, "percentage": 45.93, "elapsed_time": "3 days, 5:10:30", "remaining_time": "3 days, 18:51:44", "throughput": 2723.87, "total_tokens": 756772800} {"current_steps": 4196, "total_steps": 9134, "loss": 0.6793, "learning_rate": 2.818143873621785e-05, "epoch": 0.45934480965543667, "percentage": 45.94, "elapsed_time": "3 days, 5:11:37", "remaining_time": "3 days, 18:50:39", "throughput": 2723.9, "total_tokens": 756963424} {"current_steps": 4197, "total_steps": 9134, "loss": 0.6344, "learning_rate": 2.8172909835196404e-05, "epoch": 0.45945428172637454, "percentage": 45.95, "elapsed_time": "3 days, 5:12:35", "remaining_time": "3 days, 18:49:24", "throughput": 2723.78, "total_tokens": 757089984} {"current_steps": 4198, "total_steps": 9134, "loss": 0.7127, "learning_rate": 2.8164380558825782e-05, "epoch": 0.45956375379731246, "percentage": 45.96, "elapsed_time": "3 days, 5:13:42", "remaining_time": "3 days, 18:48:18", "throughput": 2723.82, "total_tokens": 757284640} {"current_steps": 4199, "total_steps": 9134, "loss": 0.6374, "learning_rate": 2.8155850908114996e-05, "epoch": 0.4596732258682504, "percentage": 45.97, "elapsed_time": "3 days, 5:14:51", "remaining_time": "3 days, 18:47:15", "throughput": 2723.82, "total_tokens": 757471008} {"current_steps": 4200, "total_steps": 9134, "loss": 0.5336, "learning_rate": 2.814732088407308e-05, "epoch": 0.45978269793918825, "percentage": 45.98, "elapsed_time": "3 days, 5:15:52", "remaining_time": "3 days, 18:46:02", "throughput": 2723.72, "total_tokens": 757610560} {"current_steps": 4201, "total_steps": 9134, "loss": 0.9575, "learning_rate": 2.8138790487709115e-05, "epoch": 0.45989217001012617, "percentage": 45.99, "elapsed_time": "3 days, 5:17:01", "remaining_time": "3 days, 18:44:59", "throughput": 2723.75, "total_tokens": 757804992} {"current_steps": 4202, "total_steps": 9134, "loss": 0.5293, "learning_rate": 2.8130259720032237e-05, "epoch": 0.4600016420810641, "percentage": 46.0, "elapsed_time": "3 days, 5:18:03", "remaining_time": "3 days, 18:43:48", "throughput": 2723.69, "total_tokens": 757957312} {"current_steps": 4203, "total_steps": 9134, "loss": 0.639, "learning_rate": 2.812172858205162e-05, "epoch": 0.46011111415200195, "percentage": 46.01, "elapsed_time": "3 days, 5:19:10", "remaining_time": "3 days, 18:42:44", "throughput": 2723.73, "total_tokens": 758151744} {"current_steps": 4204, "total_steps": 9134, "loss": 0.6157, "learning_rate": 2.8113197074776477e-05, "epoch": 0.4602205862229399, "percentage": 46.03, "elapsed_time": "3 days, 5:20:18", "remaining_time": "3 days, 18:41:38", "throughput": 2723.64, "total_tokens": 758309888} {"current_steps": 4205, "total_steps": 9134, "loss": 0.9556, "learning_rate": 2.8104665199216074e-05, "epoch": 0.4603300582938778, "percentage": 46.04, "elapsed_time": "3 days, 5:21:21", "remaining_time": "3 days, 18:40:28", "throughput": 2723.65, "total_tokens": 758483936} {"current_steps": 4206, "total_steps": 9134, "loss": 0.7719, "learning_rate": 2.809613295637971e-05, "epoch": 0.46043953036481566, "percentage": 46.05, "elapsed_time": "3 days, 5:22:29", "remaining_time": "3 days, 18:39:24", "throughput": 2723.66, "total_tokens": 758672320} {"current_steps": 4207, "total_steps": 9134, "loss": 0.7458, "learning_rate": 2.8087600347276744e-05, "epoch": 0.4605490024357536, "percentage": 46.06, "elapsed_time": "3 days, 5:23:35", "remaining_time": "3 days, 18:38:18", "throughput": 2723.68, "total_tokens": 758860032} {"current_steps": 4208, "total_steps": 9134, "loss": 0.5115, "learning_rate": 2.8079067372916555e-05, "epoch": 0.4606584745066915, "percentage": 46.07, "elapsed_time": "3 days, 5:24:38", "remaining_time": "3 days, 18:37:08", "throughput": 2723.6, "total_tokens": 759009440} {"current_steps": 4209, "total_steps": 9134, "loss": 0.8742, "learning_rate": 2.8070534034308583e-05, "epoch": 0.4607679465776294, "percentage": 46.08, "elapsed_time": "3 days, 5:25:45", "remaining_time": "3 days, 18:36:03", "throughput": 2723.59, "total_tokens": 759190656} {"current_steps": 4210, "total_steps": 9134, "loss": 0.5874, "learning_rate": 2.8062000332462302e-05, "epoch": 0.4608774186485673, "percentage": 46.09, "elapsed_time": "3 days, 5:26:55", "remaining_time": "3 days, 18:35:01", "throughput": 2723.66, "total_tokens": 759398528} {"current_steps": 4211, "total_steps": 9134, "loss": 0.7034, "learning_rate": 2.805346626838723e-05, "epoch": 0.46098689071950516, "percentage": 46.1, "elapsed_time": "3 days, 5:27:58", "remaining_time": "3 days, 18:33:51", "throughput": 2723.67, "total_tokens": 759572128} {"current_steps": 4212, "total_steps": 9134, "loss": 1.0248, "learning_rate": 2.8044931843092948e-05, "epoch": 0.4610963627904431, "percentage": 46.11, "elapsed_time": "3 days, 5:29:06", "remaining_time": "3 days, 18:32:47", "throughput": 2723.67, "total_tokens": 759758272} {"current_steps": 4213, "total_steps": 9134, "loss": 0.7229, "learning_rate": 2.8036397057589038e-05, "epoch": 0.461205834861381, "percentage": 46.12, "elapsed_time": "3 days, 5:30:15", "remaining_time": "3 days, 18:31:44", "throughput": 2723.71, "total_tokens": 759958528} {"current_steps": 4214, "total_steps": 9134, "loss": 0.6246, "learning_rate": 2.8027861912885168e-05, "epoch": 0.46131530693231887, "percentage": 46.14, "elapsed_time": "3 days, 5:31:24", "remaining_time": "3 days, 18:30:41", "throughput": 2723.67, "total_tokens": 760135264} {"current_steps": 4215, "total_steps": 9134, "loss": 0.7071, "learning_rate": 2.801932640999102e-05, "epoch": 0.4614247790032568, "percentage": 46.15, "elapsed_time": "3 days, 5:32:31", "remaining_time": "3 days, 18:29:36", "throughput": 2723.59, "total_tokens": 760295200} {"current_steps": 4216, "total_steps": 9134, "loss": 0.7642, "learning_rate": 2.8010790549916333e-05, "epoch": 0.4615342510741947, "percentage": 46.16, "elapsed_time": "3 days, 5:33:39", "remaining_time": "3 days, 18:28:31", "throughput": 2723.64, "total_tokens": 760491872} {"current_steps": 4217, "total_steps": 9134, "loss": 0.6831, "learning_rate": 2.8002254333670874e-05, "epoch": 0.4616437231451326, "percentage": 46.17, "elapsed_time": "3 days, 5:34:46", "remaining_time": "3 days, 18:27:26", "throughput": 2723.63, "total_tokens": 760671520} {"current_steps": 4218, "total_steps": 9134, "loss": 0.835, "learning_rate": 2.7993717762264464e-05, "epoch": 0.4617531952160705, "percentage": 46.18, "elapsed_time": "3 days, 5:35:55", "remaining_time": "3 days, 18:26:23", "throughput": 2723.62, "total_tokens": 760858784} {"current_steps": 4219, "total_steps": 9134, "loss": 0.7763, "learning_rate": 2.7985180836706975e-05, "epoch": 0.4618626672870084, "percentage": 46.19, "elapsed_time": "3 days, 5:37:01", "remaining_time": "3 days, 18:25:16", "throughput": 2723.57, "total_tokens": 761024096} {"current_steps": 4220, "total_steps": 9134, "loss": 0.5668, "learning_rate": 2.7976643558008297e-05, "epoch": 0.4619721393579463, "percentage": 46.2, "elapsed_time": "3 days, 5:38:03", "remaining_time": "3 days, 18:24:05", "throughput": 2723.58, "total_tokens": 761196576} {"current_steps": 4221, "total_steps": 9134, "loss": 0.6902, "learning_rate": 2.7968105927178372e-05, "epoch": 0.4620816114288842, "percentage": 46.21, "elapsed_time": "3 days, 5:39:11", "remaining_time": "3 days, 18:23:02", "throughput": 2723.64, "total_tokens": 761399744} {"current_steps": 4222, "total_steps": 9134, "loss": 0.7692, "learning_rate": 2.7959567945227195e-05, "epoch": 0.46219108349982213, "percentage": 46.22, "elapsed_time": "3 days, 5:40:18", "remaining_time": "3 days, 18:21:56", "throughput": 2723.6, "total_tokens": 761567968} {"current_steps": 4223, "total_steps": 9134, "loss": 0.603, "learning_rate": 2.7951029613164782e-05, "epoch": 0.46230055557076, "percentage": 46.23, "elapsed_time": "3 days, 5:41:26", "remaining_time": "3 days, 18:20:52", "throughput": 2723.58, "total_tokens": 761750528} {"current_steps": 4224, "total_steps": 9134, "loss": 0.8188, "learning_rate": 2.7942490932001212e-05, "epoch": 0.4624100276416979, "percentage": 46.24, "elapsed_time": "3 days, 5:42:31", "remaining_time": "3 days, 18:19:44", "throughput": 2723.62, "total_tokens": 761936000} {"current_steps": 4225, "total_steps": 9134, "loss": 0.5685, "learning_rate": 2.7933951902746587e-05, "epoch": 0.46251949971263584, "percentage": 46.26, "elapsed_time": "3 days, 5:43:38", "remaining_time": "3 days, 18:18:38", "throughput": 2723.61, "total_tokens": 762116096} {"current_steps": 4226, "total_steps": 9134, "loss": 0.7955, "learning_rate": 2.792541252641106e-05, "epoch": 0.4626289717835737, "percentage": 46.27, "elapsed_time": "3 days, 5:44:47", "remaining_time": "3 days, 18:17:36", "throughput": 2723.65, "total_tokens": 762314336} {"current_steps": 4227, "total_steps": 9134, "loss": 0.8521, "learning_rate": 2.791687280400483e-05, "epoch": 0.4627384438545116, "percentage": 46.28, "elapsed_time": "3 days, 5:45:52", "remaining_time": "3 days, 18:16:29", "throughput": 2723.59, "total_tokens": 762476736} {"current_steps": 4228, "total_steps": 9134, "loss": 0.8275, "learning_rate": 2.790833273653812e-05, "epoch": 0.4628479159254495, "percentage": 46.29, "elapsed_time": "3 days, 5:47:01", "remaining_time": "3 days, 18:15:25", "throughput": 2723.6, "total_tokens": 762664896} {"current_steps": 4229, "total_steps": 9134, "loss": 0.8029, "learning_rate": 2.7899792325021207e-05, "epoch": 0.4629573879963874, "percentage": 46.3, "elapsed_time": "3 days, 5:48:05", "remaining_time": "3 days, 18:14:16", "throughput": 2723.55, "total_tokens": 762828192} {"current_steps": 4230, "total_steps": 9134, "loss": 0.8204, "learning_rate": 2.7891251570464406e-05, "epoch": 0.46306686006732534, "percentage": 46.31, "elapsed_time": "3 days, 5:49:12", "remaining_time": "3 days, 18:13:11", "throughput": 2723.57, "total_tokens": 763015904} {"current_steps": 4231, "total_steps": 9134, "loss": 0.7079, "learning_rate": 2.788271047387807e-05, "epoch": 0.4631763321382632, "percentage": 46.32, "elapsed_time": "3 days, 5:50:18", "remaining_time": "3 days, 18:12:04", "throughput": 2723.6, "total_tokens": 763202496} {"current_steps": 4232, "total_steps": 9134, "loss": 0.6894, "learning_rate": 2.7874169036272597e-05, "epoch": 0.4632858042092011, "percentage": 46.33, "elapsed_time": "3 days, 5:51:17", "remaining_time": "3 days, 18:10:50", "throughput": 2723.51, "total_tokens": 763336672} {"current_steps": 4233, "total_steps": 9134, "loss": 0.6564, "learning_rate": 2.7865627258658417e-05, "epoch": 0.46339527628013905, "percentage": 46.34, "elapsed_time": "3 days, 5:52:22", "remaining_time": "3 days, 18:09:43", "throughput": 2723.56, "total_tokens": 763531776} {"current_steps": 4234, "total_steps": 9134, "loss": 0.676, "learning_rate": 2.7857085142046013e-05, "epoch": 0.4635047483510769, "percentage": 46.35, "elapsed_time": "3 days, 5:53:28", "remaining_time": "3 days, 18:08:35", "throughput": 2723.52, "total_tokens": 763696416} {"current_steps": 4235, "total_steps": 9134, "loss": 0.6123, "learning_rate": 2.78485426874459e-05, "epoch": 0.46361422042201483, "percentage": 46.37, "elapsed_time": "3 days, 5:54:37", "remaining_time": "3 days, 18:07:32", "throughput": 2723.51, "total_tokens": 763880768} {"current_steps": 4236, "total_steps": 9134, "loss": 0.6461, "learning_rate": 2.783999989586863e-05, "epoch": 0.46372369249295275, "percentage": 46.38, "elapsed_time": "3 days, 5:55:44", "remaining_time": "3 days, 18:06:27", "throughput": 2723.52, "total_tokens": 764069152} {"current_steps": 4237, "total_steps": 9134, "loss": 0.7703, "learning_rate": 2.7831456768324805e-05, "epoch": 0.4638331645638906, "percentage": 46.39, "elapsed_time": "3 days, 5:56:52", "remaining_time": "3 days, 18:05:24", "throughput": 2723.52, "total_tokens": 764253504} {"current_steps": 4238, "total_steps": 9134, "loss": 0.8396, "learning_rate": 2.7822913305825054e-05, "epoch": 0.46394263663482854, "percentage": 46.4, "elapsed_time": "3 days, 5:58:02", "remaining_time": "3 days, 18:04:21", "throughput": 2723.54, "total_tokens": 764451296} {"current_steps": 4239, "total_steps": 9134, "loss": 0.8019, "learning_rate": 2.7814369509380055e-05, "epoch": 0.46405210870576646, "percentage": 46.41, "elapsed_time": "3 days, 5:59:08", "remaining_time": "3 days, 18:03:15", "throughput": 2723.54, "total_tokens": 764630048} {"current_steps": 4240, "total_steps": 9134, "loss": 0.733, "learning_rate": 2.7805825380000528e-05, "epoch": 0.46416158077670433, "percentage": 46.42, "elapsed_time": "3 days, 6:00:12", "remaining_time": "3 days, 18:02:06", "throughput": 2723.53, "total_tokens": 764801184} {"current_steps": 4241, "total_steps": 9134, "loss": 0.7258, "learning_rate": 2.779728091869722e-05, "epoch": 0.46427105284764225, "percentage": 46.43, "elapsed_time": "3 days, 6:01:18", "remaining_time": "3 days, 18:00:59", "throughput": 2723.5, "total_tokens": 764970528} {"current_steps": 4242, "total_steps": 9134, "loss": 0.8455, "learning_rate": 2.778873612648093e-05, "epoch": 0.4643805249185802, "percentage": 46.44, "elapsed_time": "3 days, 6:02:24", "remaining_time": "3 days, 17:59:53", "throughput": 2723.58, "total_tokens": 765174816} {"current_steps": 4243, "total_steps": 9134, "loss": 0.7934, "learning_rate": 2.778019100436248e-05, "epoch": 0.46448999698951804, "percentage": 46.45, "elapsed_time": "3 days, 6:03:32", "remaining_time": "3 days, 17:58:49", "throughput": 2723.62, "total_tokens": 765373280} {"current_steps": 4244, "total_steps": 9134, "loss": 0.6965, "learning_rate": 2.7771645553352753e-05, "epoch": 0.46459946906045596, "percentage": 46.46, "elapsed_time": "3 days, 6:04:41", "remaining_time": "3 days, 17:57:46", "throughput": 2723.68, "total_tokens": 765577568} {"current_steps": 4245, "total_steps": 9134, "loss": 0.5751, "learning_rate": 2.7763099774462646e-05, "epoch": 0.4647089411313938, "percentage": 46.47, "elapsed_time": "3 days, 6:05:43", "remaining_time": "3 days, 17:56:35", "throughput": 2723.65, "total_tokens": 765738624} {"current_steps": 4246, "total_steps": 9134, "loss": 0.6169, "learning_rate": 2.775455366870313e-05, "epoch": 0.46481841320233175, "percentage": 46.49, "elapsed_time": "3 days, 6:06:51", "remaining_time": "3 days, 17:55:30", "throughput": 2723.67, "total_tokens": 765927008} {"current_steps": 4247, "total_steps": 9134, "loss": 0.6674, "learning_rate": 2.774600723708518e-05, "epoch": 0.46492788527326967, "percentage": 46.5, "elapsed_time": "3 days, 6:08:00", "remaining_time": "3 days, 17:54:28", "throughput": 2723.75, "total_tokens": 766137792} {"current_steps": 4248, "total_steps": 9134, "loss": 0.6421, "learning_rate": 2.7737460480619827e-05, "epoch": 0.46503735734420754, "percentage": 46.51, "elapsed_time": "3 days, 6:09:02", "remaining_time": "3 days, 17:53:17", "throughput": 2723.68, "total_tokens": 766287424} {"current_steps": 4249, "total_steps": 9134, "loss": 0.6302, "learning_rate": 2.7728913400318125e-05, "epoch": 0.46514682941514546, "percentage": 46.52, "elapsed_time": "3 days, 6:10:11", "remaining_time": "3 days, 17:52:14", "throughput": 2723.76, "total_tokens": 766499328} {"current_steps": 4250, "total_steps": 9134, "loss": 0.6673, "learning_rate": 2.7720365997191188e-05, "epoch": 0.4652563014860834, "percentage": 46.53, "elapsed_time": "3 days, 6:11:20", "remaining_time": "3 days, 17:51:10", "throughput": 2723.77, "total_tokens": 766685920} {"current_steps": 4251, "total_steps": 9134, "loss": 0.8285, "learning_rate": 2.7711818272250152e-05, "epoch": 0.46536577355702125, "percentage": 46.54, "elapsed_time": "3 days, 6:12:27", "remaining_time": "3 days, 17:50:04", "throughput": 2723.82, "total_tokens": 766883040} {"current_steps": 4252, "total_steps": 9134, "loss": 0.6953, "learning_rate": 2.7703270226506196e-05, "epoch": 0.46547524562795917, "percentage": 46.55, "elapsed_time": "3 days, 6:13:26", "remaining_time": "3 days, 17:48:51", "throughput": 2723.76, "total_tokens": 767028640} {"current_steps": 4253, "total_steps": 9134, "loss": 0.6327, "learning_rate": 2.769472186097054e-05, "epoch": 0.4655847176988971, "percentage": 46.56, "elapsed_time": "3 days, 6:14:35", "remaining_time": "3 days, 17:47:47", "throughput": 2723.81, "total_tokens": 767231360} {"current_steps": 4254, "total_steps": 9134, "loss": 0.6156, "learning_rate": 2.7686173176654446e-05, "epoch": 0.46569418976983495, "percentage": 46.57, "elapsed_time": "3 days, 6:15:42", "remaining_time": "3 days, 17:46:42", "throughput": 2723.81, "total_tokens": 767412576} {"current_steps": 4255, "total_steps": 9134, "loss": 0.8213, "learning_rate": 2.7677624174569187e-05, "epoch": 0.4658036618407729, "percentage": 46.58, "elapsed_time": "3 days, 6:16:50", "remaining_time": "3 days, 17:45:38", "throughput": 2723.8, "total_tokens": 767595808} {"current_steps": 4256, "total_steps": 9134, "loss": 0.5815, "learning_rate": 2.766907485572612e-05, "epoch": 0.4659131339117108, "percentage": 46.6, "elapsed_time": "3 days, 6:17:58", "remaining_time": "3 days, 17:44:34", "throughput": 2723.81, "total_tokens": 767783520} {"current_steps": 4257, "total_steps": 9134, "loss": 0.5881, "learning_rate": 2.7660525221136595e-05, "epoch": 0.46602260598264866, "percentage": 46.61, "elapsed_time": "3 days, 6:19:05", "remaining_time": "3 days, 17:43:28", "throughput": 2723.77, "total_tokens": 767953984} {"current_steps": 4258, "total_steps": 9134, "loss": 0.9978, "learning_rate": 2.7651975271812026e-05, "epoch": 0.4661320780535866, "percentage": 46.62, "elapsed_time": "3 days, 6:20:11", "remaining_time": "3 days, 17:42:22", "throughput": 2723.69, "total_tokens": 768112352} {"current_steps": 4259, "total_steps": 9134, "loss": 0.6524, "learning_rate": 2.7643425008763845e-05, "epoch": 0.4662415501245245, "percentage": 46.63, "elapsed_time": "3 days, 6:21:15", "remaining_time": "3 days, 17:41:12", "throughput": 2723.65, "total_tokens": 768274976} {"current_steps": 4260, "total_steps": 9134, "loss": 0.7458, "learning_rate": 2.7634874433003545e-05, "epoch": 0.4663510221954624, "percentage": 46.64, "elapsed_time": "3 days, 6:22:19", "remaining_time": "3 days, 17:40:04", "throughput": 2723.57, "total_tokens": 768426848} {"current_steps": 4261, "total_steps": 9134, "loss": 0.9385, "learning_rate": 2.762632354554264e-05, "epoch": 0.4664604942664003, "percentage": 46.65, "elapsed_time": "3 days, 6:23:27", "remaining_time": "3 days, 17:39:00", "throughput": 2723.56, "total_tokens": 768608288} {"current_steps": 4262, "total_steps": 9134, "loss": 0.793, "learning_rate": 2.7617772347392672e-05, "epoch": 0.46656996633733816, "percentage": 46.66, "elapsed_time": "3 days, 6:24:34", "remaining_time": "3 days, 17:37:54", "throughput": 2723.49, "total_tokens": 768771584} {"current_steps": 4263, "total_steps": 9134, "loss": 0.6927, "learning_rate": 2.760922083956525e-05, "epoch": 0.4666794384082761, "percentage": 46.67, "elapsed_time": "3 days, 6:25:36", "remaining_time": "3 days, 17:36:44", "throughput": 2723.45, "total_tokens": 768930400} {"current_steps": 4264, "total_steps": 9134, "loss": 0.6679, "learning_rate": 2.7600669023071978e-05, "epoch": 0.466788910479214, "percentage": 46.68, "elapsed_time": "3 days, 6:26:43", "remaining_time": "3 days, 17:35:38", "throughput": 2723.46, "total_tokens": 769113632} {"current_steps": 4265, "total_steps": 9134, "loss": 0.5807, "learning_rate": 2.7592116898924537e-05, "epoch": 0.46689838255015187, "percentage": 46.69, "elapsed_time": "3 days, 6:27:46", "remaining_time": "3 days, 17:34:28", "throughput": 2723.34, "total_tokens": 769252512} {"current_steps": 4266, "total_steps": 9134, "loss": 0.7771, "learning_rate": 2.7583564468134615e-05, "epoch": 0.4670078546210898, "percentage": 46.7, "elapsed_time": "3 days, 6:28:53", "remaining_time": "3 days, 17:33:22", "throughput": 2723.4, "total_tokens": 769449408} {"current_steps": 4267, "total_steps": 9134, "loss": 1.1046, "learning_rate": 2.7575011731713968e-05, "epoch": 0.4671173266920277, "percentage": 46.72, "elapsed_time": "3 days, 6:30:00", "remaining_time": "3 days, 17:32:17", "throughput": 2723.43, "total_tokens": 769641600} {"current_steps": 4268, "total_steps": 9134, "loss": 0.7965, "learning_rate": 2.756645869067435e-05, "epoch": 0.4672267987629656, "percentage": 46.73, "elapsed_time": "3 days, 6:31:09", "remaining_time": "3 days, 17:31:14", "throughput": 2723.51, "total_tokens": 769851488} {"current_steps": 4269, "total_steps": 9134, "loss": 0.7947, "learning_rate": 2.7557905346027578e-05, "epoch": 0.4673362708339035, "percentage": 46.74, "elapsed_time": "3 days, 6:32:15", "remaining_time": "3 days, 17:30:08", "throughput": 2723.53, "total_tokens": 770039648} {"current_steps": 4270, "total_steps": 9134, "loss": 0.6467, "learning_rate": 2.7549351698785492e-05, "epoch": 0.4674457429048414, "percentage": 46.75, "elapsed_time": "3 days, 6:33:21", "remaining_time": "3 days, 17:29:02", "throughput": 2723.55, "total_tokens": 770225344} {"current_steps": 4271, "total_steps": 9134, "loss": 0.552, "learning_rate": 2.7540797749959974e-05, "epoch": 0.4675552149757793, "percentage": 46.76, "elapsed_time": "3 days, 6:34:28", "remaining_time": "3 days, 17:27:57", "throughput": 2723.53, "total_tokens": 770402976} {"current_steps": 4272, "total_steps": 9134, "loss": 0.8069, "learning_rate": 2.753224350056293e-05, "epoch": 0.4676646870467172, "percentage": 46.77, "elapsed_time": "3 days, 6:35:37", "remaining_time": "3 days, 17:26:53", "throughput": 2723.63, "total_tokens": 770615104} {"current_steps": 4273, "total_steps": 9134, "loss": 0.6014, "learning_rate": 2.7523688951606337e-05, "epoch": 0.46777415911765513, "percentage": 46.78, "elapsed_time": "3 days, 6:36:43", "remaining_time": "3 days, 17:25:47", "throughput": 2723.67, "total_tokens": 770809984} {"current_steps": 4274, "total_steps": 9134, "loss": 0.6194, "learning_rate": 2.751513410410216e-05, "epoch": 0.467883631188593, "percentage": 46.79, "elapsed_time": "3 days, 6:37:47", "remaining_time": "3 days, 17:24:37", "throughput": 2723.65, "total_tokens": 770975968} {"current_steps": 4275, "total_steps": 9134, "loss": 0.8015, "learning_rate": 2.7506578959062424e-05, "epoch": 0.4679931032595309, "percentage": 46.8, "elapsed_time": "3 days, 6:38:53", "remaining_time": "3 days, 17:23:31", "throughput": 2723.62, "total_tokens": 771149344} {"current_steps": 4276, "total_steps": 9134, "loss": 0.6043, "learning_rate": 2.7498023517499183e-05, "epoch": 0.46810257533046884, "percentage": 46.81, "elapsed_time": "3 days, 6:39:56", "remaining_time": "3 days, 17:22:22", "throughput": 2723.62, "total_tokens": 771318912} {"current_steps": 4277, "total_steps": 9134, "loss": 0.8178, "learning_rate": 2.7489467780424544e-05, "epoch": 0.4682120474014067, "percentage": 46.83, "elapsed_time": "3 days, 6:41:00", "remaining_time": "3 days, 17:21:13", "throughput": 2723.62, "total_tokens": 771494304} {"current_steps": 4278, "total_steps": 9134, "loss": 0.7673, "learning_rate": 2.7480911748850624e-05, "epoch": 0.4683215194723446, "percentage": 46.84, "elapsed_time": "3 days, 6:42:05", "remaining_time": "3 days, 17:20:05", "throughput": 2723.6, "total_tokens": 771662976} {"current_steps": 4279, "total_steps": 9134, "loss": 0.6127, "learning_rate": 2.7472355423789582e-05, "epoch": 0.4684309915432825, "percentage": 46.85, "elapsed_time": "3 days, 6:43:10", "remaining_time": "3 days, 17:18:58", "throughput": 2723.6, "total_tokens": 771844640} {"current_steps": 4280, "total_steps": 9134, "loss": 0.5756, "learning_rate": 2.746379880625362e-05, "epoch": 0.4685404636142204, "percentage": 46.86, "elapsed_time": "3 days, 6:44:12", "remaining_time": "3 days, 17:17:47", "throughput": 2723.59, "total_tokens": 772007488} {"current_steps": 4281, "total_steps": 9134, "loss": 0.6482, "learning_rate": 2.7455241897254974e-05, "epoch": 0.46864993568515834, "percentage": 46.87, "elapsed_time": "3 days, 6:45:21", "remaining_time": "3 days, 17:16:44", "throughput": 2723.55, "total_tokens": 772185792} {"current_steps": 4282, "total_steps": 9134, "loss": 0.6445, "learning_rate": 2.7446684697805907e-05, "epoch": 0.4687594077560962, "percentage": 46.88, "elapsed_time": "3 days, 6:46:27", "remaining_time": "3 days, 17:15:37", "throughput": 2723.48, "total_tokens": 772344160} {"current_steps": 4283, "total_steps": 9134, "loss": 0.6815, "learning_rate": 2.743812720891872e-05, "epoch": 0.4688688798270341, "percentage": 46.89, "elapsed_time": "3 days, 6:47:36", "remaining_time": "3 days, 17:14:34", "throughput": 2723.53, "total_tokens": 772547776} {"current_steps": 4284, "total_steps": 9134, "loss": 0.5607, "learning_rate": 2.742956943160574e-05, "epoch": 0.46897835189797205, "percentage": 46.9, "elapsed_time": "3 days, 6:48:44", "remaining_time": "3 days, 17:13:29", "throughput": 2723.52, "total_tokens": 772730336} {"current_steps": 4285, "total_steps": 9134, "loss": 0.8053, "learning_rate": 2.742101136687934e-05, "epoch": 0.4690878239689099, "percentage": 46.91, "elapsed_time": "3 days, 6:49:50", "remaining_time": "3 days, 17:12:23", "throughput": 2723.53, "total_tokens": 772911776} {"current_steps": 4286, "total_steps": 9134, "loss": 0.5849, "learning_rate": 2.7412453015751916e-05, "epoch": 0.46919729603984783, "percentage": 46.92, "elapsed_time": "3 days, 6:50:59", "remaining_time": "3 days, 17:11:20", "throughput": 2723.62, "total_tokens": 773125696} {"current_steps": 4287, "total_steps": 9134, "loss": 1.0683, "learning_rate": 2.7403894379235916e-05, "epoch": 0.46930676811078575, "percentage": 46.93, "elapsed_time": "3 days, 6:52:08", "remaining_time": "3 days, 17:10:16", "throughput": 2723.68, "total_tokens": 773328864} {"current_steps": 4288, "total_steps": 9134, "loss": 0.5099, "learning_rate": 2.7395335458343813e-05, "epoch": 0.4694162401817236, "percentage": 46.95, "elapsed_time": "3 days, 6:53:13", "remaining_time": "3 days, 17:09:09", "throughput": 2723.63, "total_tokens": 773491488} {"current_steps": 4289, "total_steps": 9134, "loss": 0.7875, "learning_rate": 2.7386776254088103e-05, "epoch": 0.46952571225266154, "percentage": 46.96, "elapsed_time": "3 days, 6:54:19", "remaining_time": "3 days, 17:08:03", "throughput": 2723.54, "total_tokens": 773648512} {"current_steps": 4290, "total_steps": 9134, "loss": 0.5539, "learning_rate": 2.7378216767481322e-05, "epoch": 0.46963518432359946, "percentage": 46.97, "elapsed_time": "3 days, 6:55:23", "remaining_time": "3 days, 17:06:54", "throughput": 2723.55, "total_tokens": 773823680} {"current_steps": 4291, "total_steps": 9134, "loss": 0.6998, "learning_rate": 2.736965699953605e-05, "epoch": 0.46974465639453733, "percentage": 46.98, "elapsed_time": "3 days, 6:56:31", "remaining_time": "3 days, 17:05:50", "throughput": 2723.59, "total_tokens": 774021248} {"current_steps": 4292, "total_steps": 9134, "loss": 0.8498, "learning_rate": 2.7361096951264882e-05, "epoch": 0.46985412846547525, "percentage": 46.99, "elapsed_time": "3 days, 6:57:37", "remaining_time": "3 days, 17:04:43", "throughput": 2723.66, "total_tokens": 774221952} {"current_steps": 4293, "total_steps": 9134, "loss": 0.7234, "learning_rate": 2.7352536623680454e-05, "epoch": 0.4699636005364132, "percentage": 47.0, "elapsed_time": "3 days, 6:58:43", "remaining_time": "3 days, 17:03:37", "throughput": 2723.65, "total_tokens": 774398688} {"current_steps": 4294, "total_steps": 9134, "loss": 0.7814, "learning_rate": 2.7343976017795443e-05, "epoch": 0.47007307260735104, "percentage": 47.01, "elapsed_time": "3 days, 6:59:46", "remaining_time": "3 days, 17:02:27", "throughput": 2723.53, "total_tokens": 774533088} {"current_steps": 4295, "total_steps": 9134, "loss": 0.6258, "learning_rate": 2.7335415134622548e-05, "epoch": 0.47018254467828896, "percentage": 47.02, "elapsed_time": "3 days, 7:00:48", "remaining_time": "3 days, 17:01:16", "throughput": 2723.45, "total_tokens": 774680928} {"current_steps": 4296, "total_steps": 9134, "loss": 0.8843, "learning_rate": 2.732685397517451e-05, "epoch": 0.4702920167492268, "percentage": 47.03, "elapsed_time": "3 days, 7:01:55", "remaining_time": "3 days, 17:00:10", "throughput": 2723.48, "total_tokens": 774872000} {"current_steps": 4297, "total_steps": 9134, "loss": 0.8768, "learning_rate": 2.731829254046409e-05, "epoch": 0.47040148882016475, "percentage": 47.04, "elapsed_time": "3 days, 7:03:04", "remaining_time": "3 days, 16:59:08", "throughput": 2723.51, "total_tokens": 775069344} {"current_steps": 4298, "total_steps": 9134, "loss": 0.6972, "learning_rate": 2.7309730831504105e-05, "epoch": 0.47051096089110267, "percentage": 47.05, "elapsed_time": "3 days, 7:04:10", "remaining_time": "3 days, 16:58:01", "throughput": 2723.49, "total_tokens": 775241824} {"current_steps": 4299, "total_steps": 9134, "loss": 0.8387, "learning_rate": 2.7301168849307364e-05, "epoch": 0.47062043296204054, "percentage": 47.07, "elapsed_time": "3 days, 7:05:20", "remaining_time": "3 days, 16:56:59", "throughput": 2723.53, "total_tokens": 775444768} {"current_steps": 4300, "total_steps": 9134, "loss": 0.7989, "learning_rate": 2.7292606594886756e-05, "epoch": 0.47072990503297846, "percentage": 47.08, "elapsed_time": "3 days, 7:06:28", "remaining_time": "3 days, 16:55:54", "throughput": 2723.54, "total_tokens": 775631360} {"current_steps": 4301, "total_steps": 9134, "loss": 0.7526, "learning_rate": 2.728404406925517e-05, "epoch": 0.4708393771039164, "percentage": 47.09, "elapsed_time": "3 days, 7:07:35", "remaining_time": "3 days, 16:54:49", "throughput": 2723.58, "total_tokens": 775824448} {"current_steps": 4302, "total_steps": 9134, "loss": 0.6731, "learning_rate": 2.727548127342554e-05, "epoch": 0.47094884917485424, "percentage": 47.1, "elapsed_time": "3 days, 7:08:42", "remaining_time": "3 days, 16:53:44", "throughput": 2723.63, "total_tokens": 776024928} {"current_steps": 4303, "total_steps": 9134, "loss": 0.7333, "learning_rate": 2.7266918208410824e-05, "epoch": 0.47105832124579217, "percentage": 47.11, "elapsed_time": "3 days, 7:09:46", "remaining_time": "3 days, 16:52:35", "throughput": 2723.66, "total_tokens": 776206592} {"current_steps": 4304, "total_steps": 9134, "loss": 0.6393, "learning_rate": 2.7258354875224014e-05, "epoch": 0.4711677933167301, "percentage": 47.12, "elapsed_time": "3 days, 7:10:47", "remaining_time": "3 days, 16:51:24", "throughput": 2723.6, "total_tokens": 776357568} {"current_steps": 4305, "total_steps": 9134, "loss": 0.778, "learning_rate": 2.7249791274878146e-05, "epoch": 0.47127726538766795, "percentage": 47.13, "elapsed_time": "3 days, 7:11:53", "remaining_time": "3 days, 16:50:17", "throughput": 2723.59, "total_tokens": 776530944} {"current_steps": 4306, "total_steps": 9134, "loss": 0.6682, "learning_rate": 2.724122740838626e-05, "epoch": 0.4713867374586059, "percentage": 47.14, "elapsed_time": "3 days, 7:12:59", "remaining_time": "3 days, 16:49:10", "throughput": 2723.6, "total_tokens": 776713952} {"current_steps": 4307, "total_steps": 9134, "loss": 0.8789, "learning_rate": 2.723266327676146e-05, "epoch": 0.4714962095295438, "percentage": 47.15, "elapsed_time": "3 days, 7:14:07", "remaining_time": "3 days, 16:48:06", "throughput": 2723.58, "total_tokens": 776894496} {"current_steps": 4308, "total_steps": 9134, "loss": 0.6702, "learning_rate": 2.722409888101686e-05, "epoch": 0.47160568160048166, "percentage": 47.16, "elapsed_time": "3 days, 7:15:16", "remaining_time": "3 days, 16:47:03", "throughput": 2723.57, "total_tokens": 777080416} {"current_steps": 4309, "total_steps": 9134, "loss": 0.8059, "learning_rate": 2.7215534222165622e-05, "epoch": 0.4717151536714196, "percentage": 47.18, "elapsed_time": "3 days, 7:16:25", "remaining_time": "3 days, 16:46:00", "throughput": 2723.63, "total_tokens": 777285152} {"current_steps": 4310, "total_steps": 9134, "loss": 0.7218, "learning_rate": 2.720696930122092e-05, "epoch": 0.4718246257423575, "percentage": 47.19, "elapsed_time": "3 days, 7:17:34", "remaining_time": "3 days, 16:44:57", "throughput": 2723.65, "total_tokens": 777477792} {"current_steps": 4311, "total_steps": 9134, "loss": 0.9108, "learning_rate": 2.7198404119195965e-05, "epoch": 0.4719340978132954, "percentage": 47.2, "elapsed_time": "3 days, 7:18:44", "remaining_time": "3 days, 16:43:54", "throughput": 2723.63, "total_tokens": 777660800} {"current_steps": 4312, "total_steps": 9134, "loss": 0.8167, "learning_rate": 2.718983867710401e-05, "epoch": 0.4720435698842333, "percentage": 47.21, "elapsed_time": "3 days, 7:19:53", "remaining_time": "3 days, 16:42:51", "throughput": 2723.62, "total_tokens": 777846048} {"current_steps": 4313, "total_steps": 9134, "loss": 0.5095, "learning_rate": 2.7181272975958318e-05, "epoch": 0.47215304195517116, "percentage": 47.22, "elapsed_time": "3 days, 7:20:59", "remaining_time": "3 days, 16:41:45", "throughput": 2723.64, "total_tokens": 778036000} {"current_steps": 4314, "total_steps": 9134, "loss": 0.6635, "learning_rate": 2.717270701677221e-05, "epoch": 0.4722625140261091, "percentage": 47.23, "elapsed_time": "3 days, 7:22:09", "remaining_time": "3 days, 16:40:43", "throughput": 2723.65, "total_tokens": 778228192} {"current_steps": 4315, "total_steps": 9134, "loss": 0.7656, "learning_rate": 2.7164140800559013e-05, "epoch": 0.472371986097047, "percentage": 47.24, "elapsed_time": "3 days, 7:23:14", "remaining_time": "3 days, 16:39:36", "throughput": 2723.64, "total_tokens": 778402912} {"current_steps": 4316, "total_steps": 9134, "loss": 0.6086, "learning_rate": 2.7155574328332095e-05, "epoch": 0.47248145816798487, "percentage": 47.25, "elapsed_time": "3 days, 7:24:24", "remaining_time": "3 days, 16:38:33", "throughput": 2723.7, "total_tokens": 778608544} {"current_steps": 4317, "total_steps": 9134, "loss": 0.6855, "learning_rate": 2.7147007601104858e-05, "epoch": 0.4725909302389228, "percentage": 47.26, "elapsed_time": "3 days, 7:25:27", "remaining_time": "3 days, 16:37:24", "throughput": 2723.65, "total_tokens": 778766016} {"current_steps": 4318, "total_steps": 9134, "loss": 0.7241, "learning_rate": 2.713844061989072e-05, "epoch": 0.4727004023098607, "percentage": 47.27, "elapsed_time": "3 days, 7:26:33", "remaining_time": "3 days, 16:36:17", "throughput": 2723.62, "total_tokens": 778937152} {"current_steps": 4319, "total_steps": 9134, "loss": 0.8103, "learning_rate": 2.7129873385703146e-05, "epoch": 0.4728098743807986, "percentage": 47.28, "elapsed_time": "3 days, 7:27:39", "remaining_time": "3 days, 16:35:10", "throughput": 2723.59, "total_tokens": 779109856} {"current_steps": 4320, "total_steps": 9134, "loss": 0.6347, "learning_rate": 2.712130589955562e-05, "epoch": 0.4729193464517365, "percentage": 47.3, "elapsed_time": "3 days, 7:28:43", "remaining_time": "3 days, 16:34:02", "throughput": 2723.55, "total_tokens": 779272256} {"current_steps": 4321, "total_steps": 9134, "loss": 0.6893, "learning_rate": 2.711273816246167e-05, "epoch": 0.4730288185226744, "percentage": 47.31, "elapsed_time": "3 days, 7:29:48", "remaining_time": "3 days, 16:32:54", "throughput": 2723.52, "total_tokens": 779438688} {"current_steps": 4322, "total_steps": 9134, "loss": 0.82, "learning_rate": 2.710417017543483e-05, "epoch": 0.4731382905936123, "percentage": 47.32, "elapsed_time": "3 days, 7:30:57", "remaining_time": "3 days, 16:31:51", "throughput": 2723.53, "total_tokens": 779630208} {"current_steps": 4323, "total_steps": 9134, "loss": 0.7439, "learning_rate": 2.7095601939488685e-05, "epoch": 0.4732477626645502, "percentage": 47.33, "elapsed_time": "3 days, 7:32:05", "remaining_time": "3 days, 16:30:47", "throughput": 2723.58, "total_tokens": 779832928} {"current_steps": 4324, "total_steps": 9134, "loss": 0.677, "learning_rate": 2.7087033455636834e-05, "epoch": 0.47335723473548813, "percentage": 47.34, "elapsed_time": "3 days, 7:33:12", "remaining_time": "3 days, 16:29:42", "throughput": 2723.59, "total_tokens": 780015488} {"current_steps": 4325, "total_steps": 9134, "loss": 0.853, "learning_rate": 2.7078464724892917e-05, "epoch": 0.473466706806426, "percentage": 47.35, "elapsed_time": "3 days, 7:34:22", "remaining_time": "3 days, 16:28:39", "throughput": 2723.66, "total_tokens": 780225376} {"current_steps": 4326, "total_steps": 9134, "loss": 0.6221, "learning_rate": 2.706989574827059e-05, "epoch": 0.4735761788773639, "percentage": 47.36, "elapsed_time": "3 days, 7:35:27", "remaining_time": "3 days, 16:27:32", "throughput": 2723.65, "total_tokens": 780401664} {"current_steps": 4327, "total_steps": 9134, "loss": 0.599, "learning_rate": 2.7061326526783555e-05, "epoch": 0.47368565094830184, "percentage": 47.37, "elapsed_time": "3 days, 7:36:33", "remaining_time": "3 days, 16:26:25", "throughput": 2723.66, "total_tokens": 780583552} {"current_steps": 4328, "total_steps": 9134, "loss": 0.8147, "learning_rate": 2.7052757061445534e-05, "epoch": 0.4737951230192397, "percentage": 47.38, "elapsed_time": "3 days, 7:37:38", "remaining_time": "3 days, 16:25:17", "throughput": 2723.68, "total_tokens": 780764096} {"current_steps": 4329, "total_steps": 9134, "loss": 0.9329, "learning_rate": 2.7044187353270268e-05, "epoch": 0.4739045950901776, "percentage": 47.39, "elapsed_time": "3 days, 7:38:47", "remaining_time": "3 days, 16:24:15", "throughput": 2723.66, "total_tokens": 780949568} {"current_steps": 4330, "total_steps": 9134, "loss": 0.7073, "learning_rate": 2.703561740327156e-05, "epoch": 0.4740140671611155, "percentage": 47.41, "elapsed_time": "3 days, 7:39:52", "remaining_time": "3 days, 16:23:07", "throughput": 2723.6, "total_tokens": 781107264} {"current_steps": 4331, "total_steps": 9134, "loss": 0.7422, "learning_rate": 2.7027047212463198e-05, "epoch": 0.4741235392320534, "percentage": 47.42, "elapsed_time": "3 days, 7:40:55", "remaining_time": "3 days, 16:21:58", "throughput": 2723.54, "total_tokens": 781264960} {"current_steps": 4332, "total_steps": 9134, "loss": 0.7077, "learning_rate": 2.7018476781859027e-05, "epoch": 0.47423301130299134, "percentage": 47.43, "elapsed_time": "3 days, 7:42:03", "remaining_time": "3 days, 16:20:52", "throughput": 2723.57, "total_tokens": 781456032} {"current_steps": 4333, "total_steps": 9134, "loss": 0.6652, "learning_rate": 2.7009906112472904e-05, "epoch": 0.4743424833739292, "percentage": 47.44, "elapsed_time": "3 days, 7:43:10", "remaining_time": "3 days, 16:19:48", "throughput": 2723.58, "total_tokens": 781644192} {"current_steps": 4334, "total_steps": 9134, "loss": 0.8589, "learning_rate": 2.700133520531874e-05, "epoch": 0.4744519554448671, "percentage": 47.45, "elapsed_time": "3 days, 7:44:18", "remaining_time": "3 days, 16:18:43", "throughput": 2723.67, "total_tokens": 781852960} {"current_steps": 4335, "total_steps": 9134, "loss": 0.7215, "learning_rate": 2.6992764061410446e-05, "epoch": 0.47456142751580505, "percentage": 47.46, "elapsed_time": "3 days, 7:45:22", "remaining_time": "3 days, 16:17:34", "throughput": 2723.65, "total_tokens": 782022528} {"current_steps": 4336, "total_steps": 9134, "loss": 0.7996, "learning_rate": 2.6984192681761972e-05, "epoch": 0.4746708995867429, "percentage": 47.47, "elapsed_time": "3 days, 7:46:27", "remaining_time": "3 days, 16:16:27", "throughput": 2723.64, "total_tokens": 782194784} {"current_steps": 4337, "total_steps": 9134, "loss": 0.9537, "learning_rate": 2.6975621067387296e-05, "epoch": 0.47478037165768083, "percentage": 47.48, "elapsed_time": "3 days, 7:47:36", "remaining_time": "3 days, 16:15:23", "throughput": 2723.73, "total_tokens": 782408480} {"current_steps": 4338, "total_steps": 9134, "loss": 0.5328, "learning_rate": 2.6967049219300427e-05, "epoch": 0.47488984372861875, "percentage": 47.49, "elapsed_time": "3 days, 7:48:42", "remaining_time": "3 days, 16:14:17", "throughput": 2723.73, "total_tokens": 782588352} {"current_steps": 4339, "total_steps": 9134, "loss": 0.9314, "learning_rate": 2.6958477138515393e-05, "epoch": 0.4749993157995566, "percentage": 47.5, "elapsed_time": "3 days, 7:49:46", "remaining_time": "3 days, 16:13:09", "throughput": 2723.68, "total_tokens": 782750080} {"current_steps": 4340, "total_steps": 9134, "loss": 0.6225, "learning_rate": 2.6949904826046258e-05, "epoch": 0.47510878787049454, "percentage": 47.51, "elapsed_time": "3 days, 7:50:46", "remaining_time": "3 days, 16:11:55", "throughput": 2723.6, "total_tokens": 782889632} {"current_steps": 4341, "total_steps": 9134, "loss": 0.7861, "learning_rate": 2.6941332282907107e-05, "epoch": 0.47521825994143246, "percentage": 47.53, "elapsed_time": "3 days, 7:51:55", "remaining_time": "3 days, 16:10:52", "throughput": 2723.64, "total_tokens": 783088768} {"current_steps": 4342, "total_steps": 9134, "loss": 0.7144, "learning_rate": 2.693275951011206e-05, "epoch": 0.47532773201237033, "percentage": 47.54, "elapsed_time": "3 days, 7:53:00", "remaining_time": "3 days, 16:09:45", "throughput": 2723.62, "total_tokens": 783261920} {"current_steps": 4343, "total_steps": 9134, "loss": 0.658, "learning_rate": 2.692418650867526e-05, "epoch": 0.47543720408330825, "percentage": 47.55, "elapsed_time": "3 days, 7:54:05", "remaining_time": "3 days, 16:08:36", "throughput": 2723.61, "total_tokens": 783433056} {"current_steps": 4344, "total_steps": 9134, "loss": 0.9023, "learning_rate": 2.6915613279610874e-05, "epoch": 0.4755466761542462, "percentage": 47.56, "elapsed_time": "3 days, 7:55:12", "remaining_time": "3 days, 16:07:32", "throughput": 2723.64, "total_tokens": 783623904} {"current_steps": 4345, "total_steps": 9134, "loss": 0.5613, "learning_rate": 2.6907039823933093e-05, "epoch": 0.47565614822518404, "percentage": 47.57, "elapsed_time": "3 days, 7:56:13", "remaining_time": "3 days, 16:06:19", "throughput": 2723.57, "total_tokens": 783771520} {"current_steps": 4346, "total_steps": 9134, "loss": 0.6151, "learning_rate": 2.6898466142656154e-05, "epoch": 0.47576562029612196, "percentage": 47.58, "elapsed_time": "3 days, 7:57:14", "remaining_time": "3 days, 16:05:07", "throughput": 2723.5, "total_tokens": 783918240} {"current_steps": 4347, "total_steps": 9134, "loss": 0.5388, "learning_rate": 2.6889892236794294e-05, "epoch": 0.4758750923670598, "percentage": 47.59, "elapsed_time": "3 days, 7:58:20", "remaining_time": "3 days, 16:04:01", "throughput": 2723.46, "total_tokens": 784084672} {"current_steps": 4348, "total_steps": 9134, "loss": 0.6254, "learning_rate": 2.68813181073618e-05, "epoch": 0.47598456443799775, "percentage": 47.6, "elapsed_time": "3 days, 7:59:24", "remaining_time": "3 days, 16:02:53", "throughput": 2723.42, "total_tokens": 784248416} {"current_steps": 4349, "total_steps": 9134, "loss": 0.5564, "learning_rate": 2.687274375537297e-05, "epoch": 0.47609403650893567, "percentage": 47.61, "elapsed_time": "3 days, 8:00:31", "remaining_time": "3 days, 16:01:47", "throughput": 2723.37, "total_tokens": 784416864} {"current_steps": 4350, "total_steps": 9134, "loss": 0.8855, "learning_rate": 2.686416918184213e-05, "epoch": 0.47620350857987354, "percentage": 47.62, "elapsed_time": "3 days, 8:01:40", "remaining_time": "3 days, 16:00:44", "throughput": 2723.42, "total_tokens": 784620032} {"current_steps": 4351, "total_steps": 9134, "loss": 0.7481, "learning_rate": 2.6855594387783638e-05, "epoch": 0.47631298065081146, "percentage": 47.64, "elapsed_time": "3 days, 8:02:49", "remaining_time": "3 days, 15:59:41", "throughput": 2723.46, "total_tokens": 784818048} {"current_steps": 4352, "total_steps": 9134, "loss": 0.8672, "learning_rate": 2.6847019374211886e-05, "epoch": 0.4764224527217494, "percentage": 47.65, "elapsed_time": "3 days, 8:03:58", "remaining_time": "3 days, 15:58:38", "throughput": 2723.53, "total_tokens": 785028608} {"current_steps": 4353, "total_steps": 9134, "loss": 0.6204, "learning_rate": 2.6838444142141267e-05, "epoch": 0.47653192479268724, "percentage": 47.66, "elapsed_time": "3 days, 8:05:05", "remaining_time": "3 days, 15:57:32", "throughput": 2723.52, "total_tokens": 785206240} {"current_steps": 4354, "total_steps": 9134, "loss": 0.649, "learning_rate": 2.6829868692586218e-05, "epoch": 0.47664139686362517, "percentage": 47.67, "elapsed_time": "3 days, 8:06:11", "remaining_time": "3 days, 15:56:25", "throughput": 2723.49, "total_tokens": 785376032} {"current_steps": 4355, "total_steps": 9134, "loss": 0.7916, "learning_rate": 2.6821293026561206e-05, "epoch": 0.4767508689345631, "percentage": 47.68, "elapsed_time": "3 days, 8:07:17", "remaining_time": "3 days, 15:55:19", "throughput": 2723.56, "total_tokens": 785576064} {"current_steps": 4356, "total_steps": 9134, "loss": 0.7191, "learning_rate": 2.6812717145080713e-05, "epoch": 0.47686034100550095, "percentage": 47.69, "elapsed_time": "3 days, 8:08:23", "remaining_time": "3 days, 15:54:12", "throughput": 2723.58, "total_tokens": 785761088} {"current_steps": 4357, "total_steps": 9134, "loss": 0.5745, "learning_rate": 2.6804141049159243e-05, "epoch": 0.4769698130764389, "percentage": 47.7, "elapsed_time": "3 days, 8:09:29", "remaining_time": "3 days, 15:53:07", "throughput": 2723.65, "total_tokens": 785963808} {"current_steps": 4358, "total_steps": 9134, "loss": 0.6032, "learning_rate": 2.6795564739811335e-05, "epoch": 0.4770792851473768, "percentage": 47.71, "elapsed_time": "3 days, 8:10:33", "remaining_time": "3 days, 15:51:58", "throughput": 2723.62, "total_tokens": 786128672} {"current_steps": 4359, "total_steps": 9134, "loss": 0.8609, "learning_rate": 2.6786988218051556e-05, "epoch": 0.47718875721831466, "percentage": 47.72, "elapsed_time": "3 days, 8:11:41", "remaining_time": "3 days, 15:50:53", "throughput": 2723.63, "total_tokens": 786316832} {"current_steps": 4360, "total_steps": 9134, "loss": 0.5873, "learning_rate": 2.6778411484894478e-05, "epoch": 0.4772982292892526, "percentage": 47.73, "elapsed_time": "3 days, 8:12:43", "remaining_time": "3 days, 15:49:42", "throughput": 2723.6, "total_tokens": 786475872} {"current_steps": 4361, "total_steps": 9134, "loss": 0.7035, "learning_rate": 2.6769834541354727e-05, "epoch": 0.4774077013601905, "percentage": 47.74, "elapsed_time": "3 days, 8:13:50", "remaining_time": "3 days, 15:48:37", "throughput": 2723.68, "total_tokens": 786682400} {"current_steps": 4362, "total_steps": 9134, "loss": 0.8495, "learning_rate": 2.6761257388446924e-05, "epoch": 0.47751717343112837, "percentage": 47.76, "elapsed_time": "3 days, 8:14:56", "remaining_time": "3 days, 15:47:30", "throughput": 2723.64, "total_tokens": 786849952} {"current_steps": 4363, "total_steps": 9134, "loss": 0.8792, "learning_rate": 2.675268002718575e-05, "epoch": 0.4776266455020663, "percentage": 47.77, "elapsed_time": "3 days, 8:16:04", "remaining_time": "3 days, 15:46:26", "throughput": 2723.66, "total_tokens": 787042816} {"current_steps": 4364, "total_steps": 9134, "loss": 0.5287, "learning_rate": 2.674410245858588e-05, "epoch": 0.47773611757300416, "percentage": 47.78, "elapsed_time": "3 days, 8:17:10", "remaining_time": "3 days, 15:45:19", "throughput": 2723.63, "total_tokens": 787210144} {"current_steps": 4365, "total_steps": 9134, "loss": 0.5813, "learning_rate": 2.6735524683662017e-05, "epoch": 0.4778455896439421, "percentage": 47.79, "elapsed_time": "3 days, 8:18:14", "remaining_time": "3 days, 15:44:11", "throughput": 2723.57, "total_tokens": 787370080} {"current_steps": 4366, "total_steps": 9134, "loss": 0.9046, "learning_rate": 2.6726946703428908e-05, "epoch": 0.47795506171488, "percentage": 47.8, "elapsed_time": "3 days, 8:19:19", "remaining_time": "3 days, 15:43:03", "throughput": 2723.63, "total_tokens": 787563168} {"current_steps": 4367, "total_steps": 9134, "loss": 0.648, "learning_rate": 2.6718368518901295e-05, "epoch": 0.47806453378581787, "percentage": 47.81, "elapsed_time": "3 days, 8:20:24", "remaining_time": "3 days, 15:41:56", "throughput": 2723.6, "total_tokens": 787731840} {"current_steps": 4368, "total_steps": 9134, "loss": 0.7588, "learning_rate": 2.670979013109398e-05, "epoch": 0.4781740058567558, "percentage": 47.82, "elapsed_time": "3 days, 8:21:33", "remaining_time": "3 days, 15:40:53", "throughput": 2723.68, "total_tokens": 787943744} {"current_steps": 4369, "total_steps": 9134, "loss": 0.715, "learning_rate": 2.6701211541021757e-05, "epoch": 0.4782834779276937, "percentage": 47.83, "elapsed_time": "3 days, 8:22:41", "remaining_time": "3 days, 15:39:48", "throughput": 2723.67, "total_tokens": 788124736} {"current_steps": 4370, "total_steps": 9134, "loss": 0.9237, "learning_rate": 2.6692632749699463e-05, "epoch": 0.4783929499986316, "percentage": 47.84, "elapsed_time": "3 days, 8:23:49", "remaining_time": "3 days, 15:38:44", "throughput": 2723.74, "total_tokens": 788331040} {"current_steps": 4371, "total_steps": 9134, "loss": 0.5633, "learning_rate": 2.6684053758141948e-05, "epoch": 0.4785024220695695, "percentage": 47.85, "elapsed_time": "3 days, 8:24:57", "remaining_time": "3 days, 15:37:39", "throughput": 2723.75, "total_tokens": 788517184} {"current_steps": 4372, "total_steps": 9134, "loss": 0.7447, "learning_rate": 2.6675474567364096e-05, "epoch": 0.4786118941405074, "percentage": 47.87, "elapsed_time": "3 days, 8:26:03", "remaining_time": "3 days, 15:36:33", "throughput": 2723.72, "total_tokens": 788688096} {"current_steps": 4373, "total_steps": 9134, "loss": 0.6098, "learning_rate": 2.666689517838081e-05, "epoch": 0.4787213662114453, "percentage": 47.88, "elapsed_time": "3 days, 8:27:07", "remaining_time": "3 days, 15:35:24", "throughput": 2723.66, "total_tokens": 788846464} {"current_steps": 4374, "total_steps": 9134, "loss": 0.5732, "learning_rate": 2.6658315592206995e-05, "epoch": 0.4788308382823832, "percentage": 47.89, "elapsed_time": "3 days, 8:28:12", "remaining_time": "3 days, 15:34:17", "throughput": 2723.71, "total_tokens": 789037088} {"current_steps": 4375, "total_steps": 9134, "loss": 0.6179, "learning_rate": 2.664973580985763e-05, "epoch": 0.47894031035332113, "percentage": 47.9, "elapsed_time": "3 days, 8:29:18", "remaining_time": "3 days, 15:33:11", "throughput": 2723.74, "total_tokens": 789227264} {"current_steps": 4376, "total_steps": 9134, "loss": 0.8444, "learning_rate": 2.6641155832347668e-05, "epoch": 0.479049782424259, "percentage": 47.91, "elapsed_time": "3 days, 8:30:27", "remaining_time": "3 days, 15:32:08", "throughput": 2723.77, "total_tokens": 789424160} {"current_steps": 4377, "total_steps": 9134, "loss": 0.643, "learning_rate": 2.663257566069211e-05, "epoch": 0.4791592544951969, "percentage": 47.92, "elapsed_time": "3 days, 8:31:29", "remaining_time": "3 days, 15:30:57", "throughput": 2723.74, "total_tokens": 789584992} {"current_steps": 4378, "total_steps": 9134, "loss": 0.863, "learning_rate": 2.6623995295905974e-05, "epoch": 0.47926872656613484, "percentage": 47.93, "elapsed_time": "3 days, 8:32:38", "remaining_time": "3 days, 15:29:53", "throughput": 2723.75, "total_tokens": 789774720} {"current_steps": 4379, "total_steps": 9134, "loss": 0.5948, "learning_rate": 2.6615414739004297e-05, "epoch": 0.4793781986370727, "percentage": 47.94, "elapsed_time": "3 days, 8:33:40", "remaining_time": "3 days, 15:28:43", "throughput": 2723.72, "total_tokens": 789935328} {"current_steps": 4380, "total_steps": 9134, "loss": 0.7567, "learning_rate": 2.6606833991002146e-05, "epoch": 0.4794876707080106, "percentage": 47.95, "elapsed_time": "3 days, 8:34:48", "remaining_time": "3 days, 15:27:38", "throughput": 2723.73, "total_tokens": 790125056} {"current_steps": 4381, "total_steps": 9134, "loss": 0.6668, "learning_rate": 2.6598253052914596e-05, "epoch": 0.4795971427789485, "percentage": 47.96, "elapsed_time": "3 days, 8:35:56", "remaining_time": "3 days, 15:26:34", "throughput": 2723.75, "total_tokens": 790312320} {"current_steps": 4382, "total_steps": 9134, "loss": 0.7412, "learning_rate": 2.6589671925756777e-05, "epoch": 0.4797066148498864, "percentage": 47.97, "elapsed_time": "3 days, 8:37:03", "remaining_time": "3 days, 15:25:29", "throughput": 2723.74, "total_tokens": 790492640} {"current_steps": 4383, "total_steps": 9134, "loss": 0.6251, "learning_rate": 2.6581090610543796e-05, "epoch": 0.47981608692082434, "percentage": 47.99, "elapsed_time": "3 days, 8:38:11", "remaining_time": "3 days, 15:24:24", "throughput": 2723.69, "total_tokens": 790665568} {"current_steps": 4384, "total_steps": 9134, "loss": 0.6585, "learning_rate": 2.6572509108290826e-05, "epoch": 0.4799255589917622, "percentage": 48.0, "elapsed_time": "3 days, 8:39:19", "remaining_time": "3 days, 15:23:20", "throughput": 2723.65, "total_tokens": 790838272} {"current_steps": 4385, "total_steps": 9134, "loss": 0.7041, "learning_rate": 2.6563927420013036e-05, "epoch": 0.4800350310627001, "percentage": 48.01, "elapsed_time": "3 days, 8:40:27", "remaining_time": "3 days, 15:22:16", "throughput": 2723.66, "total_tokens": 791025536} {"current_steps": 4386, "total_steps": 9134, "loss": 0.7529, "learning_rate": 2.6555345546725625e-05, "epoch": 0.48014450313363805, "percentage": 48.02, "elapsed_time": "3 days, 8:41:35", "remaining_time": "3 days, 15:21:11", "throughput": 2723.71, "total_tokens": 791225792} {"current_steps": 4387, "total_steps": 9134, "loss": 0.6692, "learning_rate": 2.6546763489443806e-05, "epoch": 0.4802539752045759, "percentage": 48.03, "elapsed_time": "3 days, 8:42:43", "remaining_time": "3 days, 15:20:07", "throughput": 2723.77, "total_tokens": 791427616} {"current_steps": 4388, "total_steps": 9134, "loss": 0.7764, "learning_rate": 2.6538181249182813e-05, "epoch": 0.48036344727551383, "percentage": 48.04, "elapsed_time": "3 days, 8:43:49", "remaining_time": "3 days, 15:19:01", "throughput": 2723.78, "total_tokens": 791612416} {"current_steps": 4389, "total_steps": 9134, "loss": 0.6676, "learning_rate": 2.652959882695793e-05, "epoch": 0.48047291934645175, "percentage": 48.05, "elapsed_time": "3 days, 8:44:52", "remaining_time": "3 days, 15:17:51", "throughput": 2723.76, "total_tokens": 791777952} {"current_steps": 4390, "total_steps": 9134, "loss": 0.5715, "learning_rate": 2.6521016223784427e-05, "epoch": 0.4805823914173896, "percentage": 48.06, "elapsed_time": "3 days, 8:45:59", "remaining_time": "3 days, 15:16:46", "throughput": 2723.74, "total_tokens": 791954240} {"current_steps": 4391, "total_steps": 9134, "loss": 0.6608, "learning_rate": 2.6512433440677613e-05, "epoch": 0.48069186348832754, "percentage": 48.07, "elapsed_time": "3 days, 8:47:05", "remaining_time": "3 days, 15:15:39", "throughput": 2723.74, "total_tokens": 792132992} {"current_steps": 4392, "total_steps": 9134, "loss": 0.5923, "learning_rate": 2.6503850478652815e-05, "epoch": 0.48080133555926546, "percentage": 48.08, "elapsed_time": "3 days, 8:48:12", "remaining_time": "3 days, 15:14:33", "throughput": 2723.73, "total_tokens": 792313536} {"current_steps": 4393, "total_steps": 9134, "loss": 0.6078, "learning_rate": 2.6495267338725375e-05, "epoch": 0.48091080763020333, "percentage": 48.1, "elapsed_time": "3 days, 8:49:19", "remaining_time": "3 days, 15:13:28", "throughput": 2723.75, "total_tokens": 792500576} {"current_steps": 4394, "total_steps": 9134, "loss": 0.5514, "learning_rate": 2.6486684021910667e-05, "epoch": 0.48102027970114125, "percentage": 48.11, "elapsed_time": "3 days, 8:50:27", "remaining_time": "3 days, 15:12:23", "throughput": 2723.77, "total_tokens": 792689632} {"current_steps": 4395, "total_steps": 9134, "loss": 0.6569, "learning_rate": 2.647810052922409e-05, "epoch": 0.4811297517720792, "percentage": 48.12, "elapsed_time": "3 days, 8:51:35", "remaining_time": "3 days, 15:11:20", "throughput": 2723.79, "total_tokens": 792885184} {"current_steps": 4396, "total_steps": 9134, "loss": 0.5656, "learning_rate": 2.6469516861681042e-05, "epoch": 0.48123922384301704, "percentage": 48.13, "elapsed_time": "3 days, 8:52:45", "remaining_time": "3 days, 15:10:17", "throughput": 2723.91, "total_tokens": 793107840} {"current_steps": 4397, "total_steps": 9134, "loss": 0.6172, "learning_rate": 2.6460933020296962e-05, "epoch": 0.48134869591395496, "percentage": 48.14, "elapsed_time": "3 days, 8:53:49", "remaining_time": "3 days, 15:09:08", "throughput": 2723.91, "total_tokens": 793283232} {"current_steps": 4398, "total_steps": 9134, "loss": 0.6068, "learning_rate": 2.6452349006087295e-05, "epoch": 0.4814581679848929, "percentage": 48.15, "elapsed_time": "3 days, 8:54:56", "remaining_time": "3 days, 15:08:03", "throughput": 2723.97, "total_tokens": 793481696} {"current_steps": 4399, "total_steps": 9134, "loss": 0.6319, "learning_rate": 2.644376482006752e-05, "epoch": 0.48156764005583075, "percentage": 48.16, "elapsed_time": "3 days, 8:55:59", "remaining_time": "3 days, 15:06:53", "throughput": 2723.89, "total_tokens": 793630880} {"current_steps": 4400, "total_steps": 9134, "loss": 0.7313, "learning_rate": 2.6435180463253123e-05, "epoch": 0.48167711212676867, "percentage": 48.17, "elapsed_time": "3 days, 8:57:05", "remaining_time": "3 days, 15:05:46", "throughput": 2723.91, "total_tokens": 793814784} {"current_steps": 4401, "total_steps": 9134, "loss": 0.9118, "learning_rate": 2.6426595936659616e-05, "epoch": 0.48178658419770654, "percentage": 48.18, "elapsed_time": "3 days, 8:58:13", "remaining_time": "3 days, 15:04:42", "throughput": 2723.85, "total_tokens": 793982336} {"current_steps": 4402, "total_steps": 9134, "loss": 0.8365, "learning_rate": 2.6418011241302543e-05, "epoch": 0.48189605626864446, "percentage": 48.19, "elapsed_time": "3 days, 8:59:22", "remaining_time": "3 days, 15:03:39", "throughput": 2723.93, "total_tokens": 794196480} {"current_steps": 4403, "total_steps": 9134, "loss": 0.6519, "learning_rate": 2.6409426378197456e-05, "epoch": 0.4820055283395824, "percentage": 48.2, "elapsed_time": "3 days, 9:00:24", "remaining_time": "3 days, 15:02:28", "throughput": 2723.89, "total_tokens": 794353504} {"current_steps": 4404, "total_steps": 9134, "loss": 0.7739, "learning_rate": 2.6400841348359913e-05, "epoch": 0.48211500041052024, "percentage": 48.22, "elapsed_time": "3 days, 9:01:30", "remaining_time": "3 days, 15:01:22", "throughput": 2723.93, "total_tokens": 794543232} {"current_steps": 4405, "total_steps": 9134, "loss": 0.6613, "learning_rate": 2.6392256152805517e-05, "epoch": 0.48222447248145817, "percentage": 48.23, "elapsed_time": "3 days, 9:02:38", "remaining_time": "3 days, 15:00:18", "throughput": 2723.97, "total_tokens": 794742592} {"current_steps": 4406, "total_steps": 9134, "loss": 0.6293, "learning_rate": 2.6383670792549885e-05, "epoch": 0.4823339445523961, "percentage": 48.24, "elapsed_time": "3 days, 9:03:40", "remaining_time": "3 days, 14:59:07", "throughput": 2723.96, "total_tokens": 794908800} {"current_steps": 4407, "total_steps": 9134, "loss": 0.769, "learning_rate": 2.6375085268608645e-05, "epoch": 0.48244341662333395, "percentage": 48.25, "elapsed_time": "3 days, 9:04:43", "remaining_time": "3 days, 14:57:57", "throughput": 2723.89, "total_tokens": 795058432} {"current_steps": 4408, "total_steps": 9134, "loss": 0.9351, "learning_rate": 2.636649958199744e-05, "epoch": 0.4825528886942719, "percentage": 48.26, "elapsed_time": "3 days, 9:05:53", "remaining_time": "3 days, 14:56:55", "throughput": 2723.94, "total_tokens": 795263392} {"current_steps": 4409, "total_steps": 9134, "loss": 0.62, "learning_rate": 2.635791373373195e-05, "epoch": 0.4826623607652098, "percentage": 48.27, "elapsed_time": "3 days, 9:06:56", "remaining_time": "3 days, 14:55:46", "throughput": 2723.92, "total_tokens": 795431616} {"current_steps": 4410, "total_steps": 9134, "loss": 0.8784, "learning_rate": 2.634932772482786e-05, "epoch": 0.48277183283614766, "percentage": 48.28, "elapsed_time": "3 days, 9:08:05", "remaining_time": "3 days, 14:54:42", "throughput": 2723.98, "total_tokens": 795633440} {"current_steps": 4411, "total_steps": 9134, "loss": 0.6956, "learning_rate": 2.634074155630088e-05, "epoch": 0.4828813049070856, "percentage": 48.29, "elapsed_time": "3 days, 9:09:10", "remaining_time": "3 days, 14:53:35", "throughput": 2723.99, "total_tokens": 795817120} {"current_steps": 4412, "total_steps": 9134, "loss": 0.7658, "learning_rate": 2.6332155229166738e-05, "epoch": 0.4829907769780235, "percentage": 48.3, "elapsed_time": "3 days, 9:10:20", "remaining_time": "3 days, 14:52:32", "throughput": 2724.0, "total_tokens": 796006848} {"current_steps": 4413, "total_steps": 9134, "loss": 0.9806, "learning_rate": 2.6323568744441173e-05, "epoch": 0.48310024904896137, "percentage": 48.31, "elapsed_time": "3 days, 9:11:26", "remaining_time": "3 days, 14:51:26", "throughput": 2724.02, "total_tokens": 796193440} {"current_steps": 4414, "total_steps": 9134, "loss": 1.08, "learning_rate": 2.631498210313997e-05, "epoch": 0.4832097211198993, "percentage": 48.32, "elapsed_time": "3 days, 9:12:33", "remaining_time": "3 days, 14:50:20", "throughput": 2724.08, "total_tokens": 796393696} {"current_steps": 4415, "total_steps": 9134, "loss": 0.8097, "learning_rate": 2.630639530627888e-05, "epoch": 0.4833191931908372, "percentage": 48.34, "elapsed_time": "3 days, 9:13:40", "remaining_time": "3 days, 14:49:15", "throughput": 2724.11, "total_tokens": 796585440} {"current_steps": 4416, "total_steps": 9134, "loss": 0.7643, "learning_rate": 2.6297808354873733e-05, "epoch": 0.4834286652617751, "percentage": 48.35, "elapsed_time": "3 days, 9:14:48", "remaining_time": "3 days, 14:48:10", "throughput": 2724.19, "total_tokens": 796793760} {"current_steps": 4417, "total_steps": 9134, "loss": 0.5665, "learning_rate": 2.6289221249940337e-05, "epoch": 0.483538137332713, "percentage": 48.36, "elapsed_time": "3 days, 9:15:54", "remaining_time": "3 days, 14:47:04", "throughput": 2724.23, "total_tokens": 796984384} {"current_steps": 4418, "total_steps": 9134, "loss": 0.4882, "learning_rate": 2.6280633992494536e-05, "epoch": 0.48364760940365087, "percentage": 48.37, "elapsed_time": "3 days, 9:16:56", "remaining_time": "3 days, 14:45:54", "throughput": 2724.18, "total_tokens": 797142080} {"current_steps": 4419, "total_steps": 9134, "loss": 0.8295, "learning_rate": 2.627204658355218e-05, "epoch": 0.4837570814745888, "percentage": 48.38, "elapsed_time": "3 days, 9:18:03", "remaining_time": "3 days, 14:44:48", "throughput": 2724.25, "total_tokens": 797341216} {"current_steps": 4420, "total_steps": 9134, "loss": 0.5711, "learning_rate": 2.6263459024129144e-05, "epoch": 0.4838665535455267, "percentage": 48.39, "elapsed_time": "3 days, 9:19:10", "remaining_time": "3 days, 14:43:42", "throughput": 2724.23, "total_tokens": 797519072} {"current_steps": 4421, "total_steps": 9134, "loss": 0.6282, "learning_rate": 2.6254871315241318e-05, "epoch": 0.4839760256164646, "percentage": 48.4, "elapsed_time": "3 days, 9:20:19", "remaining_time": "3 days, 14:42:39", "throughput": 2724.33, "total_tokens": 797736352} {"current_steps": 4422, "total_steps": 9134, "loss": 0.6268, "learning_rate": 2.6246283457904612e-05, "epoch": 0.4840854976874025, "percentage": 48.41, "elapsed_time": "3 days, 9:21:22", "remaining_time": "3 days, 14:41:29", "throughput": 2724.34, "total_tokens": 797910400} {"current_steps": 4423, "total_steps": 9134, "loss": 0.7688, "learning_rate": 2.6237695453134964e-05, "epoch": 0.4841949697583404, "percentage": 48.42, "elapsed_time": "3 days, 9:22:28", "remaining_time": "3 days, 14:40:23", "throughput": 2724.31, "total_tokens": 798082880} {"current_steps": 4424, "total_steps": 9134, "loss": 0.7146, "learning_rate": 2.6229107301948308e-05, "epoch": 0.4843044418292783, "percentage": 48.43, "elapsed_time": "3 days, 9:23:33", "remaining_time": "3 days, 14:39:15", "throughput": 2724.35, "total_tokens": 798269920} {"current_steps": 4425, "total_steps": 9134, "loss": 0.7889, "learning_rate": 2.62205190053606e-05, "epoch": 0.4844139139002162, "percentage": 48.45, "elapsed_time": "3 days, 9:24:39", "remaining_time": "3 days, 14:38:09", "throughput": 2724.33, "total_tokens": 798445536} {"current_steps": 4426, "total_steps": 9134, "loss": 0.8621, "learning_rate": 2.6211930564387832e-05, "epoch": 0.48452338597115413, "percentage": 48.46, "elapsed_time": "3 days, 9:25:44", "remaining_time": "3 days, 14:37:01", "throughput": 2724.34, "total_tokens": 798624512} {"current_steps": 4427, "total_steps": 9134, "loss": 0.5768, "learning_rate": 2.6203341980045996e-05, "epoch": 0.484632858042092, "percentage": 48.47, "elapsed_time": "3 days, 9:26:48", "remaining_time": "3 days, 14:35:53", "throughput": 2724.35, "total_tokens": 798803264} {"current_steps": 4428, "total_steps": 9134, "loss": 0.6256, "learning_rate": 2.6194753253351102e-05, "epoch": 0.4847423301130299, "percentage": 48.48, "elapsed_time": "3 days, 9:27:55", "remaining_time": "3 days, 14:34:48", "throughput": 2724.39, "total_tokens": 798996128} {"current_steps": 4429, "total_steps": 9134, "loss": 0.7118, "learning_rate": 2.6186164385319186e-05, "epoch": 0.48485180218396784, "percentage": 48.49, "elapsed_time": "3 days, 9:29:02", "remaining_time": "3 days, 14:33:42", "throughput": 2724.38, "total_tokens": 799178688} {"current_steps": 4430, "total_steps": 9134, "loss": 0.6527, "learning_rate": 2.6177575376966284e-05, "epoch": 0.4849612742549057, "percentage": 48.5, "elapsed_time": "3 days, 9:30:06", "remaining_time": "3 days, 14:32:34", "throughput": 2724.35, "total_tokens": 799344224} {"current_steps": 4431, "total_steps": 9134, "loss": 0.8343, "learning_rate": 2.6168986229308473e-05, "epoch": 0.4850707463258436, "percentage": 48.51, "elapsed_time": "3 days, 9:31:13", "remaining_time": "3 days, 14:31:28", "throughput": 2724.38, "total_tokens": 799533728} {"current_steps": 4432, "total_steps": 9134, "loss": 0.7435, "learning_rate": 2.6160396943361827e-05, "epoch": 0.48518021839678155, "percentage": 48.52, "elapsed_time": "3 days, 9:32:18", "remaining_time": "3 days, 14:30:20", "throughput": 2724.37, "total_tokens": 799706432} {"current_steps": 4433, "total_steps": 9134, "loss": 0.6554, "learning_rate": 2.6151807520142436e-05, "epoch": 0.4852896904677194, "percentage": 48.53, "elapsed_time": "3 days, 9:33:22", "remaining_time": "3 days, 14:29:12", "throughput": 2724.35, "total_tokens": 799876672} {"current_steps": 4434, "total_steps": 9134, "loss": 0.7752, "learning_rate": 2.6143217960666416e-05, "epoch": 0.48539916253865734, "percentage": 48.54, "elapsed_time": "3 days, 9:34:30", "remaining_time": "3 days, 14:28:08", "throughput": 2724.45, "total_tokens": 800091936} {"current_steps": 4435, "total_steps": 9134, "loss": 0.9503, "learning_rate": 2.6134628265949903e-05, "epoch": 0.4855086346095952, "percentage": 48.55, "elapsed_time": "3 days, 9:35:39", "remaining_time": "3 days, 14:27:04", "throughput": 2724.51, "total_tokens": 800296448} {"current_steps": 4436, "total_steps": 9134, "loss": 0.8758, "learning_rate": 2.6126038437009025e-05, "epoch": 0.4856181066805331, "percentage": 48.57, "elapsed_time": "3 days, 9:36:46", "remaining_time": "3 days, 14:25:58", "throughput": 2724.52, "total_tokens": 800480352} {"current_steps": 4437, "total_steps": 9134, "loss": 0.5211, "learning_rate": 2.6117448474859958e-05, "epoch": 0.48572757875147105, "percentage": 48.58, "elapsed_time": "3 days, 9:37:53", "remaining_time": "3 days, 14:24:53", "throughput": 2724.48, "total_tokens": 800652832} {"current_steps": 4438, "total_steps": 9134, "loss": 0.6511, "learning_rate": 2.6108858380518874e-05, "epoch": 0.4858370508224089, "percentage": 48.59, "elapsed_time": "3 days, 9:38:54", "remaining_time": "3 days, 14:23:42", "throughput": 2724.41, "total_tokens": 800797312} {"current_steps": 4439, "total_steps": 9134, "loss": 0.6788, "learning_rate": 2.6100268155001968e-05, "epoch": 0.48594652289334683, "percentage": 48.6, "elapsed_time": "3 days, 9:39:57", "remaining_time": "3 days, 14:22:32", "throughput": 2724.3, "total_tokens": 800938432} {"current_steps": 4440, "total_steps": 9134, "loss": 0.7295, "learning_rate": 2.6091677799325436e-05, "epoch": 0.48605599496428475, "percentage": 48.61, "elapsed_time": "3 days, 9:41:02", "remaining_time": "3 days, 14:21:25", "throughput": 2724.3, "total_tokens": 801115616} {"current_steps": 4441, "total_steps": 9134, "loss": 0.701, "learning_rate": 2.608308731450551e-05, "epoch": 0.4861654670352226, "percentage": 48.62, "elapsed_time": "3 days, 9:42:06", "remaining_time": "3 days, 14:20:16", "throughput": 2724.26, "total_tokens": 801276896} {"current_steps": 4442, "total_steps": 9134, "loss": 0.8499, "learning_rate": 2.607449670155842e-05, "epoch": 0.48627493910616054, "percentage": 48.63, "elapsed_time": "3 days, 9:43:12", "remaining_time": "3 days, 14:19:09", "throughput": 2724.27, "total_tokens": 801458560} {"current_steps": 4443, "total_steps": 9134, "loss": 0.5845, "learning_rate": 2.6065905961500432e-05, "epoch": 0.48638441117709846, "percentage": 48.64, "elapsed_time": "3 days, 9:44:15", "remaining_time": "3 days, 14:18:00", "throughput": 2724.2, "total_tokens": 801611776} {"current_steps": 4444, "total_steps": 9134, "loss": 0.7975, "learning_rate": 2.60573150953478e-05, "epoch": 0.48649388324803633, "percentage": 48.65, "elapsed_time": "3 days, 9:45:25", "remaining_time": "3 days, 14:16:57", "throughput": 2724.21, "total_tokens": 801803296} {"current_steps": 4445, "total_steps": 9134, "loss": 0.7043, "learning_rate": 2.6048724104116818e-05, "epoch": 0.48660335531897425, "percentage": 48.66, "elapsed_time": "3 days, 9:46:34", "remaining_time": "3 days, 14:15:54", "throughput": 2724.15, "total_tokens": 801974656} {"current_steps": 4446, "total_steps": 9134, "loss": 0.7022, "learning_rate": 2.6040132988823775e-05, "epoch": 0.4867128273899122, "percentage": 48.68, "elapsed_time": "3 days, 9:47:39", "remaining_time": "3 days, 14:14:47", "throughput": 2724.17, "total_tokens": 802158336} {"current_steps": 4447, "total_steps": 9134, "loss": 0.887, "learning_rate": 2.603154175048499e-05, "epoch": 0.48682229946085004, "percentage": 48.69, "elapsed_time": "3 days, 9:48:45", "remaining_time": "3 days, 14:13:40", "throughput": 2724.14, "total_tokens": 802326560} {"current_steps": 4448, "total_steps": 9134, "loss": 0.7277, "learning_rate": 2.602295039011679e-05, "epoch": 0.48693177153178796, "percentage": 48.7, "elapsed_time": "3 days, 9:49:53", "remaining_time": "3 days, 14:12:36", "throughput": 2724.21, "total_tokens": 802533312} {"current_steps": 4449, "total_steps": 9134, "loss": 0.5252, "learning_rate": 2.6014358908735504e-05, "epoch": 0.4870412436027259, "percentage": 48.71, "elapsed_time": "3 days, 9:50:53", "remaining_time": "3 days, 14:11:23", "throughput": 2724.15, "total_tokens": 802682720} {"current_steps": 4450, "total_steps": 9134, "loss": 0.667, "learning_rate": 2.600576730735751e-05, "epoch": 0.48715071567366375, "percentage": 48.72, "elapsed_time": "3 days, 9:52:02", "remaining_time": "3 days, 14:10:20", "throughput": 2724.17, "total_tokens": 802874912} {"current_steps": 4451, "total_steps": 9134, "loss": 0.7728, "learning_rate": 2.5997175586999163e-05, "epoch": 0.48726018774460167, "percentage": 48.73, "elapsed_time": "3 days, 9:53:10", "remaining_time": "3 days, 14:09:15", "throughput": 2724.17, "total_tokens": 803060384} {"current_steps": 4452, "total_steps": 9134, "loss": 0.9502, "learning_rate": 2.5988583748676854e-05, "epoch": 0.48736965981553954, "percentage": 48.74, "elapsed_time": "3 days, 9:54:19", "remaining_time": "3 days, 14:08:12", "throughput": 2724.27, "total_tokens": 803274304} {"current_steps": 4453, "total_steps": 9134, "loss": 0.6277, "learning_rate": 2.597999179340697e-05, "epoch": 0.48747913188647746, "percentage": 48.75, "elapsed_time": "3 days, 9:55:21", "remaining_time": "3 days, 14:07:01", "throughput": 2724.21, "total_tokens": 803426848} {"current_steps": 4454, "total_steps": 9134, "loss": 0.8243, "learning_rate": 2.5971399722205936e-05, "epoch": 0.4875886039574154, "percentage": 48.76, "elapsed_time": "3 days, 9:56:30", "remaining_time": "3 days, 14:05:58", "throughput": 2724.21, "total_tokens": 803614784} {"current_steps": 4455, "total_steps": 9134, "loss": 0.7554, "learning_rate": 2.596280753609017e-05, "epoch": 0.48769807602835324, "percentage": 48.77, "elapsed_time": "3 days, 9:57:35", "remaining_time": "3 days, 14:04:50", "throughput": 2724.16, "total_tokens": 803776512} {"current_steps": 4456, "total_steps": 9134, "loss": 0.887, "learning_rate": 2.5954215236076113e-05, "epoch": 0.48780754809929117, "percentage": 48.78, "elapsed_time": "3 days, 9:58:40", "remaining_time": "3 days, 14:03:43", "throughput": 2724.15, "total_tokens": 803953920} {"current_steps": 4457, "total_steps": 9134, "loss": 0.8002, "learning_rate": 2.594562282318021e-05, "epoch": 0.4879170201702291, "percentage": 48.8, "elapsed_time": "3 days, 9:59:48", "remaining_time": "3 days, 14:02:39", "throughput": 2724.19, "total_tokens": 804149472} {"current_steps": 4458, "total_steps": 9134, "loss": 0.7096, "learning_rate": 2.5937030298418945e-05, "epoch": 0.48802649224116695, "percentage": 48.81, "elapsed_time": "3 days, 10:00:58", "remaining_time": "3 days, 14:01:36", "throughput": 2724.22, "total_tokens": 804347936} {"current_steps": 4459, "total_steps": 9134, "loss": 0.8319, "learning_rate": 2.5928437662808785e-05, "epoch": 0.4881359643121049, "percentage": 48.82, "elapsed_time": "3 days, 10:02:03", "remaining_time": "3 days, 14:00:29", "throughput": 2724.17, "total_tokens": 804512352} {"current_steps": 4460, "total_steps": 9134, "loss": 0.8599, "learning_rate": 2.5919844917366225e-05, "epoch": 0.4882454363830428, "percentage": 48.83, "elapsed_time": "3 days, 10:03:11", "remaining_time": "3 days, 13:59:25", "throughput": 2724.2, "total_tokens": 804707008} {"current_steps": 4461, "total_steps": 9134, "loss": 0.6703, "learning_rate": 2.5911252063107772e-05, "epoch": 0.48835490845398066, "percentage": 48.84, "elapsed_time": "3 days, 10:04:17", "remaining_time": "3 days, 13:58:18", "throughput": 2724.19, "total_tokens": 804879936} {"current_steps": 4462, "total_steps": 9134, "loss": 0.961, "learning_rate": 2.5902659101049933e-05, "epoch": 0.4884643805249186, "percentage": 48.85, "elapsed_time": "3 days, 10:05:23", "remaining_time": "3 days, 13:57:11", "throughput": 2724.2, "total_tokens": 805064736} {"current_steps": 4463, "total_steps": 9134, "loss": 0.6585, "learning_rate": 2.589406603220925e-05, "epoch": 0.4885738525958565, "percentage": 48.86, "elapsed_time": "3 days, 10:06:30", "remaining_time": "3 days, 13:56:06", "throughput": 2724.24, "total_tokens": 805259392} {"current_steps": 4464, "total_steps": 9134, "loss": 0.9244, "learning_rate": 2.5885472857602273e-05, "epoch": 0.48868332466679437, "percentage": 48.87, "elapsed_time": "3 days, 10:07:37", "remaining_time": "3 days, 13:55:01", "throughput": 2724.21, "total_tokens": 805432992} {"current_steps": 4465, "total_steps": 9134, "loss": 0.7632, "learning_rate": 2.5876879578245543e-05, "epoch": 0.4887927967377323, "percentage": 48.88, "elapsed_time": "3 days, 10:08:44", "remaining_time": "3 days, 13:53:56", "throughput": 2724.16, "total_tokens": 805600320} {"current_steps": 4466, "total_steps": 9134, "loss": 0.7125, "learning_rate": 2.5868286195155638e-05, "epoch": 0.4889022688086702, "percentage": 48.89, "elapsed_time": "3 days, 10:09:45", "remaining_time": "3 days, 13:52:44", "throughput": 2724.12, "total_tokens": 805756896} {"current_steps": 4467, "total_steps": 9134, "loss": 0.6898, "learning_rate": 2.585969270934913e-05, "epoch": 0.4890117408796081, "percentage": 48.91, "elapsed_time": "3 days, 10:10:46", "remaining_time": "3 days, 13:51:31", "throughput": 2724.07, "total_tokens": 805904288} {"current_steps": 4468, "total_steps": 9134, "loss": 0.6502, "learning_rate": 2.5851099121842624e-05, "epoch": 0.489121212950546, "percentage": 48.92, "elapsed_time": "3 days, 10:11:51", "remaining_time": "3 days, 13:50:24", "throughput": 2724.09, "total_tokens": 806088864} {"current_steps": 4469, "total_steps": 9134, "loss": 0.5917, "learning_rate": 2.5842505433652713e-05, "epoch": 0.48923068502148387, "percentage": 48.93, "elapsed_time": "3 days, 10:12:58", "remaining_time": "3 days, 13:49:19", "throughput": 2724.12, "total_tokens": 806281280} {"current_steps": 4470, "total_steps": 9134, "loss": 0.8224, "learning_rate": 2.583391164579603e-05, "epoch": 0.4893401570924218, "percentage": 48.94, "elapsed_time": "3 days, 10:14:04", "remaining_time": "3 days, 13:48:12", "throughput": 2724.09, "total_tokens": 806451072} {"current_steps": 4471, "total_steps": 9134, "loss": 0.6617, "learning_rate": 2.5825317759289185e-05, "epoch": 0.4894496291633597, "percentage": 48.95, "elapsed_time": "3 days, 10:15:12", "remaining_time": "3 days, 13:47:08", "throughput": 2724.14, "total_tokens": 806652448} {"current_steps": 4472, "total_steps": 9134, "loss": 0.7852, "learning_rate": 2.581672377514883e-05, "epoch": 0.4895591012342976, "percentage": 48.96, "elapsed_time": "3 days, 10:16:19", "remaining_time": "3 days, 13:46:03", "throughput": 2724.2, "total_tokens": 806852704} {"current_steps": 4473, "total_steps": 9134, "loss": 0.7199, "learning_rate": 2.580812969439162e-05, "epoch": 0.4896685733052355, "percentage": 48.97, "elapsed_time": "3 days, 10:17:27", "remaining_time": "3 days, 13:44:59", "throughput": 2724.26, "total_tokens": 807056544} {"current_steps": 4474, "total_steps": 9134, "loss": 0.7812, "learning_rate": 2.5799535518034205e-05, "epoch": 0.4897780453761734, "percentage": 48.98, "elapsed_time": "3 days, 10:18:36", "remaining_time": "3 days, 13:43:55", "throughput": 2724.26, "total_tokens": 807243584} {"current_steps": 4475, "total_steps": 9134, "loss": 0.6906, "learning_rate": 2.579094124709327e-05, "epoch": 0.4898875174471113, "percentage": 48.99, "elapsed_time": "3 days, 10:19:43", "remaining_time": "3 days, 13:42:49", "throughput": 2724.26, "total_tokens": 807424352} {"current_steps": 4476, "total_steps": 9134, "loss": 0.6976, "learning_rate": 2.578234688258549e-05, "epoch": 0.4899969895180492, "percentage": 49.0, "elapsed_time": "3 days, 10:20:49", "remaining_time": "3 days, 13:41:43", "throughput": 2724.24, "total_tokens": 807598176} {"current_steps": 4477, "total_steps": 9134, "loss": 0.6548, "learning_rate": 2.5773752425527576e-05, "epoch": 0.49010646158898713, "percentage": 49.01, "elapsed_time": "3 days, 10:21:53", "remaining_time": "3 days, 13:40:35", "throughput": 2724.18, "total_tokens": 807757440} {"current_steps": 4478, "total_steps": 9134, "loss": 0.6487, "learning_rate": 2.576515787693622e-05, "epoch": 0.490215933659925, "percentage": 49.03, "elapsed_time": "3 days, 10:23:01", "remaining_time": "3 days, 13:39:30", "throughput": 2724.18, "total_tokens": 807940896} {"current_steps": 4479, "total_steps": 9134, "loss": 0.793, "learning_rate": 2.5756563237828158e-05, "epoch": 0.4903254057308629, "percentage": 49.04, "elapsed_time": "3 days, 10:24:02", "remaining_time": "3 days, 13:38:18", "throughput": 2724.06, "total_tokens": 808070368} {"current_steps": 4480, "total_steps": 9134, "loss": 0.7771, "learning_rate": 2.574796850922011e-05, "epoch": 0.49043487780180084, "percentage": 49.05, "elapsed_time": "3 days, 10:25:10", "remaining_time": "3 days, 13:37:14", "throughput": 2724.1, "total_tokens": 808270624} {"current_steps": 4481, "total_steps": 9134, "loss": 0.6574, "learning_rate": 2.573937369212882e-05, "epoch": 0.4905443498727387, "percentage": 49.06, "elapsed_time": "3 days, 10:26:19", "remaining_time": "3 days, 13:36:10", "throughput": 2724.13, "total_tokens": 808464832} {"current_steps": 4482, "total_steps": 9134, "loss": 0.702, "learning_rate": 2.5730778787571035e-05, "epoch": 0.4906538219436766, "percentage": 49.07, "elapsed_time": "3 days, 10:27:24", "remaining_time": "3 days, 13:35:03", "throughput": 2724.16, "total_tokens": 808650528} {"current_steps": 4483, "total_steps": 9134, "loss": 0.6131, "learning_rate": 2.5722183796563508e-05, "epoch": 0.49076329401461455, "percentage": 49.08, "elapsed_time": "3 days, 10:28:30", "remaining_time": "3 days, 13:33:56", "throughput": 2724.13, "total_tokens": 808821664} {"current_steps": 4484, "total_steps": 9134, "loss": 0.9082, "learning_rate": 2.571358872012303e-05, "epoch": 0.4908727660855524, "percentage": 49.09, "elapsed_time": "3 days, 10:29:38", "remaining_time": "3 days, 13:32:52", "throughput": 2724.11, "total_tokens": 809001984} {"current_steps": 4485, "total_steps": 9134, "loss": 0.7736, "learning_rate": 2.5704993559266364e-05, "epoch": 0.49098223815649034, "percentage": 49.1, "elapsed_time": "3 days, 10:30:47", "remaining_time": "3 days, 13:31:49", "throughput": 2724.07, "total_tokens": 809177824} {"current_steps": 4486, "total_steps": 9134, "loss": 0.8074, "learning_rate": 2.569639831501031e-05, "epoch": 0.4910917102274282, "percentage": 49.11, "elapsed_time": "3 days, 10:31:54", "remaining_time": "3 days, 13:30:44", "throughput": 2724.1, "total_tokens": 809369120} {"current_steps": 4487, "total_steps": 9134, "loss": 0.8023, "learning_rate": 2.5687802988371667e-05, "epoch": 0.4912011822983661, "percentage": 49.12, "elapsed_time": "3 days, 10:33:02", "remaining_time": "3 days, 13:29:39", "throughput": 2724.04, "total_tokens": 809534880} {"current_steps": 4488, "total_steps": 9134, "loss": 0.7795, "learning_rate": 2.5679207580367242e-05, "epoch": 0.49131065436930405, "percentage": 49.14, "elapsed_time": "3 days, 10:34:07", "remaining_time": "3 days, 13:28:32", "throughput": 2724.02, "total_tokens": 809707584} {"current_steps": 4489, "total_steps": 9134, "loss": 0.8149, "learning_rate": 2.5670612092013857e-05, "epoch": 0.4914201264402419, "percentage": 49.15, "elapsed_time": "3 days, 10:35:15", "remaining_time": "3 days, 13:27:27", "throughput": 2723.98, "total_tokens": 809882528} {"current_steps": 4490, "total_steps": 9134, "loss": 0.557, "learning_rate": 2.5662016524328346e-05, "epoch": 0.49152959851117983, "percentage": 49.16, "elapsed_time": "3 days, 10:36:22", "remaining_time": "3 days, 13:26:21", "throughput": 2724.0, "total_tokens": 810067776} {"current_steps": 4491, "total_steps": 9134, "loss": 0.682, "learning_rate": 2.565342087832755e-05, "epoch": 0.49163907058211775, "percentage": 49.17, "elapsed_time": "3 days, 10:37:29", "remaining_time": "3 days, 13:25:16", "throughput": 2724.03, "total_tokens": 810261536} {"current_steps": 4492, "total_steps": 9134, "loss": 0.7489, "learning_rate": 2.5644825155028314e-05, "epoch": 0.4917485426530556, "percentage": 49.18, "elapsed_time": "3 days, 10:38:36", "remaining_time": "3 days, 13:24:11", "throughput": 2724.03, "total_tokens": 810443648} {"current_steps": 4493, "total_steps": 9134, "loss": 0.6142, "learning_rate": 2.563622935544749e-05, "epoch": 0.49185801472399354, "percentage": 49.19, "elapsed_time": "3 days, 10:39:43", "remaining_time": "3 days, 13:23:06", "throughput": 2724.05, "total_tokens": 810632032} {"current_steps": 4494, "total_steps": 9134, "loss": 0.6247, "learning_rate": 2.5627633480601953e-05, "epoch": 0.49196748679493146, "percentage": 49.2, "elapsed_time": "3 days, 10:40:53", "remaining_time": "3 days, 13:22:03", "throughput": 2724.1, "total_tokens": 810838112} {"current_steps": 4495, "total_steps": 9134, "loss": 0.7199, "learning_rate": 2.561903753150857e-05, "epoch": 0.49207695886586933, "percentage": 49.21, "elapsed_time": "3 days, 10:42:00", "remaining_time": "3 days, 13:20:57", "throughput": 2724.15, "total_tokens": 811036128} {"current_steps": 4496, "total_steps": 9134, "loss": 0.7065, "learning_rate": 2.561044150918423e-05, "epoch": 0.49218643093680725, "percentage": 49.22, "elapsed_time": "3 days, 10:43:05", "remaining_time": "3 days, 13:19:50", "throughput": 2724.16, "total_tokens": 811214208} {"current_steps": 4497, "total_steps": 9134, "loss": 0.6394, "learning_rate": 2.5601845414645832e-05, "epoch": 0.4922959030077452, "percentage": 49.23, "elapsed_time": "3 days, 10:44:12", "remaining_time": "3 days, 13:18:44", "throughput": 2724.05, "total_tokens": 811364064} {"current_steps": 4498, "total_steps": 9134, "loss": 0.8001, "learning_rate": 2.5593249248910272e-05, "epoch": 0.49240537507868304, "percentage": 49.24, "elapsed_time": "3 days, 10:45:20", "remaining_time": "3 days, 13:17:41", "throughput": 2724.05, "total_tokens": 811551328} {"current_steps": 4499, "total_steps": 9134, "loss": 0.5506, "learning_rate": 2.558465301299445e-05, "epoch": 0.49251484714962096, "percentage": 49.26, "elapsed_time": "3 days, 10:46:23", "remaining_time": "3 days, 13:16:31", "throughput": 2724.03, "total_tokens": 811716640} {"current_steps": 4500, "total_steps": 9134, "loss": 0.7206, "learning_rate": 2.5576056707915308e-05, "epoch": 0.4926243192205589, "percentage": 49.27, "elapsed_time": "3 days, 10:47:32", "remaining_time": "3 days, 13:15:28", "throughput": 2724.05, "total_tokens": 811911520} {"current_steps": 4501, "total_steps": 9134, "loss": 0.8743, "learning_rate": 2.556746033468975e-05, "epoch": 0.49273379129149675, "percentage": 49.28, "elapsed_time": "3 days, 10:48:40", "remaining_time": "3 days, 13:14:23", "throughput": 2724.06, "total_tokens": 812097440} {"current_steps": 4502, "total_steps": 9134, "loss": 0.8324, "learning_rate": 2.5558863894334722e-05, "epoch": 0.49284326336243467, "percentage": 49.29, "elapsed_time": "3 days, 10:49:48", "remaining_time": "3 days, 13:13:18", "throughput": 2724.02, "total_tokens": 812271040} {"current_steps": 4503, "total_steps": 9134, "loss": 0.6287, "learning_rate": 2.5550267387867162e-05, "epoch": 0.49295273543337254, "percentage": 49.3, "elapsed_time": "3 days, 10:50:53", "remaining_time": "3 days, 13:12:11", "throughput": 2724.02, "total_tokens": 812446432} {"current_steps": 4504, "total_steps": 9134, "loss": 0.6071, "learning_rate": 2.5541670816304026e-05, "epoch": 0.49306220750431046, "percentage": 49.31, "elapsed_time": "3 days, 10:51:58", "remaining_time": "3 days, 13:11:03", "throughput": 2724.03, "total_tokens": 812626528} {"current_steps": 4505, "total_steps": 9134, "loss": 0.555, "learning_rate": 2.5533074180662265e-05, "epoch": 0.4931716795752484, "percentage": 49.32, "elapsed_time": "3 days, 10:53:02", "remaining_time": "3 days, 13:09:55", "throughput": 2724.04, "total_tokens": 812805728} {"current_steps": 4506, "total_steps": 9134, "loss": 0.6928, "learning_rate": 2.5524477481958846e-05, "epoch": 0.49328115164618624, "percentage": 49.33, "elapsed_time": "3 days, 10:54:04", "remaining_time": "3 days, 13:08:45", "throughput": 2724.03, "total_tokens": 812972608} {"current_steps": 4507, "total_steps": 9134, "loss": 0.7494, "learning_rate": 2.551588072121075e-05, "epoch": 0.49339062371712417, "percentage": 49.34, "elapsed_time": "3 days, 10:55:09", "remaining_time": "3 days, 13:07:37", "throughput": 2723.92, "total_tokens": 813116192} {"current_steps": 4508, "total_steps": 9134, "loss": 0.7713, "learning_rate": 2.5507283899434948e-05, "epoch": 0.4935000957880621, "percentage": 49.35, "elapsed_time": "3 days, 10:56:19", "remaining_time": "3 days, 13:06:34", "throughput": 2723.96, "total_tokens": 813316448} {"current_steps": 4509, "total_steps": 9134, "loss": 0.6535, "learning_rate": 2.549868701764842e-05, "epoch": 0.49360956785899995, "percentage": 49.37, "elapsed_time": "3 days, 10:57:26", "remaining_time": "3 days, 13:05:29", "throughput": 2724.02, "total_tokens": 813518496} {"current_steps": 4510, "total_steps": 9134, "loss": 0.6622, "learning_rate": 2.5490090076868177e-05, "epoch": 0.4937190399299379, "percentage": 49.38, "elapsed_time": "3 days, 10:58:34", "remaining_time": "3 days, 13:04:25", "throughput": 2724.03, "total_tokens": 813707104} {"current_steps": 4511, "total_steps": 9134, "loss": 0.791, "learning_rate": 2.5481493078111218e-05, "epoch": 0.4938285120008758, "percentage": 49.39, "elapsed_time": "3 days, 10:59:42", "remaining_time": "3 days, 13:03:21", "throughput": 2724.08, "total_tokens": 813908928} {"current_steps": 4512, "total_steps": 9134, "loss": 0.7506, "learning_rate": 2.547289602239455e-05, "epoch": 0.49393798407181366, "percentage": 49.4, "elapsed_time": "3 days, 11:00:51", "remaining_time": "3 days, 13:02:17", "throughput": 2724.12, "total_tokens": 814108288} {"current_steps": 4513, "total_steps": 9134, "loss": 0.7561, "learning_rate": 2.5464298910735186e-05, "epoch": 0.4940474561427516, "percentage": 49.41, "elapsed_time": "3 days, 11:01:58", "remaining_time": "3 days, 13:01:11", "throughput": 2724.16, "total_tokens": 814300032} {"current_steps": 4514, "total_steps": 9134, "loss": 0.5613, "learning_rate": 2.545570174415015e-05, "epoch": 0.4941569282136895, "percentage": 49.42, "elapsed_time": "3 days, 11:03:04", "remaining_time": "3 days, 13:00:05", "throughput": 2724.18, "total_tokens": 814487520} {"current_steps": 4515, "total_steps": 9134, "loss": 0.8227, "learning_rate": 2.5447104523656466e-05, "epoch": 0.49426640028462737, "percentage": 49.43, "elapsed_time": "3 days, 11:04:12", "remaining_time": "3 days, 12:59:01", "throughput": 2724.22, "total_tokens": 814686208} {"current_steps": 4516, "total_steps": 9134, "loss": 0.7865, "learning_rate": 2.543850725027117e-05, "epoch": 0.4943758723555653, "percentage": 49.44, "elapsed_time": "3 days, 11:05:22", "remaining_time": "3 days, 12:57:58", "throughput": 2724.28, "total_tokens": 814892512} {"current_steps": 4517, "total_steps": 9134, "loss": 0.9123, "learning_rate": 2.54299099250113e-05, "epoch": 0.4944853444265032, "percentage": 49.45, "elapsed_time": "3 days, 11:06:26", "remaining_time": "3 days, 12:56:50", "throughput": 2724.25, "total_tokens": 815059616} {"current_steps": 4518, "total_steps": 9134, "loss": 0.6339, "learning_rate": 2.5421312548893917e-05, "epoch": 0.4945948164974411, "percentage": 49.46, "elapsed_time": "3 days, 11:07:33", "remaining_time": "3 days, 12:55:44", "throughput": 2724.23, "total_tokens": 815235904} {"current_steps": 4519, "total_steps": 9134, "loss": 0.6855, "learning_rate": 2.5412715122936064e-05, "epoch": 0.494704288568379, "percentage": 49.47, "elapsed_time": "3 days, 11:08:41", "remaining_time": "3 days, 12:54:39", "throughput": 2724.28, "total_tokens": 815434592} {"current_steps": 4520, "total_steps": 9134, "loss": 0.7103, "learning_rate": 2.5404117648154794e-05, "epoch": 0.49481376063931687, "percentage": 49.49, "elapsed_time": "3 days, 11:09:47", "remaining_time": "3 days, 12:53:33", "throughput": 2724.26, "total_tokens": 815609984} {"current_steps": 4521, "total_steps": 9134, "loss": 0.5366, "learning_rate": 2.5395520125567185e-05, "epoch": 0.4949232327102548, "percentage": 49.5, "elapsed_time": "3 days, 11:10:55", "remaining_time": "3 days, 12:52:29", "throughput": 2724.24, "total_tokens": 815789408} {"current_steps": 4522, "total_steps": 9134, "loss": 0.8518, "learning_rate": 2.53869225561903e-05, "epoch": 0.4950327047811927, "percentage": 49.51, "elapsed_time": "3 days, 11:12:01", "remaining_time": "3 days, 12:51:22", "throughput": 2724.24, "total_tokens": 815966368} {"current_steps": 4523, "total_steps": 9134, "loss": 0.9355, "learning_rate": 2.537832494104121e-05, "epoch": 0.4951421768521306, "percentage": 49.52, "elapsed_time": "3 days, 11:13:10", "remaining_time": "3 days, 12:50:19", "throughput": 2724.32, "total_tokens": 816182528} {"current_steps": 4524, "total_steps": 9134, "loss": 0.8543, "learning_rate": 2.536972728113701e-05, "epoch": 0.4952516489230685, "percentage": 49.53, "elapsed_time": "3 days, 11:14:17", "remaining_time": "3 days, 12:49:13", "throughput": 2724.32, "total_tokens": 816363296} {"current_steps": 4525, "total_steps": 9134, "loss": 0.8236, "learning_rate": 2.536112957749478e-05, "epoch": 0.4953611209940064, "percentage": 49.54, "elapsed_time": "3 days, 11:15:25", "remaining_time": "3 days, 12:48:09", "throughput": 2724.31, "total_tokens": 816545184} {"current_steps": 4526, "total_steps": 9134, "loss": 0.8922, "learning_rate": 2.535253183113161e-05, "epoch": 0.4954705930649443, "percentage": 49.55, "elapsed_time": "3 days, 11:16:31", "remaining_time": "3 days, 12:47:02", "throughput": 2724.39, "total_tokens": 816747680} {"current_steps": 4527, "total_steps": 9134, "loss": 0.7905, "learning_rate": 2.5343934043064598e-05, "epoch": 0.4955800651358822, "percentage": 49.56, "elapsed_time": "3 days, 11:17:39", "remaining_time": "3 days, 12:45:58", "throughput": 2724.44, "total_tokens": 816949952} {"current_steps": 4528, "total_steps": 9134, "loss": 0.7685, "learning_rate": 2.5335336214310845e-05, "epoch": 0.49568953720682013, "percentage": 49.57, "elapsed_time": "3 days, 11:18:42", "remaining_time": "3 days, 12:44:49", "throughput": 2724.39, "total_tokens": 817106304} {"current_steps": 4529, "total_steps": 9134, "loss": 0.7375, "learning_rate": 2.5326738345887462e-05, "epoch": 0.495799009277758, "percentage": 49.58, "elapsed_time": "3 days, 11:19:51", "remaining_time": "3 days, 12:43:45", "throughput": 2724.4, "total_tokens": 817296256} {"current_steps": 4530, "total_steps": 9134, "loss": 0.7674, "learning_rate": 2.531814043881155e-05, "epoch": 0.4959084813486959, "percentage": 49.59, "elapsed_time": "3 days, 11:21:00", "remaining_time": "3 days, 12:42:41", "throughput": 2724.47, "total_tokens": 817505024} {"current_steps": 4531, "total_steps": 9134, "loss": 0.5189, "learning_rate": 2.5309542494100234e-05, "epoch": 0.49601795341963384, "percentage": 49.61, "elapsed_time": "3 days, 11:22:06", "remaining_time": "3 days, 12:41:36", "throughput": 2724.52, "total_tokens": 817702144} {"current_steps": 4532, "total_steps": 9134, "loss": 0.9222, "learning_rate": 2.5300944512770636e-05, "epoch": 0.4961274254905717, "percentage": 49.62, "elapsed_time": "3 days, 11:23:12", "remaining_time": "3 days, 12:40:29", "throughput": 2724.54, "total_tokens": 817887168} {"current_steps": 4533, "total_steps": 9134, "loss": 0.7377, "learning_rate": 2.529234649583988e-05, "epoch": 0.4962368975615096, "percentage": 49.63, "elapsed_time": "3 days, 11:24:19", "remaining_time": "3 days, 12:39:23", "throughput": 2724.52, "total_tokens": 818062784} {"current_steps": 4534, "total_steps": 9134, "loss": 0.8108, "learning_rate": 2.528374844432509e-05, "epoch": 0.49634636963244755, "percentage": 49.64, "elapsed_time": "3 days, 11:25:27", "remaining_time": "3 days, 12:38:19", "throughput": 2724.49, "total_tokens": 818240864} {"current_steps": 4535, "total_steps": 9134, "loss": 0.6954, "learning_rate": 2.5275150359243405e-05, "epoch": 0.4964558417033854, "percentage": 49.65, "elapsed_time": "3 days, 11:26:33", "remaining_time": "3 days, 12:37:13", "throughput": 2724.52, "total_tokens": 818429696} {"current_steps": 4536, "total_steps": 9134, "loss": 0.7044, "learning_rate": 2.526655224161196e-05, "epoch": 0.49656531377432334, "percentage": 49.66, "elapsed_time": "3 days, 11:27:41", "remaining_time": "3 days, 12:36:07", "throughput": 2724.56, "total_tokens": 818623232} {"current_steps": 4537, "total_steps": 9134, "loss": 0.7814, "learning_rate": 2.5257954092447878e-05, "epoch": 0.4966747858452612, "percentage": 49.67, "elapsed_time": "3 days, 11:28:44", "remaining_time": "3 days, 12:34:58", "throughput": 2724.57, "total_tokens": 818797504} {"current_steps": 4538, "total_steps": 9134, "loss": 0.7245, "learning_rate": 2.5249355912768334e-05, "epoch": 0.4967842579161991, "percentage": 49.68, "elapsed_time": "3 days, 11:29:47", "remaining_time": "3 days, 12:33:49", "throughput": 2724.57, "total_tokens": 818972224} {"current_steps": 4539, "total_steps": 9134, "loss": 0.6803, "learning_rate": 2.5240757703590462e-05, "epoch": 0.49689372998713704, "percentage": 49.69, "elapsed_time": "3 days, 11:30:54", "remaining_time": "3 days, 12:32:43", "throughput": 2724.61, "total_tokens": 819165536} {"current_steps": 4540, "total_steps": 9134, "loss": 0.9152, "learning_rate": 2.523215946593141e-05, "epoch": 0.4970032020580749, "percentage": 49.7, "elapsed_time": "3 days, 11:32:03", "remaining_time": "3 days, 12:31:40", "throughput": 2724.6, "total_tokens": 819351680} {"current_steps": 4541, "total_steps": 9134, "loss": 0.5306, "learning_rate": 2.5223561200808334e-05, "epoch": 0.49711267412901283, "percentage": 49.72, "elapsed_time": "3 days, 11:33:11", "remaining_time": "3 days, 12:30:35", "throughput": 2724.54, "total_tokens": 819517888} {"current_steps": 4542, "total_steps": 9134, "loss": 0.593, "learning_rate": 2.5214962909238397e-05, "epoch": 0.49722214619995075, "percentage": 49.73, "elapsed_time": "3 days, 11:34:20", "remaining_time": "3 days, 12:29:32", "throughput": 2724.55, "total_tokens": 819709856} {"current_steps": 4543, "total_steps": 9134, "loss": 0.857, "learning_rate": 2.5206364592238767e-05, "epoch": 0.4973316182708886, "percentage": 49.74, "elapsed_time": "3 days, 11:35:28", "remaining_time": "3 days, 12:28:27", "throughput": 2724.53, "total_tokens": 819889728} {"current_steps": 4544, "total_steps": 9134, "loss": 0.8211, "learning_rate": 2.5197766250826586e-05, "epoch": 0.49744109034182654, "percentage": 49.75, "elapsed_time": "3 days, 11:36:37", "remaining_time": "3 days, 12:27:24", "throughput": 2724.48, "total_tokens": 820062208} {"current_steps": 4545, "total_steps": 9134, "loss": 0.6393, "learning_rate": 2.518916788601905e-05, "epoch": 0.49755056241276446, "percentage": 49.76, "elapsed_time": "3 days, 11:37:45", "remaining_time": "3 days, 12:26:19", "throughput": 2724.53, "total_tokens": 820259328} {"current_steps": 4546, "total_steps": 9134, "loss": 0.7956, "learning_rate": 2.5180569498833308e-05, "epoch": 0.49766003448370233, "percentage": 49.77, "elapsed_time": "3 days, 11:38:48", "remaining_time": "3 days, 12:25:10", "throughput": 2724.5, "total_tokens": 820425312} {"current_steps": 4547, "total_steps": 9134, "loss": 0.6533, "learning_rate": 2.5171971090286546e-05, "epoch": 0.49776950655464025, "percentage": 49.78, "elapsed_time": "3 days, 11:39:51", "remaining_time": "3 days, 12:24:01", "throughput": 2724.42, "total_tokens": 820572704} {"current_steps": 4548, "total_steps": 9134, "loss": 0.6965, "learning_rate": 2.5163372661395923e-05, "epoch": 0.4978789786255782, "percentage": 49.79, "elapsed_time": "3 days, 11:40:58", "remaining_time": "3 days, 12:22:55", "throughput": 2724.41, "total_tokens": 820751680} {"current_steps": 4549, "total_steps": 9134, "loss": 0.7379, "learning_rate": 2.5154774213178634e-05, "epoch": 0.49798845069651604, "percentage": 49.8, "elapsed_time": "3 days, 11:42:07", "remaining_time": "3 days, 12:21:51", "throughput": 2724.48, "total_tokens": 820959776} {"current_steps": 4550, "total_steps": 9134, "loss": 0.9381, "learning_rate": 2.5146175746651847e-05, "epoch": 0.49809792276745396, "percentage": 49.81, "elapsed_time": "3 days, 11:43:15", "remaining_time": "3 days, 12:20:48", "throughput": 2724.53, "total_tokens": 821163168} {"current_steps": 4551, "total_steps": 9134, "loss": 0.7848, "learning_rate": 2.5137577262832746e-05, "epoch": 0.4982073948383919, "percentage": 49.82, "elapsed_time": "3 days, 11:44:23", "remaining_time": "3 days, 12:19:42", "throughput": 2724.56, "total_tokens": 821354912} {"current_steps": 4552, "total_steps": 9134, "loss": 0.6358, "learning_rate": 2.512897876273852e-05, "epoch": 0.49831686690932975, "percentage": 49.84, "elapsed_time": "3 days, 11:45:31", "remaining_time": "3 days, 12:18:38", "throughput": 2724.58, "total_tokens": 821543968} {"current_steps": 4553, "total_steps": 9134, "loss": 0.6543, "learning_rate": 2.5120380247386356e-05, "epoch": 0.49842633898026767, "percentage": 49.85, "elapsed_time": "3 days, 11:46:34", "remaining_time": "3 days, 12:17:29", "throughput": 2724.56, "total_tokens": 821714208} {"current_steps": 4554, "total_steps": 9134, "loss": 0.9203, "learning_rate": 2.5111781717793436e-05, "epoch": 0.49853581105120554, "percentage": 49.86, "elapsed_time": "3 days, 11:47:43", "remaining_time": "3 days, 12:16:25", "throughput": 2724.57, "total_tokens": 821902816} {"current_steps": 4555, "total_steps": 9134, "loss": 0.7813, "learning_rate": 2.5103183174976953e-05, "epoch": 0.49864528312214346, "percentage": 49.87, "elapsed_time": "3 days, 11:48:49", "remaining_time": "3 days, 12:15:19", "throughput": 2724.54, "total_tokens": 822076416} {"current_steps": 4556, "total_steps": 9134, "loss": 0.6934, "learning_rate": 2.5094584619954105e-05, "epoch": 0.4987547551930814, "percentage": 49.88, "elapsed_time": "3 days, 11:49:54", "remaining_time": "3 days, 12:14:11", "throughput": 2724.56, "total_tokens": 822256288} {"current_steps": 4557, "total_steps": 9134, "loss": 0.7223, "learning_rate": 2.508598605374206e-05, "epoch": 0.49886422726401924, "percentage": 49.89, "elapsed_time": "3 days, 11:51:03", "remaining_time": "3 days, 12:13:08", "throughput": 2724.61, "total_tokens": 822462368} {"current_steps": 4558, "total_steps": 9134, "loss": 0.7381, "learning_rate": 2.5077387477358044e-05, "epoch": 0.49897369933495717, "percentage": 49.9, "elapsed_time": "3 days, 11:52:09", "remaining_time": "3 days, 12:12:02", "throughput": 2724.59, "total_tokens": 822635296} {"current_steps": 4559, "total_steps": 9134, "loss": 0.8709, "learning_rate": 2.5068788891819235e-05, "epoch": 0.4990831714058951, "percentage": 49.91, "elapsed_time": "3 days, 11:53:19", "remaining_time": "3 days, 12:10:59", "throughput": 2724.55, "total_tokens": 822812032} {"current_steps": 4560, "total_steps": 9134, "loss": 0.7359, "learning_rate": 2.5060190298142828e-05, "epoch": 0.49919264347683295, "percentage": 49.92, "elapsed_time": "3 days, 11:54:24", "remaining_time": "3 days, 12:09:51", "throughput": 2724.54, "total_tokens": 822985632} {"current_steps": 4561, "total_steps": 9134, "loss": 0.5459, "learning_rate": 2.5051591697346028e-05, "epoch": 0.4993021155477709, "percentage": 49.93, "elapsed_time": "3 days, 11:55:30", "remaining_time": "3 days, 12:08:45", "throughput": 2724.54, "total_tokens": 823168192} {"current_steps": 4562, "total_steps": 9134, "loss": 0.5383, "learning_rate": 2.504299309044602e-05, "epoch": 0.4994115876187088, "percentage": 49.95, "elapsed_time": "3 days, 11:56:36", "remaining_time": "3 days, 12:07:38", "throughput": 2724.49, "total_tokens": 823329472} {"current_steps": 4563, "total_steps": 9134, "loss": 0.6406, "learning_rate": 2.503439447846002e-05, "epoch": 0.49952105968964666, "percentage": 49.96, "elapsed_time": "3 days, 11:57:42", "remaining_time": "3 days, 12:06:32", "throughput": 2724.51, "total_tokens": 823516736} {"current_steps": 4564, "total_steps": 9134, "loss": 0.6389, "learning_rate": 2.5025795862405216e-05, "epoch": 0.4996305317605846, "percentage": 49.97, "elapsed_time": "3 days, 11:58:47", "remaining_time": "3 days, 12:05:25", "throughput": 2724.52, "total_tokens": 823698624} {"current_steps": 4565, "total_steps": 9134, "loss": 0.7223, "learning_rate": 2.5017197243298813e-05, "epoch": 0.4997400038315225, "percentage": 49.98, "elapsed_time": "3 days, 11:59:55", "remaining_time": "3 days, 12:04:20", "throughput": 2724.53, "total_tokens": 823886560} {"current_steps": 4566, "total_steps": 9134, "loss": 0.6084, "learning_rate": 2.500859862215801e-05, "epoch": 0.49984947590246037, "percentage": 49.99, "elapsed_time": "3 days, 12:01:02", "remaining_time": "3 days, 12:03:15", "throughput": 2724.47, "total_tokens": 824049408} {"current_steps": 4567, "total_steps": 9134, "loss": 0.7948, "learning_rate": 2.5e-05, "epoch": 0.4999589479733983, "percentage": 50.0, "elapsed_time": "3 days, 12:02:07", "remaining_time": "3 days, 12:02:07", "throughput": 2724.46, "total_tokens": 824223904} {"current_steps": 4568, "total_steps": 9134, "loss": 0.7047, "learning_rate": 2.4991401377841993e-05, "epoch": 0.5000684200443362, "percentage": 50.01, "elapsed_time": "3 days, 12:03:09", "remaining_time": "3 days, 12:00:57", "throughput": 2724.44, "total_tokens": 824387872} {"current_steps": 4569, "total_steps": 9134, "loss": 0.7034, "learning_rate": 2.4982802756701193e-05, "epoch": 0.5001778921152741, "percentage": 50.02, "elapsed_time": "3 days, 12:04:19", "remaining_time": "3 days, 11:59:54", "throughput": 2724.46, "total_tokens": 824582080} {"current_steps": 4570, "total_steps": 9134, "loss": 0.5718, "learning_rate": 2.4974204137594786e-05, "epoch": 0.500287364186212, "percentage": 50.03, "elapsed_time": "3 days, 12:05:21", "remaining_time": "3 days, 11:58:44", "throughput": 2724.42, "total_tokens": 824740672} {"current_steps": 4571, "total_steps": 9134, "loss": 0.6985, "learning_rate": 2.4965605521539982e-05, "epoch": 0.5003968362571499, "percentage": 50.04, "elapsed_time": "3 days, 12:06:30", "remaining_time": "3 days, 11:57:40", "throughput": 2724.44, "total_tokens": 824934880} {"current_steps": 4572, "total_steps": 9134, "loss": 0.7332, "learning_rate": 2.4957006909553982e-05, "epoch": 0.5005063083280878, "percentage": 50.05, "elapsed_time": "3 days, 12:07:40", "remaining_time": "3 days, 11:56:37", "throughput": 2724.52, "total_tokens": 825149696} {"current_steps": 4573, "total_steps": 9134, "loss": 0.7051, "learning_rate": 2.4948408302653985e-05, "epoch": 0.5006157803990257, "percentage": 50.07, "elapsed_time": "3 days, 12:08:43", "remaining_time": "3 days, 11:55:28", "throughput": 2724.45, "total_tokens": 825298208} {"current_steps": 4574, "total_steps": 9134, "loss": 0.8565, "learning_rate": 2.4939809701857174e-05, "epoch": 0.5007252524699636, "percentage": 50.08, "elapsed_time": "3 days, 12:09:49", "remaining_time": "3 days, 11:54:21", "throughput": 2724.43, "total_tokens": 825473824} {"current_steps": 4575, "total_steps": 9134, "loss": 0.8587, "learning_rate": 2.4931211108180767e-05, "epoch": 0.5008347245409015, "percentage": 50.09, "elapsed_time": "3 days, 12:10:56", "remaining_time": "3 days, 11:53:16", "throughput": 2724.44, "total_tokens": 825658176} {"current_steps": 4576, "total_steps": 9134, "loss": 0.739, "learning_rate": 2.492261252264196e-05, "epoch": 0.5009441966118394, "percentage": 50.1, "elapsed_time": "3 days, 12:12:03", "remaining_time": "3 days, 11:52:11", "throughput": 2724.48, "total_tokens": 825855072} {"current_steps": 4577, "total_steps": 9134, "loss": 1.0133, "learning_rate": 2.491401394625794e-05, "epoch": 0.5010536686827773, "percentage": 50.11, "elapsed_time": "3 days, 12:13:13", "remaining_time": "3 days, 11:51:08", "throughput": 2724.5, "total_tokens": 826050400} {"current_steps": 4578, "total_steps": 9134, "loss": 0.5579, "learning_rate": 2.490541538004591e-05, "epoch": 0.5011631407537153, "percentage": 50.12, "elapsed_time": "3 days, 12:14:18", "remaining_time": "3 days, 11:50:01", "throughput": 2724.47, "total_tokens": 826219744} {"current_steps": 4579, "total_steps": 9134, "loss": 0.6077, "learning_rate": 2.489681682502305e-05, "epoch": 0.5012726128246531, "percentage": 50.13, "elapsed_time": "3 days, 12:15:28", "remaining_time": "3 days, 11:48:58", "throughput": 2724.51, "total_tokens": 826419104} {"current_steps": 4580, "total_steps": 9134, "loss": 0.6397, "learning_rate": 2.4888218282206573e-05, "epoch": 0.501382084895591, "percentage": 50.14, "elapsed_time": "3 days, 12:16:30", "remaining_time": "3 days, 11:47:48", "throughput": 2724.44, "total_tokens": 826569408} {"current_steps": 4581, "total_steps": 9134, "loss": 0.6157, "learning_rate": 2.4879619752613653e-05, "epoch": 0.5014915569665289, "percentage": 50.15, "elapsed_time": "3 days, 12:17:37", "remaining_time": "3 days, 11:46:42", "throughput": 2724.43, "total_tokens": 826747936} {"current_steps": 4582, "total_steps": 9134, "loss": 0.7546, "learning_rate": 2.487102123726148e-05, "epoch": 0.5016010290374668, "percentage": 50.16, "elapsed_time": "3 days, 12:18:43", "remaining_time": "3 days, 11:45:36", "throughput": 2724.43, "total_tokens": 826927584} {"current_steps": 4583, "total_steps": 9134, "loss": 0.7435, "learning_rate": 2.486242273716726e-05, "epoch": 0.5017105011084048, "percentage": 50.18, "elapsed_time": "3 days, 12:19:50", "remaining_time": "3 days, 11:44:30", "throughput": 2724.44, "total_tokens": 827114176} {"current_steps": 4584, "total_steps": 9134, "loss": 0.742, "learning_rate": 2.4853824253348162e-05, "epoch": 0.5018199731793426, "percentage": 50.19, "elapsed_time": "3 days, 12:20:55", "remaining_time": "3 days, 11:43:23", "throughput": 2724.39, "total_tokens": 827277920} {"current_steps": 4585, "total_steps": 9134, "loss": 0.8854, "learning_rate": 2.484522578682138e-05, "epoch": 0.5019294452502805, "percentage": 50.2, "elapsed_time": "3 days, 12:22:05", "remaining_time": "3 days, 11:42:21", "throughput": 2724.45, "total_tokens": 827485792} {"current_steps": 4586, "total_steps": 9134, "loss": 0.7862, "learning_rate": 2.4836627338604083e-05, "epoch": 0.5020389173212184, "percentage": 50.21, "elapsed_time": "3 days, 12:23:11", "remaining_time": "3 days, 11:41:14", "throughput": 2724.46, "total_tokens": 827667008} {"current_steps": 4587, "total_steps": 9134, "loss": 0.7606, "learning_rate": 2.482802890971347e-05, "epoch": 0.5021483893921563, "percentage": 50.22, "elapsed_time": "3 days, 12:24:16", "remaining_time": "3 days, 11:40:07", "throughput": 2724.46, "total_tokens": 827844192} {"current_steps": 4588, "total_steps": 9134, "loss": 0.7711, "learning_rate": 2.4819430501166695e-05, "epoch": 0.5022578614630943, "percentage": 50.23, "elapsed_time": "3 days, 12:25:25", "remaining_time": "3 days, 11:39:02", "throughput": 2724.42, "total_tokens": 828021376} {"current_steps": 4589, "total_steps": 9134, "loss": 0.5647, "learning_rate": 2.4810832113980952e-05, "epoch": 0.5023673335340322, "percentage": 50.24, "elapsed_time": "3 days, 12:26:32", "remaining_time": "3 days, 11:37:57", "throughput": 2724.51, "total_tokens": 828230368} {"current_steps": 4590, "total_steps": 9134, "loss": 0.815, "learning_rate": 2.4802233749173416e-05, "epoch": 0.50247680560497, "percentage": 50.25, "elapsed_time": "3 days, 12:27:36", "remaining_time": "3 days, 11:36:49", "throughput": 2724.52, "total_tokens": 828409344} {"current_steps": 4591, "total_steps": 9134, "loss": 0.7442, "learning_rate": 2.479363540776124e-05, "epoch": 0.5025862776759079, "percentage": 50.26, "elapsed_time": "3 days, 12:28:45", "remaining_time": "3 days, 11:35:45", "throughput": 2724.52, "total_tokens": 828594816} {"current_steps": 4592, "total_steps": 9134, "loss": 0.8391, "learning_rate": 2.4785037090761605e-05, "epoch": 0.5026957497468458, "percentage": 50.27, "elapsed_time": "3 days, 12:29:48", "remaining_time": "3 days, 11:34:36", "throughput": 2724.49, "total_tokens": 828758112} {"current_steps": 4593, "total_steps": 9134, "loss": 0.8676, "learning_rate": 2.477643879919167e-05, "epoch": 0.5028052218177838, "percentage": 50.28, "elapsed_time": "3 days, 12:30:58", "remaining_time": "3 days, 11:33:33", "throughput": 2724.52, "total_tokens": 828955904} {"current_steps": 4594, "total_steps": 9134, "loss": 0.7869, "learning_rate": 2.47678405340686e-05, "epoch": 0.5029146938887217, "percentage": 50.3, "elapsed_time": "3 days, 12:32:04", "remaining_time": "3 days, 11:32:27", "throughput": 2724.51, "total_tokens": 829134656} {"current_steps": 4595, "total_steps": 9134, "loss": 0.5883, "learning_rate": 2.4759242296409547e-05, "epoch": 0.5030241659596596, "percentage": 50.31, "elapsed_time": "3 days, 12:33:12", "remaining_time": "3 days, 11:31:22", "throughput": 2724.46, "total_tokens": 829305568} {"current_steps": 4596, "total_steps": 9134, "loss": 0.9888, "learning_rate": 2.4750644087231668e-05, "epoch": 0.5031336380305974, "percentage": 50.32, "elapsed_time": "3 days, 12:34:21", "remaining_time": "3 days, 11:30:18", "throughput": 2724.48, "total_tokens": 829496864} {"current_steps": 4597, "total_steps": 9134, "loss": 0.9745, "learning_rate": 2.4742045907552124e-05, "epoch": 0.5032431101015353, "percentage": 50.33, "elapsed_time": "3 days, 12:35:29", "remaining_time": "3 days, 11:29:15", "throughput": 2724.42, "total_tokens": 829668448} {"current_steps": 4598, "total_steps": 9134, "loss": 0.8008, "learning_rate": 2.473344775838805e-05, "epoch": 0.5033525821724733, "percentage": 50.34, "elapsed_time": "3 days, 12:36:37", "remaining_time": "3 days, 11:28:10", "throughput": 2724.39, "total_tokens": 829842496} {"current_steps": 4599, "total_steps": 9134, "loss": 0.6628, "learning_rate": 2.4724849640756608e-05, "epoch": 0.5034620542434112, "percentage": 50.35, "elapsed_time": "3 days, 12:37:42", "remaining_time": "3 days, 11:27:02", "throughput": 2724.4, "total_tokens": 830023264} {"current_steps": 4600, "total_steps": 9134, "loss": 0.6408, "learning_rate": 2.4716251555674913e-05, "epoch": 0.5035715263143491, "percentage": 50.36, "elapsed_time": "3 days, 12:38:44", "remaining_time": "3 days, 11:25:52", "throughput": 2724.31, "total_tokens": 830164384} {"current_steps": 4601, "total_steps": 9134, "loss": 0.8331, "learning_rate": 2.4707653504160118e-05, "epoch": 0.5036809983852869, "percentage": 50.37, "elapsed_time": "3 days, 12:39:54", "remaining_time": "3 days, 11:24:49", "throughput": 2724.37, "total_tokens": 830370912} {"current_steps": 4602, "total_steps": 9134, "loss": 0.454, "learning_rate": 2.4699055487229366e-05, "epoch": 0.5037904704562248, "percentage": 50.38, "elapsed_time": "3 days, 12:41:02", "remaining_time": "3 days, 11:23:45", "throughput": 2724.36, "total_tokens": 830553472} {"current_steps": 4603, "total_steps": 9134, "loss": 0.6247, "learning_rate": 2.4690457505899765e-05, "epoch": 0.5038999425271627, "percentage": 50.39, "elapsed_time": "3 days, 12:42:08", "remaining_time": "3 days, 11:22:38", "throughput": 2724.35, "total_tokens": 830729312} {"current_steps": 4604, "total_steps": 9134, "loss": 0.6947, "learning_rate": 2.468185956118845e-05, "epoch": 0.5040094145981007, "percentage": 50.41, "elapsed_time": "3 days, 12:43:17", "remaining_time": "3 days, 11:21:35", "throughput": 2724.32, "total_tokens": 830910528} {"current_steps": 4605, "total_steps": 9134, "loss": 0.7686, "learning_rate": 2.4673261654112543e-05, "epoch": 0.5041188866690386, "percentage": 50.42, "elapsed_time": "3 days, 12:44:19", "remaining_time": "3 days, 11:20:25", "throughput": 2724.31, "total_tokens": 831076512} {"current_steps": 4606, "total_steps": 9134, "loss": 0.673, "learning_rate": 2.466466378568916e-05, "epoch": 0.5042283587399765, "percentage": 50.43, "elapsed_time": "3 days, 12:45:29", "remaining_time": "3 days, 11:19:21", "throughput": 2724.34, "total_tokens": 831275200} {"current_steps": 4607, "total_steps": 9134, "loss": 0.8783, "learning_rate": 2.4656065956935408e-05, "epoch": 0.5043378308109143, "percentage": 50.44, "elapsed_time": "3 days, 12:46:31", "remaining_time": "3 days, 11:18:11", "throughput": 2724.27, "total_tokens": 831425504} {"current_steps": 4608, "total_steps": 9134, "loss": 0.8276, "learning_rate": 2.464746816886839e-05, "epoch": 0.5044473028818522, "percentage": 50.45, "elapsed_time": "3 days, 12:47:39", "remaining_time": "3 days, 11:17:07", "throughput": 2724.32, "total_tokens": 831625088} {"current_steps": 4609, "total_steps": 9134, "loss": 0.8796, "learning_rate": 2.4638870422505225e-05, "epoch": 0.5045567749527902, "percentage": 50.46, "elapsed_time": "3 days, 12:48:49", "remaining_time": "3 days, 11:16:04", "throughput": 2724.28, "total_tokens": 831803840} {"current_steps": 4610, "total_steps": 9134, "loss": 0.8266, "learning_rate": 2.4630272718862992e-05, "epoch": 0.5046662470237281, "percentage": 50.47, "elapsed_time": "3 days, 12:49:54", "remaining_time": "3 days, 11:14:57", "throughput": 2724.29, "total_tokens": 831984832} {"current_steps": 4611, "total_steps": 9134, "loss": 0.7756, "learning_rate": 2.4621675058958792e-05, "epoch": 0.504775719094666, "percentage": 50.48, "elapsed_time": "3 days, 12:51:03", "remaining_time": "3 days, 11:13:53", "throughput": 2724.33, "total_tokens": 832184192} {"current_steps": 4612, "total_steps": 9134, "loss": 0.6661, "learning_rate": 2.4613077443809706e-05, "epoch": 0.5048851911656039, "percentage": 50.49, "elapsed_time": "3 days, 12:52:09", "remaining_time": "3 days, 11:12:46", "throughput": 2724.23, "total_tokens": 832330464} {"current_steps": 4613, "total_steps": 9134, "loss": 0.7282, "learning_rate": 2.460447987443282e-05, "epoch": 0.5049946632365417, "percentage": 50.5, "elapsed_time": "3 days, 12:53:19", "remaining_time": "3 days, 11:11:44", "throughput": 2724.18, "total_tokens": 832506528} {"current_steps": 4614, "total_steps": 9134, "loss": 0.8362, "learning_rate": 2.459588235184521e-05, "epoch": 0.5051041353074797, "percentage": 50.51, "elapsed_time": "3 days, 12:54:24", "remaining_time": "3 days, 11:10:37", "throughput": 2724.2, "total_tokens": 832690432} {"current_steps": 4615, "total_steps": 9134, "loss": 0.7608, "learning_rate": 2.4587284877063942e-05, "epoch": 0.5052136073784176, "percentage": 50.53, "elapsed_time": "3 days, 12:55:28", "remaining_time": "3 days, 11:09:28", "throughput": 2724.19, "total_tokens": 832862688} {"current_steps": 4616, "total_steps": 9134, "loss": 0.8531, "learning_rate": 2.4578687451106085e-05, "epoch": 0.5053230794493555, "percentage": 50.54, "elapsed_time": "3 days, 12:56:33", "remaining_time": "3 days, 11:08:21", "throughput": 2724.18, "total_tokens": 833037632} {"current_steps": 4617, "total_steps": 9134, "loss": 0.8333, "learning_rate": 2.4570090074988697e-05, "epoch": 0.5054325515202934, "percentage": 50.55, "elapsed_time": "3 days, 12:57:36", "remaining_time": "3 days, 11:07:12", "throughput": 2724.12, "total_tokens": 833191072} {"current_steps": 4618, "total_steps": 9134, "loss": 0.7134, "learning_rate": 2.456149274972884e-05, "epoch": 0.5055420235912312, "percentage": 50.56, "elapsed_time": "3 days, 12:58:41", "remaining_time": "3 days, 11:06:04", "throughput": 2724.1, "total_tokens": 833361312} {"current_steps": 4619, "total_steps": 9134, "loss": 0.7392, "learning_rate": 2.455289547634354e-05, "epoch": 0.5056514956621692, "percentage": 50.57, "elapsed_time": "3 days, 12:59:45", "remaining_time": "3 days, 11:04:56", "throughput": 2724.1, "total_tokens": 833536704} {"current_steps": 4620, "total_steps": 9134, "loss": 0.8226, "learning_rate": 2.4544298255849862e-05, "epoch": 0.5057609677331071, "percentage": 50.58, "elapsed_time": "3 days, 13:00:54", "remaining_time": "3 days, 11:03:52", "throughput": 2724.12, "total_tokens": 833730240} {"current_steps": 4621, "total_steps": 9134, "loss": 0.7372, "learning_rate": 2.453570108926482e-05, "epoch": 0.505870439804045, "percentage": 50.59, "elapsed_time": "3 days, 13:02:00", "remaining_time": "3 days, 11:02:46", "throughput": 2724.11, "total_tokens": 833907424} {"current_steps": 4622, "total_steps": 9134, "loss": 0.8083, "learning_rate": 2.4527103977605447e-05, "epoch": 0.5059799118749829, "percentage": 50.6, "elapsed_time": "3 days, 13:03:08", "remaining_time": "3 days, 11:01:41", "throughput": 2724.18, "total_tokens": 834112160} {"current_steps": 4623, "total_steps": 9134, "loss": 0.6943, "learning_rate": 2.4518506921888788e-05, "epoch": 0.5060893839459208, "percentage": 50.61, "elapsed_time": "3 days, 13:04:13", "remaining_time": "3 days, 11:00:33", "throughput": 2724.17, "total_tokens": 834284640} {"current_steps": 4624, "total_steps": 9134, "loss": 0.8215, "learning_rate": 2.4509909923131822e-05, "epoch": 0.5061988560168587, "percentage": 50.62, "elapsed_time": "3 days, 13:05:20", "remaining_time": "3 days, 10:59:28", "throughput": 2724.14, "total_tokens": 834460256} {"current_steps": 4625, "total_steps": 9134, "loss": 0.7743, "learning_rate": 2.450131298235158e-05, "epoch": 0.5063083280877966, "percentage": 50.63, "elapsed_time": "3 days, 13:06:29", "remaining_time": "3 days, 10:58:24", "throughput": 2724.2, "total_tokens": 834666560} {"current_steps": 4626, "total_steps": 9134, "loss": 0.6635, "learning_rate": 2.449271610056506e-05, "epoch": 0.5064178001587345, "percentage": 50.65, "elapsed_time": "3 days, 13:07:36", "remaining_time": "3 days, 10:57:19", "throughput": 2724.17, "total_tokens": 834838144} {"current_steps": 4627, "total_steps": 9134, "loss": 0.8605, "learning_rate": 2.448411927878926e-05, "epoch": 0.5065272722296724, "percentage": 50.66, "elapsed_time": "3 days, 13:08:43", "remaining_time": "3 days, 10:56:13", "throughput": 2724.19, "total_tokens": 835026752} {"current_steps": 4628, "total_steps": 9134, "loss": 0.8306, "learning_rate": 2.447552251804116e-05, "epoch": 0.5066367443006103, "percentage": 50.67, "elapsed_time": "3 days, 13:09:51", "remaining_time": "3 days, 10:55:08", "throughput": 2724.18, "total_tokens": 835210656} {"current_steps": 4629, "total_steps": 9134, "loss": 0.7278, "learning_rate": 2.4466925819337734e-05, "epoch": 0.5067462163715483, "percentage": 50.68, "elapsed_time": "3 days, 13:10:57", "remaining_time": "3 days, 10:54:02", "throughput": 2724.21, "total_tokens": 835398368} {"current_steps": 4630, "total_steps": 9134, "loss": 0.5558, "learning_rate": 2.4458329183695983e-05, "epoch": 0.5068556884424861, "percentage": 50.69, "elapsed_time": "3 days, 13:12:04", "remaining_time": "3 days, 10:52:57", "throughput": 2724.19, "total_tokens": 835576448} {"current_steps": 4631, "total_steps": 9134, "loss": 0.8294, "learning_rate": 2.444973261213284e-05, "epoch": 0.506965160513424, "percentage": 50.7, "elapsed_time": "3 days, 13:13:12", "remaining_time": "3 days, 10:51:52", "throughput": 2724.22, "total_tokens": 835769312} {"current_steps": 4632, "total_steps": 9134, "loss": 0.6983, "learning_rate": 2.4441136105665284e-05, "epoch": 0.5070746325843619, "percentage": 50.71, "elapsed_time": "3 days, 13:14:20", "remaining_time": "3 days, 10:50:48", "throughput": 2724.19, "total_tokens": 835947168} {"current_steps": 4633, "total_steps": 9134, "loss": 0.8351, "learning_rate": 2.4432539665310252e-05, "epoch": 0.5071841046552998, "percentage": 50.72, "elapsed_time": "3 days, 13:15:27", "remaining_time": "3 days, 10:49:42", "throughput": 2724.19, "total_tokens": 836126816} {"current_steps": 4634, "total_steps": 9134, "loss": 0.6348, "learning_rate": 2.44239432920847e-05, "epoch": 0.5072935767262378, "percentage": 50.73, "elapsed_time": "3 days, 13:16:31", "remaining_time": "3 days, 10:48:34", "throughput": 2724.17, "total_tokens": 836296608} {"current_steps": 4635, "total_steps": 9134, "loss": 0.947, "learning_rate": 2.441534698700555e-05, "epoch": 0.5074030487971756, "percentage": 50.74, "elapsed_time": "3 days, 13:17:38", "remaining_time": "3 days, 10:47:29", "throughput": 2724.21, "total_tokens": 836493280} {"current_steps": 4636, "total_steps": 9134, "loss": 0.6459, "learning_rate": 2.4406750751089737e-05, "epoch": 0.5075125208681135, "percentage": 50.76, "elapsed_time": "3 days, 13:18:43", "remaining_time": "3 days, 10:46:20", "throughput": 2724.17, "total_tokens": 836655456} {"current_steps": 4637, "total_steps": 9134, "loss": 0.8388, "learning_rate": 2.4398154585354174e-05, "epoch": 0.5076219929390514, "percentage": 50.77, "elapsed_time": "3 days, 13:19:44", "remaining_time": "3 days, 10:45:10", "throughput": 2724.15, "total_tokens": 836819200} {"current_steps": 4638, "total_steps": 9134, "loss": 0.8457, "learning_rate": 2.438955849081577e-05, "epoch": 0.5077314650099893, "percentage": 50.78, "elapsed_time": "3 days, 13:20:48", "remaining_time": "3 days, 10:44:01", "throughput": 2724.1, "total_tokens": 836976000} {"current_steps": 4639, "total_steps": 9134, "loss": 0.6062, "learning_rate": 2.4380962468491438e-05, "epoch": 0.5078409370809273, "percentage": 50.79, "elapsed_time": "3 days, 13:21:57", "remaining_time": "3 days, 10:42:58", "throughput": 2724.11, "total_tokens": 837168192} {"current_steps": 4640, "total_steps": 9134, "loss": 0.8231, "learning_rate": 2.4372366519398053e-05, "epoch": 0.5079504091518652, "percentage": 50.8, "elapsed_time": "3 days, 13:23:06", "remaining_time": "3 days, 10:41:54", "throughput": 2724.19, "total_tokens": 837378976} {"current_steps": 4641, "total_steps": 9134, "loss": 0.7786, "learning_rate": 2.4363770644552523e-05, "epoch": 0.508059881222803, "percentage": 50.81, "elapsed_time": "3 days, 13:24:10", "remaining_time": "3 days, 10:40:45", "throughput": 2724.19, "total_tokens": 837553920} {"current_steps": 4642, "total_steps": 9134, "loss": 0.6899, "learning_rate": 2.4355174844971695e-05, "epoch": 0.5081693532937409, "percentage": 50.82, "elapsed_time": "3 days, 13:25:19", "remaining_time": "3 days, 10:39:42", "throughput": 2724.24, "total_tokens": 837756192} {"current_steps": 4643, "total_steps": 9134, "loss": 0.7296, "learning_rate": 2.434657912167245e-05, "epoch": 0.5082788253646788, "percentage": 50.83, "elapsed_time": "3 days, 13:26:25", "remaining_time": "3 days, 10:38:35", "throughput": 2724.16, "total_tokens": 837910304} {"current_steps": 4644, "total_steps": 9134, "loss": 0.6771, "learning_rate": 2.4337983475671657e-05, "epoch": 0.5083882974356168, "percentage": 50.84, "elapsed_time": "3 days, 13:27:30", "remaining_time": "3 days, 10:37:28", "throughput": 2724.09, "total_tokens": 838068896} {"current_steps": 4645, "total_steps": 9134, "loss": 0.6447, "learning_rate": 2.4329387907986145e-05, "epoch": 0.5084977695065547, "percentage": 50.85, "elapsed_time": "3 days, 13:28:39", "remaining_time": "3 days, 10:36:25", "throughput": 2724.11, "total_tokens": 838261536} {"current_steps": 4646, "total_steps": 9134, "loss": 0.5491, "learning_rate": 2.4320792419632764e-05, "epoch": 0.5086072415774926, "percentage": 50.86, "elapsed_time": "3 days, 13:29:45", "remaining_time": "3 days, 10:35:18", "throughput": 2724.14, "total_tokens": 838451040} {"current_steps": 4647, "total_steps": 9134, "loss": 0.762, "learning_rate": 2.431219701162834e-05, "epoch": 0.5087167136484304, "percentage": 50.88, "elapsed_time": "3 days, 13:30:49", "remaining_time": "3 days, 10:34:09", "throughput": 2724.12, "total_tokens": 838617024} {"current_steps": 4648, "total_steps": 9134, "loss": 0.7074, "learning_rate": 2.4303601684989698e-05, "epoch": 0.5088261857193683, "percentage": 50.89, "elapsed_time": "3 days, 13:31:51", "remaining_time": "3 days, 10:32:59", "throughput": 2724.07, "total_tokens": 838774048} {"current_steps": 4649, "total_steps": 9134, "loss": 0.8319, "learning_rate": 2.429500644073364e-05, "epoch": 0.5089356577903063, "percentage": 50.9, "elapsed_time": "3 days, 13:32:54", "remaining_time": "3 days, 10:31:50", "throughput": 2724.1, "total_tokens": 838955488} {"current_steps": 4650, "total_steps": 9134, "loss": 0.854, "learning_rate": 2.428641127987697e-05, "epoch": 0.5090451298612442, "percentage": 50.91, "elapsed_time": "3 days, 13:34:01", "remaining_time": "3 days, 10:30:44", "throughput": 2724.12, "total_tokens": 839140512} {"current_steps": 4651, "total_steps": 9134, "loss": 0.7887, "learning_rate": 2.4277816203436498e-05, "epoch": 0.5091546019321821, "percentage": 50.92, "elapsed_time": "3 days, 13:35:09", "remaining_time": "3 days, 10:29:40", "throughput": 2724.12, "total_tokens": 839327776} {"current_steps": 4652, "total_steps": 9134, "loss": 0.8172, "learning_rate": 2.426922121242897e-05, "epoch": 0.5092640740031199, "percentage": 50.93, "elapsed_time": "3 days, 13:36:12", "remaining_time": "3 days, 10:28:30", "throughput": 2724.05, "total_tokens": 839476512} {"current_steps": 4653, "total_steps": 9134, "loss": 0.7144, "learning_rate": 2.426062630787119e-05, "epoch": 0.5093735460740578, "percentage": 50.94, "elapsed_time": "3 days, 13:37:18", "remaining_time": "3 days, 10:27:24", "throughput": 2724.04, "total_tokens": 839655264} {"current_steps": 4654, "total_steps": 9134, "loss": 0.8514, "learning_rate": 2.4252031490779894e-05, "epoch": 0.5094830181449957, "percentage": 50.95, "elapsed_time": "3 days, 13:38:23", "remaining_time": "3 days, 10:26:16", "throughput": 2724.05, "total_tokens": 839833792} {"current_steps": 4655, "total_steps": 9134, "loss": 0.6819, "learning_rate": 2.4243436762171848e-05, "epoch": 0.5095924902159337, "percentage": 50.96, "elapsed_time": "3 days, 13:39:24", "remaining_time": "3 days, 10:25:05", "throughput": 2724.04, "total_tokens": 839998432} {"current_steps": 4656, "total_steps": 9134, "loss": 0.9939, "learning_rate": 2.4234842123063786e-05, "epoch": 0.5097019622868716, "percentage": 50.97, "elapsed_time": "3 days, 13:40:34", "remaining_time": "3 days, 10:24:02", "throughput": 2724.11, "total_tokens": 840208544} {"current_steps": 4657, "total_steps": 9134, "loss": 0.635, "learning_rate": 2.4226247574472433e-05, "epoch": 0.5098114343578095, "percentage": 50.99, "elapsed_time": "3 days, 13:41:42", "remaining_time": "3 days, 10:22:58", "throughput": 2724.11, "total_tokens": 840393344} {"current_steps": 4658, "total_steps": 9134, "loss": 0.7471, "learning_rate": 2.421765311741452e-05, "epoch": 0.5099209064287473, "percentage": 51.0, "elapsed_time": "3 days, 13:42:48", "remaining_time": "3 days, 10:21:51", "throughput": 2724.09, "total_tokens": 840566944} {"current_steps": 4659, "total_steps": 9134, "loss": 0.5094, "learning_rate": 2.420905875290674e-05, "epoch": 0.5100303784996852, "percentage": 51.01, "elapsed_time": "3 days, 13:43:53", "remaining_time": "3 days, 10:20:44", "throughput": 2724.06, "total_tokens": 840736288} {"current_steps": 4660, "total_steps": 9134, "loss": 0.7844, "learning_rate": 2.4200464481965807e-05, "epoch": 0.5101398505706232, "percentage": 51.02, "elapsed_time": "3 days, 13:45:03", "remaining_time": "3 days, 10:19:41", "throughput": 2724.1, "total_tokens": 840937664} {"current_steps": 4661, "total_steps": 9134, "loss": 0.7691, "learning_rate": 2.419187030560839e-05, "epoch": 0.5102493226415611, "percentage": 51.03, "elapsed_time": "3 days, 13:46:13", "remaining_time": "3 days, 10:18:38", "throughput": 2724.12, "total_tokens": 841136128} {"current_steps": 4662, "total_steps": 9134, "loss": 0.6193, "learning_rate": 2.4183276224851178e-05, "epoch": 0.510358794712499, "percentage": 51.04, "elapsed_time": "3 days, 13:47:20", "remaining_time": "3 days, 10:17:34", "throughput": 2724.14, "total_tokens": 841324288} {"current_steps": 4663, "total_steps": 9134, "loss": 0.6841, "learning_rate": 2.417468224071082e-05, "epoch": 0.5104682667834369, "percentage": 51.05, "elapsed_time": "3 days, 13:48:25", "remaining_time": "3 days, 10:16:26", "throughput": 2724.04, "total_tokens": 841469888} {"current_steps": 4664, "total_steps": 9134, "loss": 0.9889, "learning_rate": 2.4166088354203974e-05, "epoch": 0.5105777388543747, "percentage": 51.06, "elapsed_time": "3 days, 13:49:29", "remaining_time": "3 days, 10:15:17", "throughput": 2724.02, "total_tokens": 841637888} {"current_steps": 4665, "total_steps": 9134, "loss": 0.5168, "learning_rate": 2.415749456634729e-05, "epoch": 0.5106872109253127, "percentage": 51.07, "elapsed_time": "3 days, 13:50:33", "remaining_time": "3 days, 10:14:09", "throughput": 2724.03, "total_tokens": 841817760} {"current_steps": 4666, "total_steps": 9134, "loss": 0.864, "learning_rate": 2.4148900878157378e-05, "epoch": 0.5107966829962506, "percentage": 51.08, "elapsed_time": "3 days, 13:51:41", "remaining_time": "3 days, 10:13:05", "throughput": 2724.13, "total_tokens": 842032576} {"current_steps": 4667, "total_steps": 9134, "loss": 0.4939, "learning_rate": 2.4140307290650874e-05, "epoch": 0.5109061550671885, "percentage": 51.09, "elapsed_time": "3 days, 13:52:50", "remaining_time": "3 days, 10:12:01", "throughput": 2724.15, "total_tokens": 842226560} {"current_steps": 4668, "total_steps": 9134, "loss": 0.8269, "learning_rate": 2.4131713804844364e-05, "epoch": 0.5110156271381264, "percentage": 51.11, "elapsed_time": "3 days, 13:53:58", "remaining_time": "3 days, 10:10:56", "throughput": 2724.16, "total_tokens": 842414496} {"current_steps": 4669, "total_steps": 9134, "loss": 0.5688, "learning_rate": 2.412312042175446e-05, "epoch": 0.5111250992090642, "percentage": 51.12, "elapsed_time": "3 days, 13:55:08", "remaining_time": "3 days, 10:09:53", "throughput": 2724.17, "total_tokens": 842608704} {"current_steps": 4670, "total_steps": 9134, "loss": 0.7895, "learning_rate": 2.4114527142397732e-05, "epoch": 0.5112345712800022, "percentage": 51.13, "elapsed_time": "3 days, 13:56:13", "remaining_time": "3 days, 10:08:46", "throughput": 2724.15, "total_tokens": 842780064} {"current_steps": 4671, "total_steps": 9134, "loss": 0.6927, "learning_rate": 2.4105933967790744e-05, "epoch": 0.5113440433509401, "percentage": 51.14, "elapsed_time": "3 days, 13:57:19", "remaining_time": "3 days, 10:07:40", "throughput": 2724.22, "total_tokens": 842981440} {"current_steps": 4672, "total_steps": 9134, "loss": 0.772, "learning_rate": 2.4097340898950073e-05, "epoch": 0.511453515421878, "percentage": 51.15, "elapsed_time": "3 days, 13:58:28", "remaining_time": "3 days, 10:06:36", "throughput": 2724.25, "total_tokens": 843179456} {"current_steps": 4673, "total_steps": 9134, "loss": 1.0709, "learning_rate": 2.4088747936892237e-05, "epoch": 0.5115629874928159, "percentage": 51.16, "elapsed_time": "3 days, 13:59:36", "remaining_time": "3 days, 10:05:31", "throughput": 2724.27, "total_tokens": 843370528} {"current_steps": 4674, "total_steps": 9134, "loss": 0.7427, "learning_rate": 2.4080155082633784e-05, "epoch": 0.5116724595637538, "percentage": 51.17, "elapsed_time": "3 days, 14:00:40", "remaining_time": "3 days, 10:04:23", "throughput": 2724.27, "total_tokens": 843543232} {"current_steps": 4675, "total_steps": 9134, "loss": 0.7398, "learning_rate": 2.407156233719122e-05, "epoch": 0.5117819316346917, "percentage": 51.18, "elapsed_time": "3 days, 14:01:49", "remaining_time": "3 days, 10:03:20", "throughput": 2724.35, "total_tokens": 843756480} {"current_steps": 4676, "total_steps": 9134, "loss": 0.7332, "learning_rate": 2.4062969701581054e-05, "epoch": 0.5118914037056296, "percentage": 51.19, "elapsed_time": "3 days, 14:02:58", "remaining_time": "3 days, 10:02:16", "throughput": 2724.38, "total_tokens": 843955392} {"current_steps": 4677, "total_steps": 9134, "loss": 0.5909, "learning_rate": 2.4054377176819793e-05, "epoch": 0.5120008757765675, "percentage": 51.2, "elapsed_time": "3 days, 14:04:08", "remaining_time": "3 days, 10:01:13", "throughput": 2724.44, "total_tokens": 844163488} {"current_steps": 4678, "total_steps": 9134, "loss": 0.7168, "learning_rate": 2.4045784763923893e-05, "epoch": 0.5121103478475054, "percentage": 51.22, "elapsed_time": "3 days, 14:05:16", "remaining_time": "3 days, 10:00:09", "throughput": 2724.43, "total_tokens": 844345824} {"current_steps": 4679, "total_steps": 9134, "loss": 0.8186, "learning_rate": 2.4037192463909837e-05, "epoch": 0.5122198199184433, "percentage": 51.23, "elapsed_time": "3 days, 14:06:24", "remaining_time": "3 days, 9:59:04", "throughput": 2724.36, "total_tokens": 844507776} {"current_steps": 4680, "total_steps": 9134, "loss": 0.9017, "learning_rate": 2.4028600277794066e-05, "epoch": 0.5123292919893813, "percentage": 51.24, "elapsed_time": "3 days, 14:07:34", "remaining_time": "3 days, 9:58:01", "throughput": 2724.41, "total_tokens": 844713856} {"current_steps": 4681, "total_steps": 9134, "loss": 0.6588, "learning_rate": 2.4020008206593036e-05, "epoch": 0.5124387640603191, "percentage": 51.25, "elapsed_time": "3 days, 14:08:39", "remaining_time": "3 days, 9:56:54", "throughput": 2724.38, "total_tokens": 844884096} {"current_steps": 4682, "total_steps": 9134, "loss": 0.6475, "learning_rate": 2.401141625132315e-05, "epoch": 0.512548236131257, "percentage": 51.26, "elapsed_time": "3 days, 14:09:46", "remaining_time": "3 days, 9:55:48", "throughput": 2724.31, "total_tokens": 845043360} {"current_steps": 4683, "total_steps": 9134, "loss": 0.6861, "learning_rate": 2.4002824413000836e-05, "epoch": 0.5126577082021949, "percentage": 51.27, "elapsed_time": "3 days, 14:10:49", "remaining_time": "3 days, 9:54:39", "throughput": 2724.21, "total_tokens": 845185824} {"current_steps": 4684, "total_steps": 9134, "loss": 0.6432, "learning_rate": 2.3994232692642496e-05, "epoch": 0.5127671802731328, "percentage": 51.28, "elapsed_time": "3 days, 14:11:55", "remaining_time": "3 days, 9:53:33", "throughput": 2724.18, "total_tokens": 845354944} {"current_steps": 4685, "total_steps": 9134, "loss": 0.8197, "learning_rate": 2.3985641091264495e-05, "epoch": 0.5128766523440708, "percentage": 51.29, "elapsed_time": "3 days, 14:13:01", "remaining_time": "3 days, 9:52:26", "throughput": 2724.22, "total_tokens": 845546912} {"current_steps": 4686, "total_steps": 9134, "loss": 0.7045, "learning_rate": 2.3977049609883222e-05, "epoch": 0.5129861244150086, "percentage": 51.3, "elapsed_time": "3 days, 14:14:02", "remaining_time": "3 days, 9:51:15", "throughput": 2724.16, "total_tokens": 845696768} {"current_steps": 4687, "total_steps": 9134, "loss": 0.7707, "learning_rate": 2.3968458249515016e-05, "epoch": 0.5130955964859465, "percentage": 51.31, "elapsed_time": "3 days, 14:15:08", "remaining_time": "3 days, 9:50:09", "throughput": 2724.12, "total_tokens": 845863200} {"current_steps": 4688, "total_steps": 9134, "loss": 1.0119, "learning_rate": 2.395986701117623e-05, "epoch": 0.5132050685568844, "percentage": 51.32, "elapsed_time": "3 days, 14:16:17", "remaining_time": "3 days, 9:49:04", "throughput": 2724.08, "total_tokens": 846036576} {"current_steps": 4689, "total_steps": 9134, "loss": 0.8651, "learning_rate": 2.3951275895883188e-05, "epoch": 0.5133145406278223, "percentage": 51.34, "elapsed_time": "3 days, 14:17:23", "remaining_time": "3 days, 9:47:58", "throughput": 2724.08, "total_tokens": 846219136} {"current_steps": 4690, "total_steps": 9134, "loss": 0.7929, "learning_rate": 2.3942684904652204e-05, "epoch": 0.5134240126987603, "percentage": 51.35, "elapsed_time": "3 days, 14:18:32", "remaining_time": "3 days, 9:46:54", "throughput": 2724.07, "total_tokens": 846402368} {"current_steps": 4691, "total_steps": 9134, "loss": 0.8649, "learning_rate": 2.3934094038499577e-05, "epoch": 0.5135334847696982, "percentage": 51.36, "elapsed_time": "3 days, 14:19:38", "remaining_time": "3 days, 9:45:48", "throughput": 2724.04, "total_tokens": 846574400} {"current_steps": 4692, "total_steps": 9134, "loss": 0.7526, "learning_rate": 2.392550329844158e-05, "epoch": 0.513642956840636, "percentage": 51.37, "elapsed_time": "3 days, 14:20:48", "remaining_time": "3 days, 9:44:46", "throughput": 2723.97, "total_tokens": 846742624} {"current_steps": 4693, "total_steps": 9134, "loss": 0.6734, "learning_rate": 2.3916912685494502e-05, "epoch": 0.5137524289115739, "percentage": 51.38, "elapsed_time": "3 days, 14:21:54", "remaining_time": "3 days, 9:43:39", "throughput": 2723.99, "total_tokens": 846930336} {"current_steps": 4694, "total_steps": 9134, "loss": 0.7444, "learning_rate": 2.390832220067457e-05, "epoch": 0.5138619009825118, "percentage": 51.39, "elapsed_time": "3 days, 14:23:03", "remaining_time": "3 days, 9:42:35", "throughput": 2724.02, "total_tokens": 847123648} {"current_steps": 4695, "total_steps": 9134, "loss": 0.8045, "learning_rate": 2.3899731844998048e-05, "epoch": 0.5139713730534498, "percentage": 51.4, "elapsed_time": "3 days, 14:24:09", "remaining_time": "3 days, 9:41:29", "throughput": 2723.97, "total_tokens": 847290752} {"current_steps": 4696, "total_steps": 9134, "loss": 0.7587, "learning_rate": 2.3891141619481132e-05, "epoch": 0.5140808451243877, "percentage": 51.41, "elapsed_time": "3 days, 14:25:14", "remaining_time": "3 days, 9:40:21", "throughput": 2723.97, "total_tokens": 847467488} {"current_steps": 4697, "total_steps": 9134, "loss": 0.682, "learning_rate": 2.388255152514004e-05, "epoch": 0.5141903171953256, "percentage": 51.42, "elapsed_time": "3 days, 14:26:23", "remaining_time": "3 days, 9:39:18", "throughput": 2723.98, "total_tokens": 847657664} {"current_steps": 4698, "total_steps": 9134, "loss": 0.4822, "learning_rate": 2.387396156299098e-05, "epoch": 0.5142997892662634, "percentage": 51.43, "elapsed_time": "3 days, 14:27:28", "remaining_time": "3 days, 9:38:10", "throughput": 2723.97, "total_tokens": 847830144} {"current_steps": 4699, "total_steps": 9134, "loss": 0.6122, "learning_rate": 2.3865371734050107e-05, "epoch": 0.5144092613372013, "percentage": 51.45, "elapsed_time": "3 days, 14:28:30", "remaining_time": "3 days, 9:37:00", "throughput": 2723.95, "total_tokens": 847996352} {"current_steps": 4700, "total_steps": 9134, "loss": 0.687, "learning_rate": 2.385678203933359e-05, "epoch": 0.5145187334081393, "percentage": 51.46, "elapsed_time": "3 days, 14:29:37", "remaining_time": "3 days, 9:35:55", "throughput": 2723.93, "total_tokens": 848172416} {"current_steps": 4701, "total_steps": 9134, "loss": 0.6665, "learning_rate": 2.3848192479857566e-05, "epoch": 0.5146282054790772, "percentage": 51.47, "elapsed_time": "3 days, 14:30:46", "remaining_time": "3 days, 9:34:51", "throughput": 2724.0, "total_tokens": 848379392} {"current_steps": 4702, "total_steps": 9134, "loss": 0.7487, "learning_rate": 2.3839603056638186e-05, "epoch": 0.5147376775500151, "percentage": 51.48, "elapsed_time": "3 days, 14:31:49", "remaining_time": "3 days, 9:33:41", "throughput": 2723.96, "total_tokens": 848538208} {"current_steps": 4703, "total_steps": 9134, "loss": 0.6476, "learning_rate": 2.3831013770691533e-05, "epoch": 0.5148471496209529, "percentage": 51.49, "elapsed_time": "3 days, 14:32:50", "remaining_time": "3 days, 9:32:30", "throughput": 2723.91, "total_tokens": 848689408} {"current_steps": 4704, "total_steps": 9134, "loss": 0.9179, "learning_rate": 2.3822424623033712e-05, "epoch": 0.5149566216918908, "percentage": 51.5, "elapsed_time": "3 days, 14:33:56", "remaining_time": "3 days, 9:31:24", "throughput": 2723.9, "total_tokens": 848866592} {"current_steps": 4705, "total_steps": 9134, "loss": 0.6197, "learning_rate": 2.381383561468082e-05, "epoch": 0.5150660937628287, "percentage": 51.51, "elapsed_time": "3 days, 14:35:06", "remaining_time": "3 days, 9:30:21", "throughput": 2723.94, "total_tokens": 849069088} {"current_steps": 4706, "total_steps": 9134, "loss": 0.8342, "learning_rate": 2.38052467466489e-05, "epoch": 0.5151755658337667, "percentage": 51.52, "elapsed_time": "3 days, 14:36:08", "remaining_time": "3 days, 9:29:11", "throughput": 2723.84, "total_tokens": 849207072} {"current_steps": 4707, "total_steps": 9134, "loss": 0.8924, "learning_rate": 2.3796658019954013e-05, "epoch": 0.5152850379047046, "percentage": 51.53, "elapsed_time": "3 days, 14:37:17", "remaining_time": "3 days, 9:28:07", "throughput": 2723.87, "total_tokens": 849402400} {"current_steps": 4708, "total_steps": 9134, "loss": 0.6358, "learning_rate": 2.3788069435612174e-05, "epoch": 0.5153945099756425, "percentage": 51.54, "elapsed_time": "3 days, 14:38:21", "remaining_time": "3 days, 9:26:59", "throughput": 2723.83, "total_tokens": 849567712} {"current_steps": 4709, "total_steps": 9134, "loss": 0.8459, "learning_rate": 2.3779480994639406e-05, "epoch": 0.5155039820465803, "percentage": 51.55, "elapsed_time": "3 days, 14:39:26", "remaining_time": "3 days, 9:25:51", "throughput": 2723.86, "total_tokens": 849753184} {"current_steps": 4710, "total_steps": 9134, "loss": 0.6796, "learning_rate": 2.37708926980517e-05, "epoch": 0.5156134541175182, "percentage": 51.57, "elapsed_time": "3 days, 14:40:29", "remaining_time": "3 days, 9:24:42", "throughput": 2723.81, "total_tokens": 849909984} {"current_steps": 4711, "total_steps": 9134, "loss": 0.707, "learning_rate": 2.3762304546865042e-05, "epoch": 0.5157229261884562, "percentage": 51.58, "elapsed_time": "3 days, 14:41:32", "remaining_time": "3 days, 9:23:32", "throughput": 2723.7, "total_tokens": 850046400} {"current_steps": 4712, "total_steps": 9134, "loss": 0.7439, "learning_rate": 2.375371654209539e-05, "epoch": 0.5158323982593941, "percentage": 51.59, "elapsed_time": "3 days, 14:42:40", "remaining_time": "3 days, 9:22:28", "throughput": 2723.78, "total_tokens": 850255392} {"current_steps": 4713, "total_steps": 9134, "loss": 0.8206, "learning_rate": 2.3745128684758684e-05, "epoch": 0.515941870330332, "percentage": 51.6, "elapsed_time": "3 days, 14:43:45", "remaining_time": "3 days, 9:21:21", "throughput": 2723.78, "total_tokens": 850433696} {"current_steps": 4714, "total_steps": 9134, "loss": 0.9746, "learning_rate": 2.3736540975870865e-05, "epoch": 0.5160513424012699, "percentage": 51.61, "elapsed_time": "3 days, 14:44:51", "remaining_time": "3 days, 9:20:14", "throughput": 2723.81, "total_tokens": 850622304} {"current_steps": 4715, "total_steps": 9134, "loss": 0.6455, "learning_rate": 2.3727953416447826e-05, "epoch": 0.5161608144722077, "percentage": 51.62, "elapsed_time": "3 days, 14:46:00", "remaining_time": "3 days, 9:19:10", "throughput": 2723.84, "total_tokens": 850818976} {"current_steps": 4716, "total_steps": 9134, "loss": 0.5936, "learning_rate": 2.3719366007505477e-05, "epoch": 0.5162702865431457, "percentage": 51.63, "elapsed_time": "3 days, 14:47:05", "remaining_time": "3 days, 9:18:03", "throughput": 2723.81, "total_tokens": 850986976} {"current_steps": 4717, "total_steps": 9134, "loss": 0.8448, "learning_rate": 2.3710778750059665e-05, "epoch": 0.5163797586140836, "percentage": 51.64, "elapsed_time": "3 days, 14:48:15", "remaining_time": "3 days, 9:17:00", "throughput": 2723.77, "total_tokens": 851166176} {"current_steps": 4718, "total_steps": 9134, "loss": 0.7961, "learning_rate": 2.3702191645126266e-05, "epoch": 0.5164892306850215, "percentage": 51.65, "elapsed_time": "3 days, 14:49:23", "remaining_time": "3 days, 9:15:56", "throughput": 2723.84, "total_tokens": 851374272} {"current_steps": 4719, "total_steps": 9134, "loss": 0.6708, "learning_rate": 2.3693604693721126e-05, "epoch": 0.5165987027559594, "percentage": 51.66, "elapsed_time": "3 days, 14:50:26", "remaining_time": "3 days, 9:14:46", "throughput": 2723.82, "total_tokens": 851537792} {"current_steps": 4720, "total_steps": 9134, "loss": 0.6459, "learning_rate": 2.368501789686004e-05, "epoch": 0.5167081748268972, "percentage": 51.68, "elapsed_time": "3 days, 14:51:32", "remaining_time": "3 days, 9:13:40", "throughput": 2723.82, "total_tokens": 851719456} {"current_steps": 4721, "total_steps": 9134, "loss": 0.5755, "learning_rate": 2.367643125555883e-05, "epoch": 0.5168176468978352, "percentage": 51.69, "elapsed_time": "3 days, 14:52:40", "remaining_time": "3 days, 9:12:35", "throughput": 2723.86, "total_tokens": 851915680} {"current_steps": 4722, "total_steps": 9134, "loss": 0.8051, "learning_rate": 2.3667844770833265e-05, "epoch": 0.5169271189687731, "percentage": 51.7, "elapsed_time": "3 days, 14:53:49", "remaining_time": "3 days, 9:11:32", "throughput": 2723.95, "total_tokens": 852133408} {"current_steps": 4723, "total_steps": 9134, "loss": 0.665, "learning_rate": 2.3659258443699128e-05, "epoch": 0.517036591039711, "percentage": 51.71, "elapsed_time": "3 days, 14:55:00", "remaining_time": "3 days, 9:10:30", "throughput": 2724.01, "total_tokens": 852343968} {"current_steps": 4724, "total_steps": 9134, "loss": 0.6773, "learning_rate": 2.3650672275172145e-05, "epoch": 0.5171460631106489, "percentage": 51.72, "elapsed_time": "3 days, 14:56:07", "remaining_time": "3 days, 9:09:24", "throughput": 2724.04, "total_tokens": 852535712} {"current_steps": 4725, "total_steps": 9134, "loss": 0.6971, "learning_rate": 2.3642086266268053e-05, "epoch": 0.5172555351815868, "percentage": 51.73, "elapsed_time": "3 days, 14:57:11", "remaining_time": "3 days, 9:08:16", "throughput": 2724.01, "total_tokens": 852701024} {"current_steps": 4726, "total_steps": 9134, "loss": 0.8445, "learning_rate": 2.363350041800257e-05, "epoch": 0.5173650072525247, "percentage": 51.74, "elapsed_time": "3 days, 14:58:18", "remaining_time": "3 days, 9:07:11", "throughput": 2724.03, "total_tokens": 852890080} {"current_steps": 4727, "total_steps": 9134, "loss": 0.8064, "learning_rate": 2.362491473139136e-05, "epoch": 0.5174744793234626, "percentage": 51.75, "elapsed_time": "3 days, 14:59:24", "remaining_time": "3 days, 9:06:04", "throughput": 2724.01, "total_tokens": 853063680} {"current_steps": 4728, "total_steps": 9134, "loss": 0.8204, "learning_rate": 2.3616329207450124e-05, "epoch": 0.5175839513944005, "percentage": 51.76, "elapsed_time": "3 days, 15:00:30", "remaining_time": "3 days, 9:04:57", "throughput": 2724.03, "total_tokens": 853249824} {"current_steps": 4729, "total_steps": 9134, "loss": 0.6753, "learning_rate": 2.360774384719449e-05, "epoch": 0.5176934234653384, "percentage": 51.77, "elapsed_time": "3 days, 15:01:37", "remaining_time": "3 days, 9:03:52", "throughput": 2724.03, "total_tokens": 853431040} {"current_steps": 4730, "total_steps": 9134, "loss": 0.8935, "learning_rate": 2.359915865164009e-05, "epoch": 0.5178028955362763, "percentage": 51.78, "elapsed_time": "3 days, 15:02:46", "remaining_time": "3 days, 9:02:48", "throughput": 2724.08, "total_tokens": 853635104} {"current_steps": 4731, "total_steps": 9134, "loss": 0.7694, "learning_rate": 2.3590573621802553e-05, "epoch": 0.5179123676072143, "percentage": 51.8, "elapsed_time": "3 days, 15:03:55", "remaining_time": "3 days, 9:01:45", "throughput": 2724.14, "total_tokens": 853842976} {"current_steps": 4732, "total_steps": 9134, "loss": 0.7688, "learning_rate": 2.3581988758697463e-05, "epoch": 0.5180218396781521, "percentage": 51.81, "elapsed_time": "3 days, 15:05:02", "remaining_time": "3 days, 9:00:39", "throughput": 2724.12, "total_tokens": 854019488} {"current_steps": 4733, "total_steps": 9134, "loss": 0.905, "learning_rate": 2.3573404063340386e-05, "epoch": 0.51813131174909, "percentage": 51.82, "elapsed_time": "3 days, 15:06:09", "remaining_time": "3 days, 8:59:33", "throughput": 2724.12, "total_tokens": 854198688} {"current_steps": 4734, "total_steps": 9134, "loss": 0.593, "learning_rate": 2.3564819536746883e-05, "epoch": 0.5182407838200279, "percentage": 51.83, "elapsed_time": "3 days, 15:07:16", "remaining_time": "3 days, 8:58:27", "throughput": 2724.14, "total_tokens": 854389984} {"current_steps": 4735, "total_steps": 9134, "loss": 0.7793, "learning_rate": 2.3556235179932494e-05, "epoch": 0.5183502558909658, "percentage": 51.84, "elapsed_time": "3 days, 15:08:22", "remaining_time": "3 days, 8:57:21", "throughput": 2724.19, "total_tokens": 854586208} {"current_steps": 4736, "total_steps": 9134, "loss": 0.7146, "learning_rate": 2.354765099391271e-05, "epoch": 0.5184597279619038, "percentage": 51.85, "elapsed_time": "3 days, 15:09:29", "remaining_time": "3 days, 8:56:15", "throughput": 2724.21, "total_tokens": 854773920} {"current_steps": 4737, "total_steps": 9134, "loss": 0.7044, "learning_rate": 2.353906697970304e-05, "epoch": 0.5185692000328416, "percentage": 51.86, "elapsed_time": "3 days, 15:10:37", "remaining_time": "3 days, 8:55:11", "throughput": 2724.23, "total_tokens": 854964320} {"current_steps": 4738, "total_steps": 9134, "loss": 0.8837, "learning_rate": 2.3530483138318964e-05, "epoch": 0.5186786721037795, "percentage": 51.87, "elapsed_time": "3 days, 15:11:40", "remaining_time": "3 days, 8:54:02", "throughput": 2724.14, "total_tokens": 855109024} {"current_steps": 4739, "total_steps": 9134, "loss": 0.6832, "learning_rate": 2.352189947077591e-05, "epoch": 0.5187881441747174, "percentage": 51.88, "elapsed_time": "3 days, 15:12:46", "remaining_time": "3 days, 8:52:55", "throughput": 2724.13, "total_tokens": 855285312} {"current_steps": 4740, "total_steps": 9134, "loss": 0.652, "learning_rate": 2.3513315978089336e-05, "epoch": 0.5188976162456553, "percentage": 51.89, "elapsed_time": "3 days, 15:13:47", "remaining_time": "3 days, 8:51:45", "throughput": 2724.04, "total_tokens": 855423968} {"current_steps": 4741, "total_steps": 9134, "loss": 0.7119, "learning_rate": 2.3504732661274627e-05, "epoch": 0.5190070883165933, "percentage": 51.9, "elapsed_time": "3 days, 15:14:53", "remaining_time": "3 days, 8:50:38", "throughput": 2724.01, "total_tokens": 855593312} {"current_steps": 4742, "total_steps": 9134, "loss": 0.8052, "learning_rate": 2.3496149521347194e-05, "epoch": 0.5191165603875312, "percentage": 51.92, "elapsed_time": "3 days, 15:15:59", "remaining_time": "3 days, 8:49:31", "throughput": 2724.01, "total_tokens": 855771616} {"current_steps": 4743, "total_steps": 9134, "loss": 0.8435, "learning_rate": 2.348756655932239e-05, "epoch": 0.519226032458469, "percentage": 51.93, "elapsed_time": "3 days, 15:17:07", "remaining_time": "3 days, 8:48:26", "throughput": 2724.08, "total_tokens": 855980384} {"current_steps": 4744, "total_steps": 9134, "loss": 0.7079, "learning_rate": 2.3478983776215572e-05, "epoch": 0.5193355045294069, "percentage": 51.94, "elapsed_time": "3 days, 15:18:12", "remaining_time": "3 days, 8:47:19", "throughput": 2724.06, "total_tokens": 856150848} {"current_steps": 4745, "total_steps": 9134, "loss": 0.647, "learning_rate": 2.3470401173042076e-05, "epoch": 0.5194449766003448, "percentage": 51.95, "elapsed_time": "3 days, 15:19:15", "remaining_time": "3 days, 8:46:10", "throughput": 2724.04, "total_tokens": 856319296} {"current_steps": 4746, "total_steps": 9134, "loss": 0.6906, "learning_rate": 2.3461818750817186e-05, "epoch": 0.5195544486712828, "percentage": 51.96, "elapsed_time": "3 days, 15:20:22", "remaining_time": "3 days, 8:45:04", "throughput": 2724.1, "total_tokens": 856516864} {"current_steps": 4747, "total_steps": 9134, "loss": 0.6833, "learning_rate": 2.3453236510556207e-05, "epoch": 0.5196639207422207, "percentage": 51.97, "elapsed_time": "3 days, 15:21:25", "remaining_time": "3 days, 8:43:55", "throughput": 2724.06, "total_tokens": 856678144} {"current_steps": 4748, "total_steps": 9134, "loss": 0.7495, "learning_rate": 2.344465445327438e-05, "epoch": 0.5197733928131586, "percentage": 51.98, "elapsed_time": "3 days, 15:22:30", "remaining_time": "3 days, 8:42:48", "throughput": 2724.01, "total_tokens": 856839424} {"current_steps": 4749, "total_steps": 9134, "loss": 0.5976, "learning_rate": 2.3436072579986973e-05, "epoch": 0.5198828648840964, "percentage": 51.99, "elapsed_time": "3 days, 15:23:36", "remaining_time": "3 days, 8:41:42", "throughput": 2724.01, "total_tokens": 857019072} {"current_steps": 4750, "total_steps": 9134, "loss": 0.6886, "learning_rate": 2.3427490891709176e-05, "epoch": 0.5199923369550343, "percentage": 52.0, "elapsed_time": "3 days, 15:24:46", "remaining_time": "3 days, 8:40:38", "throughput": 2724.09, "total_tokens": 857234336} {"current_steps": 4751, "total_steps": 9134, "loss": 0.5229, "learning_rate": 2.3418909389456203e-05, "epoch": 0.5201018090259723, "percentage": 52.01, "elapsed_time": "3 days, 15:25:49", "remaining_time": "3 days, 8:39:29", "throughput": 2724.05, "total_tokens": 857394496} {"current_steps": 4752, "total_steps": 9134, "loss": 0.6878, "learning_rate": 2.3410328074243232e-05, "epoch": 0.5202112810969102, "percentage": 52.03, "elapsed_time": "3 days, 15:26:59", "remaining_time": "3 days, 8:38:27", "throughput": 2724.06, "total_tokens": 857587136} {"current_steps": 4753, "total_steps": 9134, "loss": 0.6391, "learning_rate": 2.340174694708541e-05, "epoch": 0.5203207531678481, "percentage": 52.04, "elapsed_time": "3 days, 15:28:08", "remaining_time": "3 days, 8:37:23", "throughput": 2724.05, "total_tokens": 857772832} {"current_steps": 4754, "total_steps": 9134, "loss": 0.6634, "learning_rate": 2.339316600899787e-05, "epoch": 0.5204302252387859, "percentage": 52.05, "elapsed_time": "3 days, 15:29:12", "remaining_time": "3 days, 8:36:14", "throughput": 2724.0, "total_tokens": 857929856} {"current_steps": 4755, "total_steps": 9134, "loss": 0.885, "learning_rate": 2.338458526099571e-05, "epoch": 0.5205396973097238, "percentage": 52.06, "elapsed_time": "3 days, 15:30:20", "remaining_time": "3 days, 8:35:09", "throughput": 2723.99, "total_tokens": 858113088} {"current_steps": 4756, "total_steps": 9134, "loss": 0.7307, "learning_rate": 2.337600470409404e-05, "epoch": 0.5206491693806617, "percentage": 52.07, "elapsed_time": "3 days, 15:31:24", "remaining_time": "3 days, 8:34:02", "throughput": 2723.93, "total_tokens": 858268768} {"current_steps": 4757, "total_steps": 9134, "loss": 0.7408, "learning_rate": 2.3367424339307895e-05, "epoch": 0.5207586414515997, "percentage": 52.08, "elapsed_time": "3 days, 15:32:31", "remaining_time": "3 days, 8:32:56", "throughput": 2723.98, "total_tokens": 858467456} {"current_steps": 4758, "total_steps": 9134, "loss": 0.7521, "learning_rate": 2.3358844167652334e-05, "epoch": 0.5208681135225376, "percentage": 52.09, "elapsed_time": "3 days, 15:33:40", "remaining_time": "3 days, 8:31:53", "throughput": 2724.0, "total_tokens": 858660320} {"current_steps": 4759, "total_steps": 9134, "loss": 0.7516, "learning_rate": 2.3350264190142377e-05, "epoch": 0.5209775855934755, "percentage": 52.1, "elapsed_time": "3 days, 15:34:50", "remaining_time": "3 days, 8:30:49", "throughput": 2724.04, "total_tokens": 858864160} {"current_steps": 4760, "total_steps": 9134, "loss": 0.8894, "learning_rate": 2.3341684407793004e-05, "epoch": 0.5210870576644133, "percentage": 52.11, "elapsed_time": "3 days, 15:35:56", "remaining_time": "3 days, 8:29:43", "throughput": 2723.97, "total_tokens": 859019168} {"current_steps": 4761, "total_steps": 9134, "loss": 0.5534, "learning_rate": 2.3333104821619207e-05, "epoch": 0.5211965297353512, "percentage": 52.12, "elapsed_time": "3 days, 15:37:01", "remaining_time": "3 days, 8:28:36", "throughput": 2723.95, "total_tokens": 859194112} {"current_steps": 4762, "total_steps": 9134, "loss": 0.6153, "learning_rate": 2.332452543263591e-05, "epoch": 0.5213060018062892, "percentage": 52.13, "elapsed_time": "3 days, 15:38:01", "remaining_time": "3 days, 8:27:24", "throughput": 2723.85, "total_tokens": 859324256} {"current_steps": 4763, "total_steps": 9134, "loss": 0.7163, "learning_rate": 2.3315946241858058e-05, "epoch": 0.5214154738772271, "percentage": 52.15, "elapsed_time": "3 days, 15:39:06", "remaining_time": "3 days, 8:26:17", "throughput": 2723.87, "total_tokens": 859509952} {"current_steps": 4764, "total_steps": 9134, "loss": 0.7455, "learning_rate": 2.330736725030054e-05, "epoch": 0.521524945948165, "percentage": 52.16, "elapsed_time": "3 days, 15:40:12", "remaining_time": "3 days, 8:25:10", "throughput": 2723.85, "total_tokens": 859683328} {"current_steps": 4765, "total_steps": 9134, "loss": 0.7198, "learning_rate": 2.329878845897824e-05, "epoch": 0.5216344180191029, "percentage": 52.17, "elapsed_time": "3 days, 15:41:12", "remaining_time": "3 days, 8:23:58", "throughput": 2723.81, "total_tokens": 859834528} {"current_steps": 4766, "total_steps": 9134, "loss": 0.7367, "learning_rate": 2.3290209868906025e-05, "epoch": 0.5217438900900407, "percentage": 52.18, "elapsed_time": "3 days, 15:42:19", "remaining_time": "3 days, 8:22:53", "throughput": 2723.77, "total_tokens": 860001632} {"current_steps": 4767, "total_steps": 9134, "loss": 0.4768, "learning_rate": 2.3281631481098704e-05, "epoch": 0.5218533621609787, "percentage": 52.19, "elapsed_time": "3 days, 15:43:28", "remaining_time": "3 days, 8:21:49", "throughput": 2723.82, "total_tokens": 860206368} {"current_steps": 4768, "total_steps": 9134, "loss": 0.7879, "learning_rate": 2.3273053296571104e-05, "epoch": 0.5219628342319166, "percentage": 52.2, "elapsed_time": "3 days, 15:44:35", "remaining_time": "3 days, 8:20:43", "throughput": 2723.77, "total_tokens": 860373696} {"current_steps": 4769, "total_steps": 9134, "loss": 0.9015, "learning_rate": 2.326447531633799e-05, "epoch": 0.5220723063028545, "percentage": 52.21, "elapsed_time": "3 days, 15:45:45", "remaining_time": "3 days, 8:19:40", "throughput": 2723.84, "total_tokens": 860584704} {"current_steps": 4770, "total_steps": 9134, "loss": 1.005, "learning_rate": 2.3255897541414133e-05, "epoch": 0.5221817783737924, "percentage": 52.22, "elapsed_time": "3 days, 15:46:55", "remaining_time": "3 days, 8:18:37", "throughput": 2723.88, "total_tokens": 860787872} {"current_steps": 4771, "total_steps": 9134, "loss": 0.8123, "learning_rate": 2.3247319972814256e-05, "epoch": 0.5222912504447302, "percentage": 52.23, "elapsed_time": "3 days, 15:48:04", "remaining_time": "3 days, 8:17:33", "throughput": 2723.84, "total_tokens": 860964384} {"current_steps": 4772, "total_steps": 9134, "loss": 0.7913, "learning_rate": 2.3238742611553075e-05, "epoch": 0.5224007225156682, "percentage": 52.24, "elapsed_time": "3 days, 15:49:07", "remaining_time": "3 days, 8:16:24", "throughput": 2723.85, "total_tokens": 861138656} {"current_steps": 4773, "total_steps": 9134, "loss": 0.646, "learning_rate": 2.3230165458645282e-05, "epoch": 0.5225101945866061, "percentage": 52.26, "elapsed_time": "3 days, 15:50:10", "remaining_time": "3 days, 8:15:15", "throughput": 2723.75, "total_tokens": 861280224} {"current_steps": 4774, "total_steps": 9134, "loss": 0.7289, "learning_rate": 2.322158851510553e-05, "epoch": 0.522619666657544, "percentage": 52.27, "elapsed_time": "3 days, 15:51:18", "remaining_time": "3 days, 8:14:10", "throughput": 2723.77, "total_tokens": 861469504} {"current_steps": 4775, "total_steps": 9134, "loss": 0.8554, "learning_rate": 2.3213011781948456e-05, "epoch": 0.5227291387284819, "percentage": 52.28, "elapsed_time": "3 days, 15:52:27", "remaining_time": "3 days, 8:13:07", "throughput": 2723.82, "total_tokens": 861674912} {"current_steps": 4776, "total_steps": 9134, "loss": 0.7139, "learning_rate": 2.320443526018867e-05, "epoch": 0.5228386107994198, "percentage": 52.29, "elapsed_time": "3 days, 15:53:36", "remaining_time": "3 days, 8:12:03", "throughput": 2723.85, "total_tokens": 861871136} {"current_steps": 4777, "total_steps": 9134, "loss": 0.7043, "learning_rate": 2.319585895084077e-05, "epoch": 0.5229480828703577, "percentage": 52.3, "elapsed_time": "3 days, 15:54:38", "remaining_time": "3 days, 8:10:53", "throughput": 2723.79, "total_tokens": 862021664} {"current_steps": 4778, "total_steps": 9134, "loss": 0.686, "learning_rate": 2.3187282854919296e-05, "epoch": 0.5230575549412956, "percentage": 52.31, "elapsed_time": "3 days, 15:55:44", "remaining_time": "3 days, 8:09:46", "throughput": 2723.83, "total_tokens": 862212960} {"current_steps": 4779, "total_steps": 9134, "loss": 0.5277, "learning_rate": 2.3178706973438793e-05, "epoch": 0.5231670270122335, "percentage": 52.32, "elapsed_time": "3 days, 15:56:51", "remaining_time": "3 days, 8:08:41", "throughput": 2723.89, "total_tokens": 862412768} {"current_steps": 4780, "total_steps": 9134, "loss": 0.7344, "learning_rate": 2.3170131307413788e-05, "epoch": 0.5232764990831714, "percentage": 52.33, "elapsed_time": "3 days, 15:58:00", "remaining_time": "3 days, 8:07:37", "throughput": 2723.86, "total_tokens": 862595552} {"current_steps": 4781, "total_steps": 9134, "loss": 0.6211, "learning_rate": 2.3161555857858735e-05, "epoch": 0.5233859711541093, "percentage": 52.34, "elapsed_time": "3 days, 15:59:10", "remaining_time": "3 days, 8:06:34", "throughput": 2723.92, "total_tokens": 862802976} {"current_steps": 4782, "total_steps": 9134, "loss": 0.6523, "learning_rate": 2.3152980625788126e-05, "epoch": 0.5234954432250473, "percentage": 52.35, "elapsed_time": "3 days, 16:00:19", "remaining_time": "3 days, 8:05:30", "throughput": 2723.97, "total_tokens": 863005024} {"current_steps": 4783, "total_steps": 9134, "loss": 0.6374, "learning_rate": 2.3144405612216365e-05, "epoch": 0.5236049152959851, "percentage": 52.36, "elapsed_time": "3 days, 16:01:27", "remaining_time": "3 days, 8:04:26", "throughput": 2723.96, "total_tokens": 863190048} {"current_steps": 4784, "total_steps": 9134, "loss": 0.6081, "learning_rate": 2.3135830818157877e-05, "epoch": 0.523714387366923, "percentage": 52.38, "elapsed_time": "3 days, 16:02:37", "remaining_time": "3 days, 8:03:23", "throughput": 2724.05, "total_tokens": 863408224} {"current_steps": 4785, "total_steps": 9134, "loss": 0.8334, "learning_rate": 2.3127256244627036e-05, "epoch": 0.5238238594378609, "percentage": 52.39, "elapsed_time": "3 days, 16:03:42", "remaining_time": "3 days, 8:02:16", "throughput": 2724.07, "total_tokens": 863591680} {"current_steps": 4786, "total_steps": 9134, "loss": 0.747, "learning_rate": 2.31186818926382e-05, "epoch": 0.5239333315087988, "percentage": 52.4, "elapsed_time": "3 days, 16:04:44", "remaining_time": "3 days, 8:01:05", "throughput": 2723.98, "total_tokens": 863731680} {"current_steps": 4787, "total_steps": 9134, "loss": 0.6623, "learning_rate": 2.311010776320571e-05, "epoch": 0.5240428035797368, "percentage": 52.41, "elapsed_time": "3 days, 16:05:50", "remaining_time": "3 days, 7:59:59", "throughput": 2723.92, "total_tokens": 863892960} {"current_steps": 4788, "total_steps": 9134, "loss": 0.8344, "learning_rate": 2.3101533857343848e-05, "epoch": 0.5241522756506746, "percentage": 52.42, "elapsed_time": "3 days, 16:06:55", "remaining_time": "3 days, 7:58:52", "throughput": 2723.93, "total_tokens": 864073504} {"current_steps": 4789, "total_steps": 9134, "loss": 0.6367, "learning_rate": 2.3092960176066912e-05, "epoch": 0.5242617477216125, "percentage": 52.43, "elapsed_time": "3 days, 16:07:58", "remaining_time": "3 days, 7:57:42", "throughput": 2723.85, "total_tokens": 864219552} {"current_steps": 4790, "total_steps": 9134, "loss": 0.597, "learning_rate": 2.3084386720389135e-05, "epoch": 0.5243712197925504, "percentage": 52.44, "elapsed_time": "3 days, 16:09:04", "remaining_time": "3 days, 7:56:36", "throughput": 2723.89, "total_tokens": 864410176} {"current_steps": 4791, "total_steps": 9134, "loss": 0.6825, "learning_rate": 2.3075813491324743e-05, "epoch": 0.5244806918634883, "percentage": 52.45, "elapsed_time": "3 days, 16:10:10", "remaining_time": "3 days, 7:55:29", "throughput": 2723.92, "total_tokens": 864601920} {"current_steps": 4792, "total_steps": 9134, "loss": 0.8041, "learning_rate": 2.3067240489887947e-05, "epoch": 0.5245901639344263, "percentage": 52.46, "elapsed_time": "3 days, 16:11:20", "remaining_time": "3 days, 7:54:26", "throughput": 2723.95, "total_tokens": 864798592} {"current_steps": 4793, "total_steps": 9134, "loss": 0.6823, "learning_rate": 2.3058667717092895e-05, "epoch": 0.5246996360053642, "percentage": 52.47, "elapsed_time": "3 days, 16:12:24", "remaining_time": "3 days, 7:53:18", "throughput": 2723.92, "total_tokens": 864965024} {"current_steps": 4794, "total_steps": 9134, "loss": 0.7255, "learning_rate": 2.305009517395375e-05, "epoch": 0.524809108076302, "percentage": 52.49, "elapsed_time": "3 days, 16:13:30", "remaining_time": "3 days, 7:52:12", "throughput": 2723.92, "total_tokens": 865144896} {"current_steps": 4795, "total_steps": 9134, "loss": 0.7192, "learning_rate": 2.3041522861484617e-05, "epoch": 0.5249185801472399, "percentage": 52.5, "elapsed_time": "3 days, 16:14:38", "remaining_time": "3 days, 7:51:07", "throughput": 2723.95, "total_tokens": 865338880} {"current_steps": 4796, "total_steps": 9134, "loss": 0.683, "learning_rate": 2.3032950780699582e-05, "epoch": 0.5250280522181778, "percentage": 52.51, "elapsed_time": "3 days, 16:15:47", "remaining_time": "3 days, 7:50:03", "throughput": 2723.99, "total_tokens": 865540928} {"current_steps": 4797, "total_steps": 9134, "loss": 0.8557, "learning_rate": 2.302437893261271e-05, "epoch": 0.5251375242891158, "percentage": 52.52, "elapsed_time": "3 days, 16:16:56", "remaining_time": "3 days, 7:48:59", "throughput": 2724.01, "total_tokens": 865735584} {"current_steps": 4798, "total_steps": 9134, "loss": 0.5805, "learning_rate": 2.3015807318238027e-05, "epoch": 0.5252469963600537, "percentage": 52.53, "elapsed_time": "3 days, 16:18:04", "remaining_time": "3 days, 7:47:55", "throughput": 2723.99, "total_tokens": 865913888} {"current_steps": 4799, "total_steps": 9134, "loss": 0.7204, "learning_rate": 2.300723593858956e-05, "epoch": 0.5253564684309916, "percentage": 52.54, "elapsed_time": "3 days, 16:19:13", "remaining_time": "3 days, 7:46:51", "throughput": 2723.98, "total_tokens": 866098912} {"current_steps": 4800, "total_steps": 9134, "loss": 0.8575, "learning_rate": 2.299866479468126e-05, "epoch": 0.5254659405019294, "percentage": 52.55, "elapsed_time": "3 days, 16:20:17", "remaining_time": "3 days, 7:45:42", "throughput": 2723.95, "total_tokens": 866262880} {"current_steps": 4801, "total_steps": 9134, "loss": 0.937, "learning_rate": 2.29900938875271e-05, "epoch": 0.5255754125728673, "percentage": 52.56, "elapsed_time": "3 days, 16:21:27", "remaining_time": "3 days, 7:44:40", "throughput": 2723.97, "total_tokens": 866459328} {"current_steps": 4802, "total_steps": 9134, "loss": 0.7265, "learning_rate": 2.298152321814098e-05, "epoch": 0.5256848846438053, "percentage": 52.57, "elapsed_time": "3 days, 16:22:33", "remaining_time": "3 days, 7:43:33", "throughput": 2723.93, "total_tokens": 866625536} {"current_steps": 4803, "total_steps": 9134, "loss": 0.417, "learning_rate": 2.2972952787536815e-05, "epoch": 0.5257943567147432, "percentage": 52.58, "elapsed_time": "3 days, 16:23:38", "remaining_time": "3 days, 7:42:26", "throughput": 2723.92, "total_tokens": 866801152} {"current_steps": 4804, "total_steps": 9134, "loss": 0.7237, "learning_rate": 2.2964382596728447e-05, "epoch": 0.5259038287856811, "percentage": 52.59, "elapsed_time": "3 days, 16:24:44", "remaining_time": "3 days, 7:41:19", "throughput": 2723.85, "total_tokens": 866957504} {"current_steps": 4805, "total_steps": 9134, "loss": 0.5086, "learning_rate": 2.295581264672973e-05, "epoch": 0.5260133008566189, "percentage": 52.61, "elapsed_time": "3 days, 16:25:47", "remaining_time": "3 days, 7:40:10", "throughput": 2723.82, "total_tokens": 867122144} {"current_steps": 4806, "total_steps": 9134, "loss": 0.5052, "learning_rate": 2.2947242938554475e-05, "epoch": 0.5261227729275568, "percentage": 52.62, "elapsed_time": "3 days, 16:26:54", "remaining_time": "3 days, 7:39:05", "throughput": 2723.85, "total_tokens": 867315008} {"current_steps": 4807, "total_steps": 9134, "loss": 0.8607, "learning_rate": 2.2938673473216448e-05, "epoch": 0.5262322449984947, "percentage": 52.63, "elapsed_time": "3 days, 16:27:59", "remaining_time": "3 days, 7:37:58", "throughput": 2723.85, "total_tokens": 867491296} {"current_steps": 4808, "total_steps": 9134, "loss": 0.6455, "learning_rate": 2.293010425172942e-05, "epoch": 0.5263417170694327, "percentage": 52.64, "elapsed_time": "3 days, 16:29:01", "remaining_time": "3 days, 7:36:48", "throughput": 2723.81, "total_tokens": 867647872} {"current_steps": 4809, "total_steps": 9134, "loss": 0.6339, "learning_rate": 2.2921535275107092e-05, "epoch": 0.5264511891403706, "percentage": 52.65, "elapsed_time": "3 days, 16:30:08", "remaining_time": "3 days, 7:35:42", "throughput": 2723.8, "total_tokens": 867824832} {"current_steps": 4810, "total_steps": 9134, "loss": 0.6224, "learning_rate": 2.291296654436318e-05, "epoch": 0.5265606612113085, "percentage": 52.66, "elapsed_time": "3 days, 16:31:17", "remaining_time": "3 days, 7:34:38", "throughput": 2723.86, "total_tokens": 868034944} {"current_steps": 4811, "total_steps": 9134, "loss": 0.8253, "learning_rate": 2.2904398060511324e-05, "epoch": 0.5266701332822463, "percentage": 52.67, "elapsed_time": "3 days, 16:32:25", "remaining_time": "3 days, 7:33:33", "throughput": 2723.85, "total_tokens": 868213696} {"current_steps": 4812, "total_steps": 9134, "loss": 0.6109, "learning_rate": 2.289582982456517e-05, "epoch": 0.5267796053531842, "percentage": 52.68, "elapsed_time": "3 days, 16:33:32", "remaining_time": "3 days, 7:32:28", "throughput": 2723.92, "total_tokens": 868419776} {"current_steps": 4813, "total_steps": 9134, "loss": 0.6017, "learning_rate": 2.2887261837538335e-05, "epoch": 0.5268890774241222, "percentage": 52.69, "elapsed_time": "3 days, 16:34:39", "remaining_time": "3 days, 7:31:22", "throughput": 2723.96, "total_tokens": 868614880} {"current_steps": 4814, "total_steps": 9134, "loss": 0.7352, "learning_rate": 2.2878694100444377e-05, "epoch": 0.5269985494950601, "percentage": 52.7, "elapsed_time": "3 days, 16:35:41", "remaining_time": "3 days, 7:30:12", "throughput": 2723.92, "total_tokens": 868771680} {"current_steps": 4815, "total_steps": 9134, "loss": 0.7668, "learning_rate": 2.2870126614296856e-05, "epoch": 0.527108021565998, "percentage": 52.72, "elapsed_time": "3 days, 16:36:43", "remaining_time": "3 days, 7:29:02", "throughput": 2723.93, "total_tokens": 868944608} {"current_steps": 4816, "total_steps": 9134, "loss": 0.78, "learning_rate": 2.2861559380109287e-05, "epoch": 0.5272174936369359, "percentage": 52.73, "elapsed_time": "3 days, 16:37:53", "remaining_time": "3 days, 7:27:59", "throughput": 2723.98, "total_tokens": 869149792} {"current_steps": 4817, "total_steps": 9134, "loss": 0.6638, "learning_rate": 2.2852992398895155e-05, "epoch": 0.5273269657078737, "percentage": 52.74, "elapsed_time": "3 days, 16:38:55", "remaining_time": "3 days, 7:26:49", "throughput": 2723.98, "total_tokens": 869318912} {"current_steps": 4818, "total_steps": 9134, "loss": 0.7344, "learning_rate": 2.284442567166791e-05, "epoch": 0.5274364377788117, "percentage": 52.75, "elapsed_time": "3 days, 16:40:05", "remaining_time": "3 days, 7:25:46", "throughput": 2724.06, "total_tokens": 869535072} {"current_steps": 4819, "total_steps": 9134, "loss": 0.8286, "learning_rate": 2.283585919944099e-05, "epoch": 0.5275459098497496, "percentage": 52.76, "elapsed_time": "3 days, 16:41:10", "remaining_time": "3 days, 7:24:39", "throughput": 2724.07, "total_tokens": 869713600} {"current_steps": 4820, "total_steps": 9134, "loss": 0.7133, "learning_rate": 2.28272929832278e-05, "epoch": 0.5276553819206875, "percentage": 52.77, "elapsed_time": "3 days, 16:42:13", "remaining_time": "3 days, 7:23:30", "throughput": 2724.0, "total_tokens": 869864800} {"current_steps": 4821, "total_steps": 9134, "loss": 0.7637, "learning_rate": 2.2818727024041685e-05, "epoch": 0.5277648539916254, "percentage": 52.78, "elapsed_time": "3 days, 16:43:20", "remaining_time": "3 days, 7:22:24", "throughput": 2723.96, "total_tokens": 870032352} {"current_steps": 4822, "total_steps": 9134, "loss": 0.7537, "learning_rate": 2.2810161322896e-05, "epoch": 0.5278743260625632, "percentage": 52.79, "elapsed_time": "3 days, 16:44:27", "remaining_time": "3 days, 7:21:18", "throughput": 2724.0, "total_tokens": 870229024} {"current_steps": 4823, "total_steps": 9134, "loss": 0.7722, "learning_rate": 2.2801595880804037e-05, "epoch": 0.5279837981335012, "percentage": 52.8, "elapsed_time": "3 days, 16:45:34", "remaining_time": "3 days, 7:20:13", "throughput": 2724.03, "total_tokens": 870419648} {"current_steps": 4824, "total_steps": 9134, "loss": 0.7127, "learning_rate": 2.279303069877909e-05, "epoch": 0.5280932702044391, "percentage": 52.81, "elapsed_time": "3 days, 16:46:42", "remaining_time": "3 days, 7:19:08", "throughput": 2724.03, "total_tokens": 870605120} {"current_steps": 4825, "total_steps": 9134, "loss": 0.8827, "learning_rate": 2.2784465777834383e-05, "epoch": 0.528202742275377, "percentage": 52.82, "elapsed_time": "3 days, 16:47:51", "remaining_time": "3 days, 7:18:05", "throughput": 2724.07, "total_tokens": 870809408} {"current_steps": 4826, "total_steps": 9134, "loss": 0.6874, "learning_rate": 2.2775901118983138e-05, "epoch": 0.5283122143463149, "percentage": 52.84, "elapsed_time": "3 days, 16:49:00", "remaining_time": "3 days, 7:17:00", "throughput": 2724.1, "total_tokens": 871003392} {"current_steps": 4827, "total_steps": 9134, "loss": 0.7421, "learning_rate": 2.2767336723238543e-05, "epoch": 0.5284216864172528, "percentage": 52.85, "elapsed_time": "3 days, 16:50:08", "remaining_time": "3 days, 7:15:56", "throughput": 2724.07, "total_tokens": 871181472} {"current_steps": 4828, "total_steps": 9134, "loss": 0.71, "learning_rate": 2.2758772591613743e-05, "epoch": 0.5285311584881907, "percentage": 52.86, "elapsed_time": "3 days, 16:51:15", "remaining_time": "3 days, 7:14:50", "throughput": 2724.05, "total_tokens": 871355744} {"current_steps": 4829, "total_steps": 9134, "loss": 0.8326, "learning_rate": 2.275020872512187e-05, "epoch": 0.5286406305591286, "percentage": 52.87, "elapsed_time": "3 days, 16:52:22", "remaining_time": "3 days, 7:13:45", "throughput": 2724.1, "total_tokens": 871553536} {"current_steps": 4830, "total_steps": 9134, "loss": 0.9164, "learning_rate": 2.274164512477599e-05, "epoch": 0.5287501026300665, "percentage": 52.88, "elapsed_time": "3 days, 16:53:24", "remaining_time": "3 days, 7:12:35", "throughput": 2724.03, "total_tokens": 871702496} {"current_steps": 4831, "total_steps": 9134, "loss": 0.7647, "learning_rate": 2.2733081791589188e-05, "epoch": 0.5288595747010044, "percentage": 52.89, "elapsed_time": "3 days, 16:54:30", "remaining_time": "3 days, 7:11:28", "throughput": 2723.96, "total_tokens": 871857280} {"current_steps": 4832, "total_steps": 9134, "loss": 0.6724, "learning_rate": 2.272451872657447e-05, "epoch": 0.5289690467719423, "percentage": 52.9, "elapsed_time": "3 days, 16:55:32", "remaining_time": "3 days, 7:10:18", "throughput": 2723.86, "total_tokens": 871994816} {"current_steps": 4833, "total_steps": 9134, "loss": 0.6445, "learning_rate": 2.2715955930744828e-05, "epoch": 0.5290785188428803, "percentage": 52.91, "elapsed_time": "3 days, 16:56:38", "remaining_time": "3 days, 7:09:12", "throughput": 2723.84, "total_tokens": 872168640} {"current_steps": 4834, "total_steps": 9134, "loss": 0.8357, "learning_rate": 2.2707393405113246e-05, "epoch": 0.5291879909138181, "percentage": 52.92, "elapsed_time": "3 days, 16:57:43", "remaining_time": "3 days, 7:08:04", "throughput": 2723.8, "total_tokens": 872334624} {"current_steps": 4835, "total_steps": 9134, "loss": 0.654, "learning_rate": 2.2698831150692635e-05, "epoch": 0.529297462984756, "percentage": 52.93, "elapsed_time": "3 days, 16:58:51", "remaining_time": "3 days, 7:06:59", "throughput": 2723.78, "total_tokens": 872512704} {"current_steps": 4836, "total_steps": 9134, "loss": 0.7207, "learning_rate": 2.2690269168495904e-05, "epoch": 0.5294069350556939, "percentage": 52.95, "elapsed_time": "3 days, 16:59:57", "remaining_time": "3 days, 7:05:53", "throughput": 2723.79, "total_tokens": 872695712} {"current_steps": 4837, "total_steps": 9134, "loss": 0.8417, "learning_rate": 2.2681707459535912e-05, "epoch": 0.5295164071266318, "percentage": 52.96, "elapsed_time": "3 days, 17:01:04", "remaining_time": "3 days, 7:04:48", "throughput": 2723.83, "total_tokens": 872890816} {"current_steps": 4838, "total_steps": 9134, "loss": 0.5884, "learning_rate": 2.2673146024825496e-05, "epoch": 0.5296258791975698, "percentage": 52.97, "elapsed_time": "3 days, 17:02:11", "remaining_time": "3 days, 7:03:42", "throughput": 2723.82, "total_tokens": 873069344} {"current_steps": 4839, "total_steps": 9134, "loss": 0.6925, "learning_rate": 2.2664584865377454e-05, "epoch": 0.5297353512685076, "percentage": 52.98, "elapsed_time": "3 days, 17:03:15", "remaining_time": "3 days, 7:02:34", "throughput": 2723.8, "total_tokens": 873238240} {"current_steps": 4840, "total_steps": 9134, "loss": 0.6294, "learning_rate": 2.2656023982204556e-05, "epoch": 0.5298448233394455, "percentage": 52.99, "elapsed_time": "3 days, 17:04:18", "remaining_time": "3 days, 7:01:24", "throughput": 2723.78, "total_tokens": 873401984} {"current_steps": 4841, "total_steps": 9134, "loss": 0.6402, "learning_rate": 2.2647463376319556e-05, "epoch": 0.5299542954103834, "percentage": 53.0, "elapsed_time": "3 days, 17:05:24", "remaining_time": "3 days, 7:00:18", "throughput": 2723.75, "total_tokens": 873573120} {"current_steps": 4842, "total_steps": 9134, "loss": 0.8164, "learning_rate": 2.2638903048735124e-05, "epoch": 0.5300637674813213, "percentage": 53.01, "elapsed_time": "3 days, 17:06:32", "remaining_time": "3 days, 6:59:13", "throughput": 2723.76, "total_tokens": 873760832} {"current_steps": 4843, "total_steps": 9134, "loss": 0.5049, "learning_rate": 2.263034300046396e-05, "epoch": 0.5301732395522593, "percentage": 53.02, "elapsed_time": "3 days, 17:07:34", "remaining_time": "3 days, 6:58:03", "throughput": 2723.66, "total_tokens": 873896352} {"current_steps": 4844, "total_steps": 9134, "loss": 0.7309, "learning_rate": 2.262178323251868e-05, "epoch": 0.5302827116231972, "percentage": 53.03, "elapsed_time": "3 days, 17:08:40", "remaining_time": "3 days, 6:56:57", "throughput": 2723.61, "total_tokens": 874062112} {"current_steps": 4845, "total_steps": 9134, "loss": 0.5604, "learning_rate": 2.2613223745911906e-05, "epoch": 0.530392183694135, "percentage": 53.04, "elapsed_time": "3 days, 17:09:47", "remaining_time": "3 days, 6:55:51", "throughput": 2723.55, "total_tokens": 874224512} {"current_steps": 4846, "total_steps": 9134, "loss": 0.6768, "learning_rate": 2.2604664541656193e-05, "epoch": 0.5305016557650729, "percentage": 53.05, "elapsed_time": "3 days, 17:10:53", "remaining_time": "3 days, 6:54:44", "throughput": 2723.59, "total_tokens": 874417152} {"current_steps": 4847, "total_steps": 9134, "loss": 0.8151, "learning_rate": 2.2596105620764083e-05, "epoch": 0.5306111278360108, "percentage": 53.07, "elapsed_time": "3 days, 17:12:02", "remaining_time": "3 days, 6:53:41", "throughput": 2723.61, "total_tokens": 874611584} {"current_steps": 4848, "total_steps": 9134, "loss": 0.7907, "learning_rate": 2.2587546984248086e-05, "epoch": 0.5307205999069488, "percentage": 53.08, "elapsed_time": "3 days, 17:13:07", "remaining_time": "3 days, 6:52:34", "throughput": 2723.55, "total_tokens": 874769952} {"current_steps": 4849, "total_steps": 9134, "loss": 0.6988, "learning_rate": 2.2578988633120667e-05, "epoch": 0.5308300719778867, "percentage": 53.09, "elapsed_time": "3 days, 17:14:14", "remaining_time": "3 days, 6:51:28", "throughput": 2723.54, "total_tokens": 874949376} {"current_steps": 4850, "total_steps": 9134, "loss": 0.7918, "learning_rate": 2.2570430568394275e-05, "epoch": 0.5309395440488246, "percentage": 53.1, "elapsed_time": "3 days, 17:15:20", "remaining_time": "3 days, 6:50:22", "throughput": 2723.54, "total_tokens": 875129472} {"current_steps": 4851, "total_steps": 9134, "loss": 0.8634, "learning_rate": 2.256187279108129e-05, "epoch": 0.5310490161197624, "percentage": 53.11, "elapsed_time": "3 days, 17:16:30", "remaining_time": "3 days, 6:49:18", "throughput": 2723.56, "total_tokens": 875325248} {"current_steps": 4852, "total_steps": 9134, "loss": 0.8175, "learning_rate": 2.2553315302194102e-05, "epoch": 0.5311584881907003, "percentage": 53.12, "elapsed_time": "3 days, 17:17:36", "remaining_time": "3 days, 6:48:12", "throughput": 2723.56, "total_tokens": 875504672} {"current_steps": 4853, "total_steps": 9134, "loss": 0.7567, "learning_rate": 2.254475810274503e-05, "epoch": 0.5312679602616383, "percentage": 53.13, "elapsed_time": "3 days, 17:18:45", "remaining_time": "3 days, 6:47:08", "throughput": 2723.58, "total_tokens": 875701792} {"current_steps": 4854, "total_steps": 9134, "loss": 0.7238, "learning_rate": 2.2536201193746375e-05, "epoch": 0.5313774323325762, "percentage": 53.14, "elapsed_time": "3 days, 17:19:52", "remaining_time": "3 days, 6:46:03", "throughput": 2723.62, "total_tokens": 875894880} {"current_steps": 4855, "total_steps": 9134, "loss": 0.7429, "learning_rate": 2.2527644576210423e-05, "epoch": 0.5314869044035141, "percentage": 53.15, "elapsed_time": "3 days, 17:21:01", "remaining_time": "3 days, 6:44:59", "throughput": 2723.66, "total_tokens": 876098272} {"current_steps": 4856, "total_steps": 9134, "loss": 0.548, "learning_rate": 2.2519088251149385e-05, "epoch": 0.5315963764744519, "percentage": 53.16, "elapsed_time": "3 days, 17:22:07", "remaining_time": "3 days, 6:43:52", "throughput": 2723.67, "total_tokens": 876279264} {"current_steps": 4857, "total_steps": 9134, "loss": 0.845, "learning_rate": 2.2510532219575465e-05, "epoch": 0.5317058485453898, "percentage": 53.17, "elapsed_time": "3 days, 17:23:15", "remaining_time": "3 days, 6:42:48", "throughput": 2723.74, "total_tokens": 876488256} {"current_steps": 4858, "total_steps": 9134, "loss": 0.8563, "learning_rate": 2.2501976482500823e-05, "epoch": 0.5318153206163277, "percentage": 53.19, "elapsed_time": "3 days, 17:24:25", "remaining_time": "3 days, 6:41:45", "throughput": 2723.85, "total_tokens": 876711360} {"current_steps": 4859, "total_steps": 9134, "loss": 0.8203, "learning_rate": 2.2493421040937585e-05, "epoch": 0.5319247926872657, "percentage": 53.2, "elapsed_time": "3 days, 17:25:34", "remaining_time": "3 days, 6:40:41", "throughput": 2723.91, "total_tokens": 876921472} {"current_steps": 4860, "total_steps": 9134, "loss": 0.7309, "learning_rate": 2.248486589589785e-05, "epoch": 0.5320342647582036, "percentage": 53.21, "elapsed_time": "3 days, 17:26:35", "remaining_time": "3 days, 6:39:30", "throughput": 2723.88, "total_tokens": 877076928} {"current_steps": 4861, "total_steps": 9134, "loss": 0.8316, "learning_rate": 2.2476311048393666e-05, "epoch": 0.5321437368291415, "percentage": 53.22, "elapsed_time": "3 days, 17:27:43", "remaining_time": "3 days, 6:38:25", "throughput": 2723.9, "total_tokens": 877270240} {"current_steps": 4862, "total_steps": 9134, "loss": 0.8748, "learning_rate": 2.246775649943707e-05, "epoch": 0.5322532089000793, "percentage": 53.23, "elapsed_time": "3 days, 17:28:49", "remaining_time": "3 days, 6:37:19", "throughput": 2723.91, "total_tokens": 877451680} {"current_steps": 4863, "total_steps": 9134, "loss": 0.7787, "learning_rate": 2.2459202250040032e-05, "epoch": 0.5323626809710172, "percentage": 53.24, "elapsed_time": "3 days, 17:29:53", "remaining_time": "3 days, 6:36:11", "throughput": 2723.84, "total_tokens": 877605344} {"current_steps": 4864, "total_steps": 9134, "loss": 0.7077, "learning_rate": 2.2450648301214517e-05, "epoch": 0.5324721530419552, "percentage": 53.25, "elapsed_time": "3 days, 17:31:00", "remaining_time": "3 days, 6:35:05", "throughput": 2723.85, "total_tokens": 877791040} {"current_steps": 4865, "total_steps": 9134, "loss": 0.8287, "learning_rate": 2.2442094653972428e-05, "epoch": 0.5325816251128931, "percentage": 53.26, "elapsed_time": "3 days, 17:32:08", "remaining_time": "3 days, 6:34:00", "throughput": 2723.81, "total_tokens": 877963296} {"current_steps": 4866, "total_steps": 9134, "loss": 0.6878, "learning_rate": 2.243354130932565e-05, "epoch": 0.532691097183831, "percentage": 53.27, "elapsed_time": "3 days, 17:33:16", "remaining_time": "3 days, 6:32:56", "throughput": 2723.77, "total_tokens": 878135104} {"current_steps": 4867, "total_steps": 9134, "loss": 0.7541, "learning_rate": 2.242498826828604e-05, "epoch": 0.5328005692547689, "percentage": 53.28, "elapsed_time": "3 days, 17:34:23", "remaining_time": "3 days, 6:31:50", "throughput": 2723.79, "total_tokens": 878321920} {"current_steps": 4868, "total_steps": 9134, "loss": 0.7641, "learning_rate": 2.241643553186538e-05, "epoch": 0.5329100413257067, "percentage": 53.3, "elapsed_time": "3 days, 17:35:31", "remaining_time": "3 days, 6:30:45", "throughput": 2723.81, "total_tokens": 878513440} {"current_steps": 4869, "total_steps": 9134, "loss": 0.4879, "learning_rate": 2.240788310107547e-05, "epoch": 0.5330195133966447, "percentage": 53.31, "elapsed_time": "3 days, 17:36:39", "remaining_time": "3 days, 6:29:40", "throughput": 2723.79, "total_tokens": 878692864} {"current_steps": 4870, "total_steps": 9134, "loss": 0.8938, "learning_rate": 2.2399330976928028e-05, "epoch": 0.5331289854675826, "percentage": 53.32, "elapsed_time": "3 days, 17:37:48", "remaining_time": "3 days, 6:28:36", "throughput": 2723.79, "total_tokens": 878879456} {"current_steps": 4871, "total_steps": 9134, "loss": 0.5721, "learning_rate": 2.2390779160434767e-05, "epoch": 0.5332384575385205, "percentage": 53.33, "elapsed_time": "3 days, 17:38:54", "remaining_time": "3 days, 6:27:30", "throughput": 2723.81, "total_tokens": 879064928} {"current_steps": 4872, "total_steps": 9134, "loss": 0.7968, "learning_rate": 2.2382227652607333e-05, "epoch": 0.5333479296094584, "percentage": 53.34, "elapsed_time": "3 days, 17:40:02", "remaining_time": "3 days, 6:26:26", "throughput": 2723.86, "total_tokens": 879269664} {"current_steps": 4873, "total_steps": 9134, "loss": 0.6469, "learning_rate": 2.2373676454457364e-05, "epoch": 0.5334574016803962, "percentage": 53.35, "elapsed_time": "3 days, 17:41:12", "remaining_time": "3 days, 6:25:22", "throughput": 2723.85, "total_tokens": 879455360} {"current_steps": 4874, "total_steps": 9134, "loss": 0.7378, "learning_rate": 2.2365125566996457e-05, "epoch": 0.5335668737513342, "percentage": 53.36, "elapsed_time": "3 days, 17:42:19", "remaining_time": "3 days, 6:24:17", "throughput": 2723.91, "total_tokens": 879658976} {"current_steps": 4875, "total_steps": 9134, "loss": 0.8755, "learning_rate": 2.2356574991236154e-05, "epoch": 0.5336763458222721, "percentage": 53.37, "elapsed_time": "3 days, 17:43:21", "remaining_time": "3 days, 6:23:07", "throughput": 2723.84, "total_tokens": 879803008} {"current_steps": 4876, "total_steps": 9134, "loss": 0.7691, "learning_rate": 2.2348024728187983e-05, "epoch": 0.53378581789321, "percentage": 53.38, "elapsed_time": "3 days, 17:44:30", "remaining_time": "3 days, 6:22:03", "throughput": 2723.9, "total_tokens": 880011776} {"current_steps": 4877, "total_steps": 9134, "loss": 0.5424, "learning_rate": 2.2339474778863408e-05, "epoch": 0.5338952899641479, "percentage": 53.39, "elapsed_time": "3 days, 17:45:38", "remaining_time": "3 days, 6:20:59", "throughput": 2723.95, "total_tokens": 880214720} {"current_steps": 4878, "total_steps": 9134, "loss": 0.7147, "learning_rate": 2.2330925144273884e-05, "epoch": 0.5340047620350858, "percentage": 53.4, "elapsed_time": "3 days, 17:46:45", "remaining_time": "3 days, 6:19:53", "throughput": 2723.92, "total_tokens": 880385856} {"current_steps": 4879, "total_steps": 9134, "loss": 0.6893, "learning_rate": 2.2322375825430815e-05, "epoch": 0.5341142341060237, "percentage": 53.42, "elapsed_time": "3 days, 17:47:49", "remaining_time": "3 days, 6:18:44", "throughput": 2723.9, "total_tokens": 880555200} {"current_steps": 4880, "total_steps": 9134, "loss": 0.6847, "learning_rate": 2.231382682334556e-05, "epoch": 0.5342237061769616, "percentage": 53.43, "elapsed_time": "3 days, 17:48:57", "remaining_time": "3 days, 6:17:39", "throughput": 2723.94, "total_tokens": 880750752} {"current_steps": 4881, "total_steps": 9134, "loss": 0.7432, "learning_rate": 2.2305278139029465e-05, "epoch": 0.5343331782478995, "percentage": 53.44, "elapsed_time": "3 days, 17:50:00", "remaining_time": "3 days, 6:16:31", "throughput": 2723.91, "total_tokens": 880914272} {"current_steps": 4882, "total_steps": 9134, "loss": 0.9886, "learning_rate": 2.2296729773493806e-05, "epoch": 0.5344426503188374, "percentage": 53.45, "elapsed_time": "3 days, 17:51:04", "remaining_time": "3 days, 6:15:22", "throughput": 2723.9, "total_tokens": 881082720} {"current_steps": 4883, "total_steps": 9134, "loss": 0.8082, "learning_rate": 2.228818172774986e-05, "epoch": 0.5345521223897753, "percentage": 53.46, "elapsed_time": "3 days, 17:52:13", "remaining_time": "3 days, 6:14:18", "throughput": 2723.97, "total_tokens": 881295968} {"current_steps": 4884, "total_steps": 9134, "loss": 0.5442, "learning_rate": 2.2279634002808818e-05, "epoch": 0.5346615944607133, "percentage": 53.47, "elapsed_time": "3 days, 17:53:15", "remaining_time": "3 days, 6:13:09", "throughput": 2723.92, "total_tokens": 881448064} {"current_steps": 4885, "total_steps": 9134, "loss": 0.6449, "learning_rate": 2.2271086599681887e-05, "epoch": 0.5347710665316511, "percentage": 53.48, "elapsed_time": "3 days, 17:54:19", "remaining_time": "3 days, 6:12:00", "throughput": 2723.9, "total_tokens": 881614944} {"current_steps": 4886, "total_steps": 9134, "loss": 0.7576, "learning_rate": 2.2262539519380182e-05, "epoch": 0.534880538602589, "percentage": 53.49, "elapsed_time": "3 days, 17:55:25", "remaining_time": "3 days, 6:10:54", "throughput": 2723.86, "total_tokens": 881781152} {"current_steps": 4887, "total_steps": 9134, "loss": 0.8247, "learning_rate": 2.225399276291482e-05, "epoch": 0.5349900106735269, "percentage": 53.5, "elapsed_time": "3 days, 17:56:33", "remaining_time": "3 days, 6:09:49", "throughput": 2723.92, "total_tokens": 881989472} {"current_steps": 4888, "total_steps": 9134, "loss": 0.6711, "learning_rate": 2.2245446331296874e-05, "epoch": 0.5350994827444648, "percentage": 53.51, "elapsed_time": "3 days, 17:57:39", "remaining_time": "3 days, 6:08:43", "throughput": 2723.87, "total_tokens": 882151872} {"current_steps": 4889, "total_steps": 9134, "loss": 0.6098, "learning_rate": 2.223690022553735e-05, "epoch": 0.5352089548154028, "percentage": 53.53, "elapsed_time": "3 days, 17:58:48", "remaining_time": "3 days, 6:07:38", "throughput": 2723.93, "total_tokens": 882358176} {"current_steps": 4890, "total_steps": 9134, "loss": 0.6655, "learning_rate": 2.2228354446647252e-05, "epoch": 0.5353184268863406, "percentage": 53.54, "elapsed_time": "3 days, 17:59:56", "remaining_time": "3 days, 6:06:34", "throughput": 2723.93, "total_tokens": 882541632} {"current_steps": 4891, "total_steps": 9134, "loss": 0.6633, "learning_rate": 2.2219808995637524e-05, "epoch": 0.5354278989572785, "percentage": 53.55, "elapsed_time": "3 days, 18:01:04", "remaining_time": "3 days, 6:05:29", "throughput": 2723.92, "total_tokens": 882725760} {"current_steps": 4892, "total_steps": 9134, "loss": 0.9358, "learning_rate": 2.2211263873519082e-05, "epoch": 0.5355373710282164, "percentage": 53.56, "elapsed_time": "3 days, 18:02:13", "remaining_time": "3 days, 6:04:26", "throughput": 2723.94, "total_tokens": 882919968} {"current_steps": 4893, "total_steps": 9134, "loss": 0.6534, "learning_rate": 2.2202719081302785e-05, "epoch": 0.5356468430991543, "percentage": 53.57, "elapsed_time": "3 days, 18:03:19", "remaining_time": "3 days, 6:03:19", "throughput": 2723.92, "total_tokens": 883092224} {"current_steps": 4894, "total_steps": 9134, "loss": 0.8227, "learning_rate": 2.219417461999947e-05, "epoch": 0.5357563151700923, "percentage": 53.58, "elapsed_time": "3 days, 18:04:25", "remaining_time": "3 days, 6:02:12", "throughput": 2723.97, "total_tokens": 883288448} {"current_steps": 4895, "total_steps": 9134, "loss": 0.9085, "learning_rate": 2.218563049061995e-05, "epoch": 0.5358657872410302, "percentage": 53.59, "elapsed_time": "3 days, 18:05:32", "remaining_time": "3 days, 6:01:07", "throughput": 2723.98, "total_tokens": 883475488} {"current_steps": 4896, "total_steps": 9134, "loss": 0.6109, "learning_rate": 2.217708669417495e-05, "epoch": 0.535975259311968, "percentage": 53.6, "elapsed_time": "3 days, 18:06:34", "remaining_time": "3 days, 5:59:57", "throughput": 2723.9, "total_tokens": 883618400} {"current_steps": 4897, "total_steps": 9134, "loss": 0.7116, "learning_rate": 2.2168543231675204e-05, "epoch": 0.5360847313829059, "percentage": 53.61, "elapsed_time": "3 days, 18:07:38", "remaining_time": "3 days, 5:58:48", "throughput": 2723.9, "total_tokens": 883790432} {"current_steps": 4898, "total_steps": 9134, "loss": 0.6061, "learning_rate": 2.2160000104131372e-05, "epoch": 0.5361942034538438, "percentage": 53.62, "elapsed_time": "3 days, 18:08:34", "remaining_time": "3 days, 5:57:34", "throughput": 2723.81, "total_tokens": 883917440} {"current_steps": 4899, "total_steps": 9134, "loss": 0.8024, "learning_rate": 2.215145731255411e-05, "epoch": 0.5363036755247818, "percentage": 53.63, "elapsed_time": "3 days, 18:09:41", "remaining_time": "3 days, 5:56:28", "throughput": 2723.8, "total_tokens": 884096640} {"current_steps": 4900, "total_steps": 9134, "loss": 0.6452, "learning_rate": 2.2142914857953993e-05, "epoch": 0.5364131475957197, "percentage": 53.65, "elapsed_time": "3 days, 18:10:49", "remaining_time": "3 days, 5:55:23", "throughput": 2723.77, "total_tokens": 884271136} {"current_steps": 4901, "total_steps": 9134, "loss": 0.6526, "learning_rate": 2.2134372741341585e-05, "epoch": 0.5365226196666576, "percentage": 53.66, "elapsed_time": "3 days, 18:11:58", "remaining_time": "3 days, 5:54:20", "throughput": 2723.84, "total_tokens": 884481696} {"current_steps": 4902, "total_steps": 9134, "loss": 0.858, "learning_rate": 2.2125830963727412e-05, "epoch": 0.5366320917375954, "percentage": 53.67, "elapsed_time": "3 days, 18:13:05", "remaining_time": "3 days, 5:53:14", "throughput": 2723.78, "total_tokens": 884645216} {"current_steps": 4903, "total_steps": 9134, "loss": 0.685, "learning_rate": 2.2117289526121934e-05, "epoch": 0.5367415638085333, "percentage": 53.68, "elapsed_time": "3 days, 18:14:13", "remaining_time": "3 days, 5:52:09", "throughput": 2723.8, "total_tokens": 884837184} {"current_steps": 4904, "total_steps": 9134, "loss": 0.8191, "learning_rate": 2.2108748429535603e-05, "epoch": 0.5368510358794713, "percentage": 53.69, "elapsed_time": "3 days, 18:15:20", "remaining_time": "3 days, 5:51:03", "throughput": 2723.77, "total_tokens": 885007872} {"current_steps": 4905, "total_steps": 9134, "loss": 0.7797, "learning_rate": 2.21002076749788e-05, "epoch": 0.5369605079504092, "percentage": 53.7, "elapsed_time": "3 days, 18:16:29", "remaining_time": "3 days, 5:49:59", "throughput": 2723.83, "total_tokens": 885215072} {"current_steps": 4906, "total_steps": 9134, "loss": 0.7178, "learning_rate": 2.209166726346189e-05, "epoch": 0.5370699800213471, "percentage": 53.71, "elapsed_time": "3 days, 18:17:33", "remaining_time": "3 days, 5:48:51", "throughput": 2723.83, "total_tokens": 885391136} {"current_steps": 4907, "total_steps": 9134, "loss": 0.8455, "learning_rate": 2.2083127195995176e-05, "epoch": 0.5371794520922849, "percentage": 53.72, "elapsed_time": "3 days, 18:18:40", "remaining_time": "3 days, 5:47:46", "throughput": 2723.77, "total_tokens": 885553536} {"current_steps": 4908, "total_steps": 9134, "loss": 0.718, "learning_rate": 2.2074587473588936e-05, "epoch": 0.5372889241632228, "percentage": 53.73, "elapsed_time": "3 days, 18:19:45", "remaining_time": "3 days, 5:46:38", "throughput": 2723.76, "total_tokens": 885725792} {"current_steps": 4909, "total_steps": 9134, "loss": 0.7993, "learning_rate": 2.206604809725342e-05, "epoch": 0.5373983962341607, "percentage": 53.74, "elapsed_time": "3 days, 18:20:53", "remaining_time": "3 days, 5:45:33", "throughput": 2723.81, "total_tokens": 885928960} {"current_steps": 4910, "total_steps": 9134, "loss": 0.7634, "learning_rate": 2.205750906799879e-05, "epoch": 0.5375078683050987, "percentage": 53.76, "elapsed_time": "3 days, 18:21:59", "remaining_time": "3 days, 5:44:27", "throughput": 2723.83, "total_tokens": 886114208} {"current_steps": 4911, "total_steps": 9134, "loss": 0.5729, "learning_rate": 2.204897038683522e-05, "epoch": 0.5376173403760366, "percentage": 53.77, "elapsed_time": "3 days, 18:23:03", "remaining_time": "3 days, 5:43:19", "throughput": 2723.82, "total_tokens": 886288032} {"current_steps": 4912, "total_steps": 9134, "loss": 0.8703, "learning_rate": 2.2040432054772807e-05, "epoch": 0.5377268124469745, "percentage": 53.78, "elapsed_time": "3 days, 18:24:12", "remaining_time": "3 days, 5:42:15", "throughput": 2723.87, "total_tokens": 886492992} {"current_steps": 4913, "total_steps": 9134, "loss": 0.6991, "learning_rate": 2.2031894072821633e-05, "epoch": 0.5378362845179123, "percentage": 53.79, "elapsed_time": "3 days, 18:25:20", "remaining_time": "3 days, 5:41:10", "throughput": 2723.83, "total_tokens": 886663904} {"current_steps": 4914, "total_steps": 9134, "loss": 0.5344, "learning_rate": 2.2023356441991712e-05, "epoch": 0.5379457565888502, "percentage": 53.8, "elapsed_time": "3 days, 18:26:24", "remaining_time": "3 days, 5:40:02", "throughput": 2723.83, "total_tokens": 886837056} {"current_steps": 4915, "total_steps": 9134, "loss": 0.6827, "learning_rate": 2.2014819163293028e-05, "epoch": 0.5380552286597882, "percentage": 53.81, "elapsed_time": "3 days, 18:27:30", "remaining_time": "3 days, 5:38:55", "throughput": 2723.76, "total_tokens": 886992960} {"current_steps": 4916, "total_steps": 9134, "loss": 0.7791, "learning_rate": 2.200628223773554e-05, "epoch": 0.5381647007307261, "percentage": 53.82, "elapsed_time": "3 days, 18:28:37", "remaining_time": "3 days, 5:37:50", "throughput": 2723.73, "total_tokens": 887167904} {"current_steps": 4917, "total_steps": 9134, "loss": 0.8381, "learning_rate": 2.199774566632913e-05, "epoch": 0.538274172801664, "percentage": 53.83, "elapsed_time": "3 days, 18:29:45", "remaining_time": "3 days, 5:36:45", "throughput": 2723.76, "total_tokens": 887362560} {"current_steps": 4918, "total_steps": 9134, "loss": 1.0244, "learning_rate": 2.198920945008368e-05, "epoch": 0.5383836448726019, "percentage": 53.84, "elapsed_time": "3 days, 18:30:53", "remaining_time": "3 days, 5:35:41", "throughput": 2723.83, "total_tokens": 887569088} {"current_steps": 4919, "total_steps": 9134, "loss": 0.5345, "learning_rate": 2.198067359000899e-05, "epoch": 0.5384931169435397, "percentage": 53.85, "elapsed_time": "3 days, 18:32:01", "remaining_time": "3 days, 5:34:36", "throughput": 2723.85, "total_tokens": 887761504} {"current_steps": 4920, "total_steps": 9134, "loss": 0.6864, "learning_rate": 2.1972138087114835e-05, "epoch": 0.5386025890144777, "percentage": 53.86, "elapsed_time": "3 days, 18:33:04", "remaining_time": "3 days, 5:33:27", "throughput": 2723.8, "total_tokens": 887918752} {"current_steps": 4921, "total_steps": 9134, "loss": 0.5941, "learning_rate": 2.1963602942410968e-05, "epoch": 0.5387120610854156, "percentage": 53.88, "elapsed_time": "3 days, 18:34:09", "remaining_time": "3 days, 5:32:20", "throughput": 2723.78, "total_tokens": 888087200} {"current_steps": 4922, "total_steps": 9134, "loss": 0.7483, "learning_rate": 2.195506815690706e-05, "epoch": 0.5388215331563535, "percentage": 53.89, "elapsed_time": "3 days, 18:35:19", "remaining_time": "3 days, 5:31:16", "throughput": 2723.86, "total_tokens": 888303808} {"current_steps": 4923, "total_steps": 9134, "loss": 0.5528, "learning_rate": 2.1946533731612773e-05, "epoch": 0.5389310052272914, "percentage": 53.9, "elapsed_time": "3 days, 18:36:22", "remaining_time": "3 days, 5:30:07", "throughput": 2723.82, "total_tokens": 888461952} {"current_steps": 4924, "total_steps": 9134, "loss": 0.7557, "learning_rate": 2.1937999667537704e-05, "epoch": 0.5390404772982292, "percentage": 53.91, "elapsed_time": "3 days, 18:37:25", "remaining_time": "3 days, 5:28:58", "throughput": 2723.83, "total_tokens": 888637120} {"current_steps": 4925, "total_steps": 9134, "loss": 0.7313, "learning_rate": 2.192946596569143e-05, "epoch": 0.5391499493691672, "percentage": 53.92, "elapsed_time": "3 days, 18:38:31", "remaining_time": "3 days, 5:27:51", "throughput": 2723.88, "total_tokens": 888831776} {"current_steps": 4926, "total_steps": 9134, "loss": 0.622, "learning_rate": 2.192093262708345e-05, "epoch": 0.5392594214401051, "percentage": 53.93, "elapsed_time": "3 days, 18:39:37", "remaining_time": "3 days, 5:26:45", "throughput": 2723.9, "total_tokens": 889020384} {"current_steps": 4927, "total_steps": 9134, "loss": 0.668, "learning_rate": 2.1912399652723255e-05, "epoch": 0.539368893511043, "percentage": 53.94, "elapsed_time": "3 days, 18:40:44", "remaining_time": "3 days, 5:25:40", "throughput": 2723.94, "total_tokens": 889217056} {"current_steps": 4928, "total_steps": 9134, "loss": 0.78, "learning_rate": 2.190386704362029e-05, "epoch": 0.5394783655819809, "percentage": 53.95, "elapsed_time": "3 days, 18:41:51", "remaining_time": "3 days, 5:24:34", "throughput": 2723.94, "total_tokens": 889398720} {"current_steps": 4929, "total_steps": 9134, "loss": 0.7584, "learning_rate": 2.1895334800783925e-05, "epoch": 0.5395878376529188, "percentage": 53.96, "elapsed_time": "3 days, 18:42:59", "remaining_time": "3 days, 5:23:29", "throughput": 2723.99, "total_tokens": 889598976} {"current_steps": 4930, "total_steps": 9134, "loss": 0.7702, "learning_rate": 2.188680292522353e-05, "epoch": 0.5396973097238567, "percentage": 53.97, "elapsed_time": "3 days, 18:44:08", "remaining_time": "3 days, 5:22:25", "throughput": 2724.05, "total_tokens": 889806400} {"current_steps": 4931, "total_steps": 9134, "loss": 0.6694, "learning_rate": 2.1878271417948385e-05, "epoch": 0.5398067817947946, "percentage": 53.99, "elapsed_time": "3 days, 18:45:17", "remaining_time": "3 days, 5:21:21", "throughput": 2724.14, "total_tokens": 890024128} {"current_steps": 4932, "total_steps": 9134, "loss": 0.7419, "learning_rate": 2.1869740279967768e-05, "epoch": 0.5399162538657325, "percentage": 54.0, "elapsed_time": "3 days, 18:46:25", "remaining_time": "3 days, 5:20:16", "throughput": 2724.13, "total_tokens": 890206912} {"current_steps": 4933, "total_steps": 9134, "loss": 1.0243, "learning_rate": 2.1861209512290888e-05, "epoch": 0.5400257259366704, "percentage": 54.01, "elapsed_time": "3 days, 18:47:32", "remaining_time": "3 days, 5:19:11", "throughput": 2724.1, "total_tokens": 890378272} {"current_steps": 4934, "total_steps": 9134, "loss": 0.7983, "learning_rate": 2.1852679115926926e-05, "epoch": 0.5401351980076083, "percentage": 54.02, "elapsed_time": "3 days, 18:48:38", "remaining_time": "3 days, 5:18:05", "throughput": 2724.07, "total_tokens": 890549856} {"current_steps": 4935, "total_steps": 9134, "loss": 0.7991, "learning_rate": 2.184414909188501e-05, "epoch": 0.5402446700785463, "percentage": 54.03, "elapsed_time": "3 days, 18:49:42", "remaining_time": "3 days, 5:16:56", "throughput": 2723.98, "total_tokens": 890693440} {"current_steps": 4936, "total_steps": 9134, "loss": 0.851, "learning_rate": 2.1835619441174214e-05, "epoch": 0.5403541421494841, "percentage": 54.04, "elapsed_time": "3 days, 18:50:49", "remaining_time": "3 days, 5:15:51", "throughput": 2723.95, "total_tokens": 890868832} {"current_steps": 4937, "total_steps": 9134, "loss": 0.8924, "learning_rate": 2.1827090164803605e-05, "epoch": 0.540463614220422, "percentage": 54.05, "elapsed_time": "3 days, 18:51:56", "remaining_time": "3 days, 5:14:45", "throughput": 2723.96, "total_tokens": 891052512} {"current_steps": 4938, "total_steps": 9134, "loss": 0.5744, "learning_rate": 2.181856126378215e-05, "epoch": 0.5405730862913599, "percentage": 54.06, "elapsed_time": "3 days, 18:53:03", "remaining_time": "3 days, 5:13:39", "throughput": 2724.03, "total_tokens": 891258592} {"current_steps": 4939, "total_steps": 9134, "loss": 0.7564, "learning_rate": 2.181003273911883e-05, "epoch": 0.5406825583622978, "percentage": 54.07, "elapsed_time": "3 days, 18:54:12", "remaining_time": "3 days, 5:12:36", "throughput": 2724.09, "total_tokens": 891467136} {"current_steps": 4940, "total_steps": 9134, "loss": 0.6313, "learning_rate": 2.1801504591822526e-05, "epoch": 0.5407920304332358, "percentage": 54.08, "elapsed_time": "3 days, 18:55:19", "remaining_time": "3 days, 5:11:30", "throughput": 2724.12, "total_tokens": 891658656} {"current_steps": 4941, "total_steps": 9134, "loss": 0.8119, "learning_rate": 2.179297682290211e-05, "epoch": 0.5409015025041736, "percentage": 54.09, "elapsed_time": "3 days, 18:56:22", "remaining_time": "3 days, 5:10:21", "throughput": 2724.1, "total_tokens": 891823520} {"current_steps": 4942, "total_steps": 9134, "loss": 0.6588, "learning_rate": 2.178444943336642e-05, "epoch": 0.5410109745751115, "percentage": 54.11, "elapsed_time": "3 days, 18:57:31", "remaining_time": "3 days, 5:09:17", "throughput": 2724.1, "total_tokens": 892011456} {"current_steps": 4943, "total_steps": 9134, "loss": 0.5618, "learning_rate": 2.1775922424224203e-05, "epoch": 0.5411204466460494, "percentage": 54.12, "elapsed_time": "3 days, 18:58:37", "remaining_time": "3 days, 5:08:10", "throughput": 2724.12, "total_tokens": 892196928} {"current_steps": 4944, "total_steps": 9134, "loss": 0.7244, "learning_rate": 2.1767395796484207e-05, "epoch": 0.5412299187169873, "percentage": 54.13, "elapsed_time": "3 days, 18:59:37", "remaining_time": "3 days, 5:06:58", "throughput": 2724.04, "total_tokens": 892331776} {"current_steps": 4945, "total_steps": 9134, "loss": 0.5291, "learning_rate": 2.17588695511551e-05, "epoch": 0.5413393907879253, "percentage": 54.14, "elapsed_time": "3 days, 19:00:45", "remaining_time": "3 days, 5:05:54", "throughput": 2724.06, "total_tokens": 892524192} {"current_steps": 4946, "total_steps": 9134, "loss": 0.7808, "learning_rate": 2.1750343689245544e-05, "epoch": 0.5414488628588632, "percentage": 54.15, "elapsed_time": "3 days, 19:01:50", "remaining_time": "3 days, 5:04:46", "throughput": 2724.04, "total_tokens": 892695104} {"current_steps": 4947, "total_steps": 9134, "loss": 0.6706, "learning_rate": 2.1741818211764103e-05, "epoch": 0.541558334929801, "percentage": 54.16, "elapsed_time": "3 days, 19:02:56", "remaining_time": "3 days, 5:03:40", "throughput": 2724.03, "total_tokens": 892873632} {"current_steps": 4948, "total_steps": 9134, "loss": 0.7458, "learning_rate": 2.173329311971934e-05, "epoch": 0.5416678070007389, "percentage": 54.17, "elapsed_time": "3 days, 19:03:56", "remaining_time": "3 days, 5:02:29", "throughput": 2723.96, "total_tokens": 893013856} {"current_steps": 4949, "total_steps": 9134, "loss": 0.5248, "learning_rate": 2.1724768414119766e-05, "epoch": 0.5417772790716768, "percentage": 54.18, "elapsed_time": "3 days, 19:04:57", "remaining_time": "3 days, 5:01:18", "throughput": 2723.93, "total_tokens": 893171328} {"current_steps": 4950, "total_steps": 9134, "loss": 0.6172, "learning_rate": 2.171624409597382e-05, "epoch": 0.5418867511426148, "percentage": 54.19, "elapsed_time": "3 days, 19:06:06", "remaining_time": "3 days, 5:00:14", "throughput": 2724.0, "total_tokens": 893381888} {"current_steps": 4951, "total_steps": 9134, "loss": 0.9146, "learning_rate": 2.170772016628993e-05, "epoch": 0.5419962232135527, "percentage": 54.2, "elapsed_time": "3 days, 19:07:15", "remaining_time": "3 days, 4:59:10", "throughput": 2723.98, "total_tokens": 893562208} {"current_steps": 4952, "total_steps": 9134, "loss": 0.7089, "learning_rate": 2.1699196626076437e-05, "epoch": 0.5421056952844906, "percentage": 54.22, "elapsed_time": "3 days, 19:08:18", "remaining_time": "3 days, 4:58:01", "throughput": 2724.0, "total_tokens": 893741856} {"current_steps": 4953, "total_steps": 9134, "loss": 0.6406, "learning_rate": 2.169067347634168e-05, "epoch": 0.5422151673554284, "percentage": 54.23, "elapsed_time": "3 days, 19:09:23", "remaining_time": "3 days, 4:56:54", "throughput": 2724.0, "total_tokens": 893917472} {"current_steps": 4954, "total_steps": 9134, "loss": 0.6338, "learning_rate": 2.168215071809392e-05, "epoch": 0.5423246394263663, "percentage": 54.24, "elapsed_time": "3 days, 19:10:30", "remaining_time": "3 days, 4:55:48", "throughput": 2723.98, "total_tokens": 894091968} {"current_steps": 4955, "total_steps": 9134, "loss": 0.7927, "learning_rate": 2.167362835234139e-05, "epoch": 0.5424341114973042, "percentage": 54.25, "elapsed_time": "3 days, 19:11:36", "remaining_time": "3 days, 4:54:41", "throughput": 2723.97, "total_tokens": 894268256} {"current_steps": 4956, "total_steps": 9134, "loss": 0.5165, "learning_rate": 2.166510638009227e-05, "epoch": 0.5425435835682422, "percentage": 54.26, "elapsed_time": "3 days, 19:12:41", "remaining_time": "3 days, 4:53:34", "throughput": 2723.93, "total_tokens": 894431776} {"current_steps": 4957, "total_steps": 9134, "loss": 0.6557, "learning_rate": 2.1656584802354678e-05, "epoch": 0.5426530556391801, "percentage": 54.27, "elapsed_time": "3 days, 19:13:49", "remaining_time": "3 days, 4:52:29", "throughput": 2723.92, "total_tokens": 894613216} {"current_steps": 4958, "total_steps": 9134, "loss": 0.7383, "learning_rate": 2.1648063620136733e-05, "epoch": 0.5427625277101179, "percentage": 54.28, "elapsed_time": "3 days, 19:14:55", "remaining_time": "3 days, 4:51:23", "throughput": 2723.96, "total_tokens": 894808096} {"current_steps": 4959, "total_steps": 9134, "loss": 0.4883, "learning_rate": 2.1639542834446434e-05, "epoch": 0.5428719997810558, "percentage": 54.29, "elapsed_time": "3 days, 19:16:01", "remaining_time": "3 days, 4:50:16", "throughput": 2723.95, "total_tokens": 894985280} {"current_steps": 4960, "total_steps": 9134, "loss": 0.7986, "learning_rate": 2.163102244629181e-05, "epoch": 0.5429814718519937, "percentage": 54.3, "elapsed_time": "3 days, 19:17:08", "remaining_time": "3 days, 4:49:11", "throughput": 2723.97, "total_tokens": 895175232} {"current_steps": 4961, "total_steps": 9134, "loss": 0.5528, "learning_rate": 2.162250245668078e-05, "epoch": 0.5430909439229317, "percentage": 54.31, "elapsed_time": "3 days, 19:18:14", "remaining_time": "3 days, 4:48:05", "throughput": 2723.93, "total_tokens": 895342560} {"current_steps": 4962, "total_steps": 9134, "loss": 0.5849, "learning_rate": 2.1613982866621252e-05, "epoch": 0.5432004159938696, "percentage": 54.32, "elapsed_time": "3 days, 19:19:13", "remaining_time": "3 days, 4:46:52", "throughput": 2723.84, "total_tokens": 895472256} {"current_steps": 4963, "total_steps": 9134, "loss": 0.5903, "learning_rate": 2.1605463677121086e-05, "epoch": 0.5433098880648075, "percentage": 54.34, "elapsed_time": "3 days, 19:20:21", "remaining_time": "3 days, 4:45:47", "throughput": 2723.85, "total_tokens": 895659520} {"current_steps": 4964, "total_steps": 9134, "loss": 0.805, "learning_rate": 2.159694488918807e-05, "epoch": 0.5434193601357453, "percentage": 54.35, "elapsed_time": "3 days, 19:21:27", "remaining_time": "3 days, 4:44:41", "throughput": 2723.9, "total_tokens": 895858208} {"current_steps": 4965, "total_steps": 9134, "loss": 0.7356, "learning_rate": 2.158842650382997e-05, "epoch": 0.5435288322066832, "percentage": 54.36, "elapsed_time": "3 days, 19:22:34", "remaining_time": "3 days, 4:43:35", "throughput": 2723.92, "total_tokens": 896044800} {"current_steps": 4966, "total_steps": 9134, "loss": 0.8172, "learning_rate": 2.157990852205449e-05, "epoch": 0.5436383042776212, "percentage": 54.37, "elapsed_time": "3 days, 19:23:41", "remaining_time": "3 days, 4:42:30", "throughput": 2723.94, "total_tokens": 896234304} {"current_steps": 4967, "total_steps": 9134, "loss": 0.9159, "learning_rate": 2.1571390944869306e-05, "epoch": 0.5437477763485591, "percentage": 54.38, "elapsed_time": "3 days, 19:24:44", "remaining_time": "3 days, 4:41:21", "throughput": 2723.91, "total_tokens": 896397376} {"current_steps": 4968, "total_steps": 9134, "loss": 1.0406, "learning_rate": 2.1562873773282005e-05, "epoch": 0.543857248419497, "percentage": 54.39, "elapsed_time": "3 days, 19:25:51", "remaining_time": "3 days, 4:40:15", "throughput": 2723.96, "total_tokens": 896594944} {"current_steps": 4969, "total_steps": 9134, "loss": 0.6399, "learning_rate": 2.1554357008300164e-05, "epoch": 0.5439667204904349, "percentage": 54.4, "elapsed_time": "3 days, 19:26:51", "remaining_time": "3 days, 4:39:03", "throughput": 2723.91, "total_tokens": 896740992} {"current_steps": 4970, "total_steps": 9134, "loss": 0.7745, "learning_rate": 2.1545840650931317e-05, "epoch": 0.5440761925613727, "percentage": 54.41, "elapsed_time": "3 days, 19:28:00", "remaining_time": "3 days, 4:38:00", "throughput": 2723.93, "total_tokens": 896937888} {"current_steps": 4971, "total_steps": 9134, "loss": 0.8711, "learning_rate": 2.1537324702182907e-05, "epoch": 0.5441856646323107, "percentage": 54.42, "elapsed_time": "3 days, 19:29:06", "remaining_time": "3 days, 4:36:53", "throughput": 2723.95, "total_tokens": 897123136} {"current_steps": 4972, "total_steps": 9134, "loss": 0.6281, "learning_rate": 2.1528809163062375e-05, "epoch": 0.5442951367032486, "percentage": 54.43, "elapsed_time": "3 days, 19:30:13", "remaining_time": "3 days, 4:35:48", "throughput": 2724.0, "total_tokens": 897322272} {"current_steps": 4973, "total_steps": 9134, "loss": 0.6747, "learning_rate": 2.1520294034577072e-05, "epoch": 0.5444046087741865, "percentage": 54.44, "elapsed_time": "3 days, 19:31:21", "remaining_time": "3 days, 4:34:42", "throughput": 2724.02, "total_tokens": 897513120} {"current_steps": 4974, "total_steps": 9134, "loss": 0.8038, "learning_rate": 2.1511779317734336e-05, "epoch": 0.5445140808451244, "percentage": 54.46, "elapsed_time": "3 days, 19:32:26", "remaining_time": "3 days, 4:33:36", "throughput": 2724.04, "total_tokens": 897697472} {"current_steps": 4975, "total_steps": 9134, "loss": 0.6547, "learning_rate": 2.1503265013541433e-05, "epoch": 0.5446235529160622, "percentage": 54.47, "elapsed_time": "3 days, 19:33:32", "remaining_time": "3 days, 4:32:29", "throughput": 2723.99, "total_tokens": 897860320} {"current_steps": 4976, "total_steps": 9134, "loss": 0.8771, "learning_rate": 2.1494751123005605e-05, "epoch": 0.5447330249870002, "percentage": 54.48, "elapsed_time": "3 days, 19:34:40", "remaining_time": "3 days, 4:31:24", "throughput": 2724.08, "total_tokens": 898075360} {"current_steps": 4977, "total_steps": 9134, "loss": 0.6275, "learning_rate": 2.1486237647134014e-05, "epoch": 0.5448424970579381, "percentage": 54.49, "elapsed_time": "3 days, 19:35:47", "remaining_time": "3 days, 4:30:18", "throughput": 2724.13, "total_tokens": 898273376} {"current_steps": 4978, "total_steps": 9134, "loss": 0.6879, "learning_rate": 2.147772458693379e-05, "epoch": 0.544951969128876, "percentage": 54.5, "elapsed_time": "3 days, 19:36:54", "remaining_time": "3 days, 4:29:13", "throughput": 2724.2, "total_tokens": 898481920} {"current_steps": 4979, "total_steps": 9134, "loss": 0.6392, "learning_rate": 2.146921194341202e-05, "epoch": 0.5450614411998139, "percentage": 54.51, "elapsed_time": "3 days, 19:37:58", "remaining_time": "3 days, 4:28:05", "throughput": 2724.18, "total_tokens": 898649472} {"current_steps": 4980, "total_steps": 9134, "loss": 0.5415, "learning_rate": 2.1460699717575718e-05, "epoch": 0.5451709132707518, "percentage": 54.52, "elapsed_time": "3 days, 19:39:07", "remaining_time": "3 days, 4:27:00", "throughput": 2724.18, "total_tokens": 898834048} {"current_steps": 4981, "total_steps": 9134, "loss": 0.8757, "learning_rate": 2.1452187910431875e-05, "epoch": 0.5452803853416897, "percentage": 54.53, "elapsed_time": "3 days, 19:40:15", "remaining_time": "3 days, 4:25:56", "throughput": 2724.24, "total_tokens": 899041696} {"current_steps": 4982, "total_steps": 9134, "loss": 0.8687, "learning_rate": 2.1443676522987432e-05, "epoch": 0.5453898574126276, "percentage": 54.54, "elapsed_time": "3 days, 19:41:19", "remaining_time": "3 days, 4:24:48", "throughput": 2724.25, "total_tokens": 899218880} {"current_steps": 4983, "total_steps": 9134, "loss": 0.728, "learning_rate": 2.1435165556249246e-05, "epoch": 0.5454993294835655, "percentage": 54.55, "elapsed_time": "3 days, 19:42:25", "remaining_time": "3 days, 4:23:41", "throughput": 2724.23, "total_tokens": 899391808} {"current_steps": 4984, "total_steps": 9134, "loss": 0.769, "learning_rate": 2.142665501122417e-05, "epoch": 0.5456088015545034, "percentage": 54.57, "elapsed_time": "3 days, 19:43:33", "remaining_time": "3 days, 4:22:37", "throughput": 2724.28, "total_tokens": 899596096} {"current_steps": 4985, "total_steps": 9134, "loss": 0.6841, "learning_rate": 2.141814488891896e-05, "epoch": 0.5457182736254413, "percentage": 54.58, "elapsed_time": "3 days, 19:44:40", "remaining_time": "3 days, 4:21:31", "throughput": 2724.25, "total_tokens": 899767456} {"current_steps": 4986, "total_steps": 9134, "loss": 0.6675, "learning_rate": 2.1409635190340373e-05, "epoch": 0.5458277456963793, "percentage": 54.59, "elapsed_time": "3 days, 19:45:46", "remaining_time": "3 days, 4:20:24", "throughput": 2724.28, "total_tokens": 899954720} {"current_steps": 4987, "total_steps": 9134, "loss": 0.5039, "learning_rate": 2.1401125916495072e-05, "epoch": 0.5459372177673171, "percentage": 54.6, "elapsed_time": "3 days, 19:46:52", "remaining_time": "3 days, 4:19:18", "throughput": 2724.33, "total_tokens": 900154528} {"current_steps": 4988, "total_steps": 9134, "loss": 0.5491, "learning_rate": 2.1392617068389697e-05, "epoch": 0.546046689838255, "percentage": 54.61, "elapsed_time": "3 days, 19:47:55", "remaining_time": "3 days, 4:18:09", "throughput": 2724.31, "total_tokens": 900317824} {"current_steps": 4989, "total_steps": 9134, "loss": 0.8438, "learning_rate": 2.1384108647030836e-05, "epoch": 0.5461561619091929, "percentage": 54.62, "elapsed_time": "3 days, 19:49:04", "remaining_time": "3 days, 4:17:05", "throughput": 2724.37, "total_tokens": 900527488} {"current_steps": 4990, "total_steps": 9134, "loss": 0.7102, "learning_rate": 2.1375600653425003e-05, "epoch": 0.5462656339801308, "percentage": 54.63, "elapsed_time": "3 days, 19:50:10", "remaining_time": "3 days, 4:15:59", "throughput": 2724.35, "total_tokens": 900698176} {"current_steps": 4991, "total_steps": 9134, "loss": 0.7787, "learning_rate": 2.136709308857869e-05, "epoch": 0.5463751060510688, "percentage": 54.64, "elapsed_time": "3 days, 19:51:20", "remaining_time": "3 days, 4:14:55", "throughput": 2724.42, "total_tokens": 900909856} {"current_steps": 4992, "total_steps": 9134, "loss": 0.7027, "learning_rate": 2.135858595349831e-05, "epoch": 0.5464845781220066, "percentage": 54.65, "elapsed_time": "3 days, 19:52:23", "remaining_time": "3 days, 4:13:47", "throughput": 2724.35, "total_tokens": 901063744} {"current_steps": 4993, "total_steps": 9134, "loss": 0.5379, "learning_rate": 2.135007924919026e-05, "epoch": 0.5465940501929445, "percentage": 54.66, "elapsed_time": "3 days, 19:53:33", "remaining_time": "3 days, 4:12:43", "throughput": 2724.34, "total_tokens": 901246976} {"current_steps": 4994, "total_steps": 9134, "loss": 0.6421, "learning_rate": 2.134157297666085e-05, "epoch": 0.5467035222638824, "percentage": 54.67, "elapsed_time": "3 days, 19:54:37", "remaining_time": "3 days, 4:11:35", "throughput": 2724.24, "total_tokens": 901387872} {"current_steps": 4995, "total_steps": 9134, "loss": 0.7068, "learning_rate": 2.133306713691636e-05, "epoch": 0.5468129943348203, "percentage": 54.69, "elapsed_time": "3 days, 19:55:43", "remaining_time": "3 days, 4:10:29", "throughput": 2724.29, "total_tokens": 901588352} {"current_steps": 4996, "total_steps": 9134, "loss": 0.7041, "learning_rate": 2.1324561730963025e-05, "epoch": 0.5469224664057583, "percentage": 54.7, "elapsed_time": "3 days, 19:56:48", "remaining_time": "3 days, 4:09:22", "throughput": 2724.26, "total_tokens": 901753216} {"current_steps": 4997, "total_steps": 9134, "loss": 0.5395, "learning_rate": 2.1316056759807006e-05, "epoch": 0.5470319384766962, "percentage": 54.71, "elapsed_time": "3 days, 19:57:52", "remaining_time": "3 days, 4:08:14", "throughput": 2724.26, "total_tokens": 901928160} {"current_steps": 4998, "total_steps": 9134, "loss": 0.7918, "learning_rate": 2.1307552224454435e-05, "epoch": 0.547141410547634, "percentage": 54.72, "elapsed_time": "3 days, 19:59:01", "remaining_time": "3 days, 4:07:09", "throughput": 2724.29, "total_tokens": 902123936} {"current_steps": 4999, "total_steps": 9134, "loss": 0.791, "learning_rate": 2.129904812591137e-05, "epoch": 0.5472508826185719, "percentage": 54.73, "elapsed_time": "3 days, 20:00:02", "remaining_time": "3 days, 4:05:59", "throughput": 2724.22, "total_tokens": 902269088} {"current_steps": 5000, "total_steps": 9134, "loss": 0.989, "learning_rate": 2.129054446518385e-05, "epoch": 0.5473603546895098, "percentage": 54.74, "elapsed_time": "3 days, 20:01:12", "remaining_time": "3 days, 4:04:55", "throughput": 2724.28, "total_tokens": 902477632} {"current_steps": 5001, "total_steps": 9134, "loss": 0.8198, "learning_rate": 2.1282041243277816e-05, "epoch": 0.5474698267604478, "percentage": 54.75, "elapsed_time": "3 days, 20:02:19", "remaining_time": "3 days, 4:03:50", "throughput": 2724.26, "total_tokens": 902657504} {"current_steps": 5002, "total_steps": 9134, "loss": 0.8118, "learning_rate": 2.1273538461199194e-05, "epoch": 0.5475792988313857, "percentage": 54.76, "elapsed_time": "3 days, 20:03:29", "remaining_time": "3 days, 4:02:47", "throughput": 2724.29, "total_tokens": 902853728} {"current_steps": 5003, "total_steps": 9134, "loss": 0.6153, "learning_rate": 2.1265036119953864e-05, "epoch": 0.5476887709023236, "percentage": 54.77, "elapsed_time": "3 days, 20:04:34", "remaining_time": "3 days, 4:01:39", "throughput": 2724.3, "total_tokens": 903033376} {"current_steps": 5004, "total_steps": 9134, "loss": 0.7814, "learning_rate": 2.12565342205476e-05, "epoch": 0.5477982429732614, "percentage": 54.78, "elapsed_time": "3 days, 20:05:41", "remaining_time": "3 days, 4:00:34", "throughput": 2724.31, "total_tokens": 903221088} {"current_steps": 5005, "total_steps": 9134, "loss": 0.6778, "learning_rate": 2.1248032763986203e-05, "epoch": 0.5479077150441993, "percentage": 54.8, "elapsed_time": "3 days, 20:06:42", "remaining_time": "3 days, 3:59:23", "throughput": 2724.25, "total_tokens": 903366240} {"current_steps": 5006, "total_steps": 9134, "loss": 0.8157, "learning_rate": 2.1239531751275344e-05, "epoch": 0.5480171871151372, "percentage": 54.81, "elapsed_time": "3 days, 20:07:48", "remaining_time": "3 days, 3:58:17", "throughput": 2724.25, "total_tokens": 903549696} {"current_steps": 5007, "total_steps": 9134, "loss": 0.8017, "learning_rate": 2.123103118342069e-05, "epoch": 0.5481266591860752, "percentage": 54.82, "elapsed_time": "3 days, 20:08:57", "remaining_time": "3 days, 3:57:13", "throughput": 2724.28, "total_tokens": 903746144} {"current_steps": 5008, "total_steps": 9134, "loss": 0.8181, "learning_rate": 2.1222531061427843e-05, "epoch": 0.5482361312570131, "percentage": 54.83, "elapsed_time": "3 days, 20:10:07", "remaining_time": "3 days, 3:56:09", "throughput": 2724.28, "total_tokens": 903936768} {"current_steps": 5009, "total_steps": 9134, "loss": 0.6677, "learning_rate": 2.1214031386302347e-05, "epoch": 0.5483456033279509, "percentage": 54.84, "elapsed_time": "3 days, 20:11:07", "remaining_time": "3 days, 3:54:58", "throughput": 2724.2, "total_tokens": 904072064} {"current_steps": 5010, "total_steps": 9134, "loss": 0.8803, "learning_rate": 2.1205532159049714e-05, "epoch": 0.5484550753988888, "percentage": 54.85, "elapsed_time": "3 days, 20:12:15", "remaining_time": "3 days, 3:53:54", "throughput": 2724.18, "total_tokens": 904252832} {"current_steps": 5011, "total_steps": 9134, "loss": 0.8263, "learning_rate": 2.1197033380675357e-05, "epoch": 0.5485645474698267, "percentage": 54.86, "elapsed_time": "3 days, 20:13:21", "remaining_time": "3 days, 3:52:47", "throughput": 2724.18, "total_tokens": 904433600} {"current_steps": 5012, "total_steps": 9134, "loss": 0.8637, "learning_rate": 2.1188535052184695e-05, "epoch": 0.5486740195407647, "percentage": 54.87, "elapsed_time": "3 days, 20:14:29", "remaining_time": "3 days, 3:51:42", "throughput": 2724.23, "total_tokens": 904634528} {"current_steps": 5013, "total_steps": 9134, "loss": 0.5752, "learning_rate": 2.118003717458304e-05, "epoch": 0.5487834916117026, "percentage": 54.88, "elapsed_time": "3 days, 20:15:32", "remaining_time": "3 days, 3:50:33", "throughput": 2724.23, "total_tokens": 904804768} {"current_steps": 5014, "total_steps": 9134, "loss": 0.6304, "learning_rate": 2.1171539748875692e-05, "epoch": 0.5488929636826405, "percentage": 54.89, "elapsed_time": "3 days, 20:16:37", "remaining_time": "3 days, 3:49:26", "throughput": 2724.23, "total_tokens": 904981728} {"current_steps": 5015, "total_steps": 9134, "loss": 1.0495, "learning_rate": 2.1163042776067865e-05, "epoch": 0.5490024357535783, "percentage": 54.9, "elapsed_time": "3 days, 20:17:47", "remaining_time": "3 days, 3:48:23", "throughput": 2724.28, "total_tokens": 905188704} {"current_steps": 5016, "total_steps": 9134, "loss": 0.6804, "learning_rate": 2.1154546257164744e-05, "epoch": 0.5491119078245162, "percentage": 54.92, "elapsed_time": "3 days, 20:18:55", "remaining_time": "3 days, 3:47:18", "throughput": 2724.28, "total_tokens": 905377088} {"current_steps": 5017, "total_steps": 9134, "loss": 0.694, "learning_rate": 2.114605019317145e-05, "epoch": 0.5492213798954542, "percentage": 54.93, "elapsed_time": "3 days, 20:20:02", "remaining_time": "3 days, 3:46:12", "throughput": 2724.26, "total_tokens": 905549568} {"current_steps": 5018, "total_steps": 9134, "loss": 0.8062, "learning_rate": 2.1137554585093056e-05, "epoch": 0.5493308519663921, "percentage": 54.94, "elapsed_time": "3 days, 20:21:09", "remaining_time": "3 days, 3:45:07", "throughput": 2724.24, "total_tokens": 905728992} {"current_steps": 5019, "total_steps": 9134, "loss": 0.5581, "learning_rate": 2.1129059433934567e-05, "epoch": 0.54944032403733, "percentage": 54.95, "elapsed_time": "3 days, 20:22:14", "remaining_time": "3 days, 3:43:59", "throughput": 2724.23, "total_tokens": 905901696} {"current_steps": 5020, "total_steps": 9134, "loss": 0.7647, "learning_rate": 2.1120564740700945e-05, "epoch": 0.5495497961082679, "percentage": 54.96, "elapsed_time": "3 days, 20:23:20", "remaining_time": "3 days, 3:42:53", "throughput": 2724.24, "total_tokens": 906082688} {"current_steps": 5021, "total_steps": 9134, "loss": 0.6781, "learning_rate": 2.1112070506397105e-05, "epoch": 0.5496592681792057, "percentage": 54.97, "elapsed_time": "3 days, 20:24:24", "remaining_time": "3 days, 3:41:45", "throughput": 2724.23, "total_tokens": 906252704} {"current_steps": 5022, "total_steps": 9134, "loss": 0.715, "learning_rate": 2.1103576732027882e-05, "epoch": 0.5497687402501437, "percentage": 54.98, "elapsed_time": "3 days, 20:25:28", "remaining_time": "3 days, 3:40:37", "throughput": 2724.21, "total_tokens": 906422720} {"current_steps": 5023, "total_steps": 9134, "loss": 0.7709, "learning_rate": 2.1095083418598083e-05, "epoch": 0.5498782123210816, "percentage": 54.99, "elapsed_time": "3 days, 20:26:34", "remaining_time": "3 days, 3:39:30", "throughput": 2724.19, "total_tokens": 906594080} {"current_steps": 5024, "total_steps": 9134, "loss": 0.7461, "learning_rate": 2.1086590567112463e-05, "epoch": 0.5499876843920195, "percentage": 55.0, "elapsed_time": "3 days, 20:27:41", "remaining_time": "3 days, 3:38:25", "throughput": 2724.21, "total_tokens": 906786272} {"current_steps": 5025, "total_steps": 9134, "loss": 0.5154, "learning_rate": 2.1078098178575686e-05, "epoch": 0.5500971564629574, "percentage": 55.01, "elapsed_time": "3 days, 20:28:49", "remaining_time": "3 days, 3:37:20", "throughput": 2724.2, "total_tokens": 906967040} {"current_steps": 5026, "total_steps": 9134, "loss": 0.8948, "learning_rate": 2.1069606253992406e-05, "epoch": 0.5502066285338952, "percentage": 55.03, "elapsed_time": "3 days, 20:29:58", "remaining_time": "3 days, 3:36:16", "throughput": 2724.24, "total_tokens": 907167968} {"current_steps": 5027, "total_steps": 9134, "loss": 0.7384, "learning_rate": 2.1061114794367185e-05, "epoch": 0.5503161006048332, "percentage": 55.04, "elapsed_time": "3 days, 20:31:07", "remaining_time": "3 days, 3:35:12", "throughput": 2724.24, "total_tokens": 907356352} {"current_steps": 5028, "total_steps": 9134, "loss": 0.9204, "learning_rate": 2.1052623800704557e-05, "epoch": 0.5504255726757711, "percentage": 55.05, "elapsed_time": "3 days, 20:32:13", "remaining_time": "3 days, 3:34:06", "throughput": 2724.3, "total_tokens": 907557056} {"current_steps": 5029, "total_steps": 9134, "loss": 0.8109, "learning_rate": 2.1044133274008983e-05, "epoch": 0.550535044746709, "percentage": 55.06, "elapsed_time": "3 days, 20:33:21", "remaining_time": "3 days, 3:33:00", "throughput": 2724.28, "total_tokens": 907734688} {"current_steps": 5030, "total_steps": 9134, "loss": 0.7335, "learning_rate": 2.1035643215284882e-05, "epoch": 0.5506445168176469, "percentage": 55.07, "elapsed_time": "3 days, 20:34:29", "remaining_time": "3 days, 3:31:56", "throughput": 2724.33, "total_tokens": 907937184} {"current_steps": 5031, "total_steps": 9134, "loss": 0.5591, "learning_rate": 2.1027153625536616e-05, "epoch": 0.5507539888885848, "percentage": 55.08, "elapsed_time": "3 days, 20:35:36", "remaining_time": "3 days, 3:30:50", "throughput": 2724.3, "total_tokens": 908108544} {"current_steps": 5032, "total_steps": 9134, "loss": 0.6129, "learning_rate": 2.1018664505768476e-05, "epoch": 0.5508634609595227, "percentage": 55.09, "elapsed_time": "3 days, 20:36:39", "remaining_time": "3 days, 3:29:41", "throughput": 2724.27, "total_tokens": 908271840} {"current_steps": 5033, "total_steps": 9134, "loss": 0.66, "learning_rate": 2.101017585698472e-05, "epoch": 0.5509729330304606, "percentage": 55.1, "elapsed_time": "3 days, 20:37:41", "remaining_time": "3 days, 3:28:31", "throughput": 2724.22, "total_tokens": 908423040} {"current_steps": 5034, "total_steps": 9134, "loss": 0.777, "learning_rate": 2.1001687680189524e-05, "epoch": 0.5510824051013985, "percentage": 55.11, "elapsed_time": "3 days, 20:38:48", "remaining_time": "3 days, 3:27:26", "throughput": 2724.28, "total_tokens": 908625088} {"current_steps": 5035, "total_steps": 9134, "loss": 0.6753, "learning_rate": 2.0993199976387043e-05, "epoch": 0.5511918771723364, "percentage": 55.12, "elapsed_time": "3 days, 20:39:55", "remaining_time": "3 days, 3:26:20", "throughput": 2724.3, "total_tokens": 908813024} {"current_steps": 5036, "total_steps": 9134, "loss": 0.6891, "learning_rate": 2.0984712746581337e-05, "epoch": 0.5513013492432743, "percentage": 55.13, "elapsed_time": "3 days, 20:40:59", "remaining_time": "3 days, 3:25:12", "throughput": 2724.3, "total_tokens": 908989088} {"current_steps": 5037, "total_steps": 9134, "loss": 0.6448, "learning_rate": 2.0976225991776434e-05, "epoch": 0.5514108213142123, "percentage": 55.15, "elapsed_time": "3 days, 20:42:05", "remaining_time": "3 days, 3:24:05", "throughput": 2724.25, "total_tokens": 909151040} {"current_steps": 5038, "total_steps": 9134, "loss": 0.7178, "learning_rate": 2.0967739712976308e-05, "epoch": 0.5515202933851501, "percentage": 55.16, "elapsed_time": "3 days, 20:43:14", "remaining_time": "3 days, 3:23:01", "throughput": 2724.25, "total_tokens": 909338976} {"current_steps": 5039, "total_steps": 9134, "loss": 0.6415, "learning_rate": 2.0959253911184867e-05, "epoch": 0.551629765456088, "percentage": 55.17, "elapsed_time": "3 days, 20:44:19", "remaining_time": "3 days, 3:21:54", "throughput": 2724.27, "total_tokens": 909522208} {"current_steps": 5040, "total_steps": 9134, "loss": 0.7438, "learning_rate": 2.0950768587405963e-05, "epoch": 0.5517392375270259, "percentage": 55.18, "elapsed_time": "3 days, 20:45:25", "remaining_time": "3 days, 3:20:48", "throughput": 2724.28, "total_tokens": 909708352} {"current_steps": 5041, "total_steps": 9134, "loss": 0.7387, "learning_rate": 2.0942283742643392e-05, "epoch": 0.5518487095979638, "percentage": 55.19, "elapsed_time": "3 days, 20:46:31", "remaining_time": "3 days, 3:19:41", "throughput": 2724.3, "total_tokens": 909893376} {"current_steps": 5042, "total_steps": 9134, "loss": 0.6153, "learning_rate": 2.0933799377900907e-05, "epoch": 0.5519581816689018, "percentage": 55.2, "elapsed_time": "3 days, 20:47:38", "remaining_time": "3 days, 3:18:35", "throughput": 2724.32, "total_tokens": 910082432} {"current_steps": 5043, "total_steps": 9134, "loss": 0.7827, "learning_rate": 2.0925315494182168e-05, "epoch": 0.5520676537398396, "percentage": 55.21, "elapsed_time": "3 days, 20:48:41", "remaining_time": "3 days, 3:17:26", "throughput": 2724.31, "total_tokens": 910248416} {"current_steps": 5044, "total_steps": 9134, "loss": 0.7814, "learning_rate": 2.091683209249082e-05, "epoch": 0.5521771258107775, "percentage": 55.22, "elapsed_time": "3 days, 20:49:50", "remaining_time": "3 days, 3:16:23", "throughput": 2724.29, "total_tokens": 910433216} {"current_steps": 5045, "total_steps": 9134, "loss": 0.6318, "learning_rate": 2.090834917383044e-05, "epoch": 0.5522865978817154, "percentage": 55.23, "elapsed_time": "3 days, 20:50:55", "remaining_time": "3 days, 3:15:16", "throughput": 2724.3, "total_tokens": 910613312} {"current_steps": 5046, "total_steps": 9134, "loss": 0.6972, "learning_rate": 2.089986673920452e-05, "epoch": 0.5523960699526533, "percentage": 55.24, "elapsed_time": "3 days, 20:52:02", "remaining_time": "3 days, 3:14:10", "throughput": 2724.31, "total_tokens": 910800128} {"current_steps": 5047, "total_steps": 9134, "loss": 0.7616, "learning_rate": 2.0891384789616535e-05, "epoch": 0.5525055420235913, "percentage": 55.26, "elapsed_time": "3 days, 20:53:10", "remaining_time": "3 days, 3:13:05", "throughput": 2724.37, "total_tokens": 911003296} {"current_steps": 5048, "total_steps": 9134, "loss": 0.7694, "learning_rate": 2.088290332606987e-05, "epoch": 0.5526150140945292, "percentage": 55.27, "elapsed_time": "3 days, 20:54:15", "remaining_time": "3 days, 3:11:57", "throughput": 2724.35, "total_tokens": 911171520} {"current_steps": 5049, "total_steps": 9134, "loss": 0.6619, "learning_rate": 2.0874422349567866e-05, "epoch": 0.552724486165467, "percentage": 55.28, "elapsed_time": "3 days, 20:55:18", "remaining_time": "3 days, 3:10:48", "throughput": 2724.34, "total_tokens": 911342432} {"current_steps": 5050, "total_steps": 9134, "loss": 0.9613, "learning_rate": 2.0865941861113818e-05, "epoch": 0.5528339582364049, "percentage": 55.29, "elapsed_time": "3 days, 20:56:27", "remaining_time": "3 days, 3:09:45", "throughput": 2724.41, "total_tokens": 911553664} {"current_steps": 5051, "total_steps": 9134, "loss": 0.6672, "learning_rate": 2.085746186171094e-05, "epoch": 0.5529434303073428, "percentage": 55.3, "elapsed_time": "3 days, 20:57:34", "remaining_time": "3 days, 3:08:39", "throughput": 2724.43, "total_tokens": 911740928} {"current_steps": 5052, "total_steps": 9134, "loss": 0.8157, "learning_rate": 2.0848982352362413e-05, "epoch": 0.5530529023782808, "percentage": 55.31, "elapsed_time": "3 days, 20:58:37", "remaining_time": "3 days, 3:07:30", "throughput": 2724.38, "total_tokens": 911899968} {"current_steps": 5053, "total_steps": 9134, "loss": 0.8, "learning_rate": 2.0840503334071332e-05, "epoch": 0.5531623744492187, "percentage": 55.32, "elapsed_time": "3 days, 20:59:43", "remaining_time": "3 days, 3:06:24", "throughput": 2724.36, "total_tokens": 912071104} {"current_steps": 5054, "total_steps": 9134, "loss": 0.812, "learning_rate": 2.0832024807840762e-05, "epoch": 0.5532718465201566, "percentage": 55.33, "elapsed_time": "3 days, 21:00:52", "remaining_time": "3 days, 3:05:20", "throughput": 2724.42, "total_tokens": 912278528} {"current_steps": 5055, "total_steps": 9134, "loss": 0.767, "learning_rate": 2.082354677467368e-05, "epoch": 0.5533813185910944, "percentage": 55.34, "elapsed_time": "3 days, 21:02:02", "remaining_time": "3 days, 3:04:16", "throughput": 2724.44, "total_tokens": 912476544} {"current_steps": 5056, "total_steps": 9134, "loss": 0.699, "learning_rate": 2.081506923557303e-05, "epoch": 0.5534907906620323, "percentage": 55.35, "elapsed_time": "3 days, 21:03:09", "remaining_time": "3 days, 3:03:11", "throughput": 2724.42, "total_tokens": 912651936} {"current_steps": 5057, "total_steps": 9134, "loss": 0.5955, "learning_rate": 2.08065921915417e-05, "epoch": 0.5536002627329702, "percentage": 55.36, "elapsed_time": "3 days, 21:04:18", "remaining_time": "3 days, 3:02:07", "throughput": 2724.44, "total_tokens": 912847712} {"current_steps": 5058, "total_steps": 9134, "loss": 0.8396, "learning_rate": 2.079811564358249e-05, "epoch": 0.5537097348039082, "percentage": 55.38, "elapsed_time": "3 days, 21:05:27", "remaining_time": "3 days, 3:01:03", "throughput": 2724.45, "total_tokens": 913037440} {"current_steps": 5059, "total_steps": 9134, "loss": 0.7926, "learning_rate": 2.0789639592698164e-05, "epoch": 0.5538192068748461, "percentage": 55.39, "elapsed_time": "3 days, 21:06:35", "remaining_time": "3 days, 2:59:58", "throughput": 2724.46, "total_tokens": 913226048} {"current_steps": 5060, "total_steps": 9134, "loss": 0.8552, "learning_rate": 2.0781164039891432e-05, "epoch": 0.5539286789457839, "percentage": 55.4, "elapsed_time": "3 days, 21:07:38", "remaining_time": "3 days, 2:58:49", "throughput": 2724.44, "total_tokens": 913391584} {"current_steps": 5061, "total_steps": 9134, "loss": 0.7468, "learning_rate": 2.0772688986164928e-05, "epoch": 0.5540381510167218, "percentage": 55.41, "elapsed_time": "3 days, 21:08:43", "remaining_time": "3 days, 2:57:42", "throughput": 2724.42, "total_tokens": 913563392} {"current_steps": 5062, "total_steps": 9134, "loss": 0.5846, "learning_rate": 2.076421443252123e-05, "epoch": 0.5541476230876597, "percentage": 55.42, "elapsed_time": "3 days, 21:09:48", "remaining_time": "3 days, 2:56:35", "throughput": 2724.43, "total_tokens": 913742368} {"current_steps": 5063, "total_steps": 9134, "loss": 0.8922, "learning_rate": 2.0755740379962864e-05, "epoch": 0.5542570951585977, "percentage": 55.43, "elapsed_time": "3 days, 21:10:58", "remaining_time": "3 days, 2:55:31", "throughput": 2724.46, "total_tokens": 913942624} {"current_steps": 5064, "total_steps": 9134, "loss": 0.7978, "learning_rate": 2.0747266829492312e-05, "epoch": 0.5543665672295356, "percentage": 55.44, "elapsed_time": "3 days, 21:12:06", "remaining_time": "3 days, 2:54:26", "throughput": 2724.48, "total_tokens": 914136160} {"current_steps": 5065, "total_steps": 9134, "loss": 0.8024, "learning_rate": 2.0738793782111954e-05, "epoch": 0.5544760393004735, "percentage": 55.45, "elapsed_time": "3 days, 21:13:13", "remaining_time": "3 days, 2:53:21", "throughput": 2724.5, "total_tokens": 914324096} {"current_steps": 5066, "total_steps": 9134, "loss": 0.6321, "learning_rate": 2.0730321238824156e-05, "epoch": 0.5545855113714113, "percentage": 55.46, "elapsed_time": "3 days, 21:14:16", "remaining_time": "3 days, 2:52:11", "throughput": 2724.48, "total_tokens": 914487392} {"current_steps": 5067, "total_steps": 9134, "loss": 0.6425, "learning_rate": 2.072184920063118e-05, "epoch": 0.5546949834423492, "percentage": 55.47, "elapsed_time": "3 days, 21:15:25", "remaining_time": "3 days, 2:51:08", "throughput": 2724.56, "total_tokens": 914703328} {"current_steps": 5068, "total_steps": 9134, "loss": 0.7127, "learning_rate": 2.0713377668535276e-05, "epoch": 0.5548044555132872, "percentage": 55.49, "elapsed_time": "3 days, 21:16:31", "remaining_time": "3 days, 2:50:02", "throughput": 2724.58, "total_tokens": 914892608} {"current_steps": 5069, "total_steps": 9134, "loss": 0.7138, "learning_rate": 2.070490664353859e-05, "epoch": 0.5549139275842251, "percentage": 55.5, "elapsed_time": "3 days, 21:17:36", "remaining_time": "3 days, 2:48:54", "throughput": 2724.58, "total_tokens": 915070464} {"current_steps": 5070, "total_steps": 9134, "loss": 0.9494, "learning_rate": 2.0696436126643236e-05, "epoch": 0.555023399655163, "percentage": 55.51, "elapsed_time": "3 days, 21:18:43", "remaining_time": "3 days, 2:47:48", "throughput": 2724.6, "total_tokens": 915258400} {"current_steps": 5071, "total_steps": 9134, "loss": 0.8068, "learning_rate": 2.0687966118851268e-05, "epoch": 0.5551328717261009, "percentage": 55.52, "elapsed_time": "3 days, 21:19:52", "remaining_time": "3 days, 2:46:45", "throughput": 2724.63, "total_tokens": 915457536} {"current_steps": 5072, "total_steps": 9134, "loss": 0.7889, "learning_rate": 2.067949662116466e-05, "epoch": 0.5552423437970387, "percentage": 55.53, "elapsed_time": "3 days, 21:20:54", "remaining_time": "3 days, 2:45:35", "throughput": 2724.57, "total_tokens": 915602912} {"current_steps": 5073, "total_steps": 9134, "loss": 0.6716, "learning_rate": 2.067102763458535e-05, "epoch": 0.5553518158679767, "percentage": 55.54, "elapsed_time": "3 days, 21:21:57", "remaining_time": "3 days, 2:44:26", "throughput": 2724.51, "total_tokens": 915756352} {"current_steps": 5074, "total_steps": 9134, "loss": 0.6023, "learning_rate": 2.0662559160115186e-05, "epoch": 0.5554612879389146, "percentage": 55.55, "elapsed_time": "3 days, 21:23:01", "remaining_time": "3 days, 2:43:18", "throughput": 2724.51, "total_tokens": 915930848} {"current_steps": 5075, "total_steps": 9134, "loss": 0.823, "learning_rate": 2.065409119875599e-05, "epoch": 0.5555707600098525, "percentage": 55.56, "elapsed_time": "3 days, 21:24:10", "remaining_time": "3 days, 2:42:14", "throughput": 2724.54, "total_tokens": 916127968} {"current_steps": 5076, "total_steps": 9134, "loss": 0.7421, "learning_rate": 2.0645623751509495e-05, "epoch": 0.5556802320807904, "percentage": 55.57, "elapsed_time": "3 days, 21:25:09", "remaining_time": "3 days, 2:41:02", "throughput": 2724.5, "total_tokens": 916274688} {"current_steps": 5077, "total_steps": 9134, "loss": 0.6162, "learning_rate": 2.0637156819377378e-05, "epoch": 0.5557897041517282, "percentage": 55.58, "elapsed_time": "3 days, 21:26:16", "remaining_time": "3 days, 2:39:56", "throughput": 2724.53, "total_tokens": 916468896} {"current_steps": 5078, "total_steps": 9134, "loss": 0.9308, "learning_rate": 2.0628690403361285e-05, "epoch": 0.5558991762226662, "percentage": 55.59, "elapsed_time": "3 days, 21:27:24", "remaining_time": "3 days, 2:38:51", "throughput": 2724.5, "total_tokens": 916642944} {"current_steps": 5079, "total_steps": 9134, "loss": 0.7521, "learning_rate": 2.0620224504462742e-05, "epoch": 0.5560086482936041, "percentage": 55.61, "elapsed_time": "3 days, 21:28:31", "remaining_time": "3 days, 2:37:46", "throughput": 2724.54, "total_tokens": 916838496} {"current_steps": 5080, "total_steps": 9134, "loss": 0.5736, "learning_rate": 2.061175912368328e-05, "epoch": 0.556118120364542, "percentage": 55.62, "elapsed_time": "3 days, 21:29:37", "remaining_time": "3 days, 2:36:39", "throughput": 2724.54, "total_tokens": 917018368} {"current_steps": 5081, "total_steps": 9134, "loss": 0.65, "learning_rate": 2.0603294262024323e-05, "epoch": 0.5562275924354799, "percentage": 55.63, "elapsed_time": "3 days, 21:30:44", "remaining_time": "3 days, 2:35:33", "throughput": 2724.54, "total_tokens": 917200928} {"current_steps": 5082, "total_steps": 9134, "loss": 0.7929, "learning_rate": 2.059482992048725e-05, "epoch": 0.5563370645064178, "percentage": 55.64, "elapsed_time": "3 days, 21:31:53", "remaining_time": "3 days, 2:34:29", "throughput": 2724.59, "total_tokens": 917408128} {"current_steps": 5083, "total_steps": 9134, "loss": 0.8905, "learning_rate": 2.058636610007337e-05, "epoch": 0.5564465365773557, "percentage": 55.65, "elapsed_time": "3 days, 21:33:02", "remaining_time": "3 days, 2:33:25", "throughput": 2724.56, "total_tokens": 917584416} {"current_steps": 5084, "total_steps": 9134, "loss": 0.6044, "learning_rate": 2.057790280178394e-05, "epoch": 0.5565560086482936, "percentage": 55.66, "elapsed_time": "3 days, 21:34:09", "remaining_time": "3 days, 2:32:20", "throughput": 2724.57, "total_tokens": 917769664} {"current_steps": 5085, "total_steps": 9134, "loss": 0.8594, "learning_rate": 2.056944002662017e-05, "epoch": 0.5566654807192315, "percentage": 55.67, "elapsed_time": "3 days, 21:35:19", "remaining_time": "3 days, 2:31:16", "throughput": 2724.58, "total_tokens": 917963424} {"current_steps": 5086, "total_steps": 9134, "loss": 0.8714, "learning_rate": 2.0560977775583162e-05, "epoch": 0.5567749527901694, "percentage": 55.68, "elapsed_time": "3 days, 21:36:28", "remaining_time": "3 days, 2:30:12", "throughput": 2724.64, "total_tokens": 918172416} {"current_steps": 5087, "total_steps": 9134, "loss": 0.6985, "learning_rate": 2.0552516049674007e-05, "epoch": 0.5568844248611073, "percentage": 55.69, "elapsed_time": "3 days, 21:37:29", "remaining_time": "3 days, 2:29:02", "throughput": 2724.58, "total_tokens": 918320032} {"current_steps": 5088, "total_steps": 9134, "loss": 0.6979, "learning_rate": 2.0544054849893696e-05, "epoch": 0.5569938969320453, "percentage": 55.7, "elapsed_time": "3 days, 21:38:37", "remaining_time": "3 days, 2:27:57", "throughput": 2724.6, "total_tokens": 918512000} {"current_steps": 5089, "total_steps": 9134, "loss": 0.7105, "learning_rate": 2.0535594177243183e-05, "epoch": 0.5571033690029831, "percentage": 55.71, "elapsed_time": "3 days, 21:39:47", "remaining_time": "3 days, 2:26:53", "throughput": 2724.65, "total_tokens": 918718080} {"current_steps": 5090, "total_steps": 9134, "loss": 0.9929, "learning_rate": 2.0527134032723337e-05, "epoch": 0.557212841073921, "percentage": 55.73, "elapsed_time": "3 days, 21:40:56", "remaining_time": "3 days, 2:25:49", "throughput": 2724.71, "total_tokens": 918926400} {"current_steps": 5091, "total_steps": 9134, "loss": 0.7281, "learning_rate": 2.0518674417334982e-05, "epoch": 0.5573223131448589, "percentage": 55.74, "elapsed_time": "3 days, 21:41:56", "remaining_time": "3 days, 2:24:38", "throughput": 2724.63, "total_tokens": 919061472} {"current_steps": 5092, "total_steps": 9134, "loss": 0.6037, "learning_rate": 2.0510215332078884e-05, "epoch": 0.5574317852157968, "percentage": 55.75, "elapsed_time": "3 days, 21:43:05", "remaining_time": "3 days, 2:23:34", "throughput": 2724.67, "total_tokens": 919263744} {"current_steps": 5093, "total_steps": 9134, "loss": 0.7978, "learning_rate": 2.050175677795572e-05, "epoch": 0.5575412572867348, "percentage": 55.76, "elapsed_time": "3 days, 21:44:14", "remaining_time": "3 days, 2:22:30", "throughput": 2724.67, "total_tokens": 919453920} {"current_steps": 5094, "total_steps": 9134, "loss": 0.7985, "learning_rate": 2.0493298755966145e-05, "epoch": 0.5576507293576726, "percentage": 55.77, "elapsed_time": "3 days, 21:45:17", "remaining_time": "3 days, 2:21:21", "throughput": 2724.61, "total_tokens": 919602880} {"current_steps": 5095, "total_steps": 9134, "loss": 0.8073, "learning_rate": 2.0484841267110698e-05, "epoch": 0.5577602014286105, "percentage": 55.78, "elapsed_time": "3 days, 21:46:23", "remaining_time": "3 days, 2:20:14", "throughput": 2724.62, "total_tokens": 919786112} {"current_steps": 5096, "total_steps": 9134, "loss": 0.6233, "learning_rate": 2.0476384312389914e-05, "epoch": 0.5578696734995484, "percentage": 55.79, "elapsed_time": "3 days, 21:47:31", "remaining_time": "3 days, 2:19:10", "throughput": 2724.65, "total_tokens": 919982112} {"current_steps": 5097, "total_steps": 9134, "loss": 0.6873, "learning_rate": 2.04679278928042e-05, "epoch": 0.5579791455704863, "percentage": 55.8, "elapsed_time": "3 days, 21:48:37", "remaining_time": "3 days, 2:18:03", "throughput": 2724.64, "total_tokens": 920157952} {"current_steps": 5098, "total_steps": 9134, "loss": 0.8741, "learning_rate": 2.0459472009353957e-05, "epoch": 0.5580886176414243, "percentage": 55.81, "elapsed_time": "3 days, 21:49:46", "remaining_time": "3 days, 2:16:59", "throughput": 2724.69, "total_tokens": 920362016} {"current_steps": 5099, "total_steps": 9134, "loss": 0.8312, "learning_rate": 2.0451016663039503e-05, "epoch": 0.5581980897123622, "percentage": 55.82, "elapsed_time": "3 days, 21:50:51", "remaining_time": "3 days, 2:15:52", "throughput": 2724.72, "total_tokens": 920548608} {"current_steps": 5100, "total_steps": 9134, "loss": 0.6009, "learning_rate": 2.0442561854861076e-05, "epoch": 0.5583075617833, "percentage": 55.84, "elapsed_time": "3 days, 21:51:53", "remaining_time": "3 days, 2:14:43", "throughput": 2724.71, "total_tokens": 920718400} {"current_steps": 5101, "total_steps": 9134, "loss": 0.7294, "learning_rate": 2.043410758581887e-05, "epoch": 0.5584170338542379, "percentage": 55.85, "elapsed_time": "3 days, 21:52:59", "remaining_time": "3 days, 2:13:36", "throughput": 2724.73, "total_tokens": 920903648} {"current_steps": 5102, "total_steps": 9134, "loss": 0.5218, "learning_rate": 2.042565385691301e-05, "epoch": 0.5585265059251758, "percentage": 55.86, "elapsed_time": "3 days, 21:54:01", "remaining_time": "3 days, 2:12:27", "throughput": 2724.66, "total_tokens": 921050144} {"current_steps": 5103, "total_steps": 9134, "loss": 0.7643, "learning_rate": 2.041720066914355e-05, "epoch": 0.5586359779961138, "percentage": 55.87, "elapsed_time": "3 days, 21:55:11", "remaining_time": "3 days, 2:11:23", "throughput": 2724.68, "total_tokens": 921245696} {"current_steps": 5104, "total_steps": 9134, "loss": 0.7074, "learning_rate": 2.040874802351049e-05, "epoch": 0.5587454500670517, "percentage": 55.88, "elapsed_time": "3 days, 21:56:17", "remaining_time": "3 days, 2:10:17", "throughput": 2724.69, "total_tokens": 921428704} {"current_steps": 5105, "total_steps": 9134, "loss": 0.8414, "learning_rate": 2.040029592101376e-05, "epoch": 0.5588549221379896, "percentage": 55.89, "elapsed_time": "3 days, 21:57:26", "remaining_time": "3 days, 2:09:12", "throughput": 2724.67, "total_tokens": 921607904} {"current_steps": 5106, "total_steps": 9134, "loss": 0.8857, "learning_rate": 2.039184436265324e-05, "epoch": 0.5589643942089274, "percentage": 55.9, "elapsed_time": "3 days, 21:58:33", "remaining_time": "3 days, 2:08:07", "throughput": 2724.7, "total_tokens": 921800768} {"current_steps": 5107, "total_steps": 9134, "loss": 0.7862, "learning_rate": 2.038339334942871e-05, "epoch": 0.5590738662798653, "percentage": 55.91, "elapsed_time": "3 days, 21:59:37", "remaining_time": "3 days, 2:06:59", "throughput": 2724.65, "total_tokens": 921958464} {"current_steps": 5108, "total_steps": 9134, "loss": 0.882, "learning_rate": 2.0374942882339935e-05, "epoch": 0.5591833383508032, "percentage": 55.92, "elapsed_time": "3 days, 22:00:43", "remaining_time": "3 days, 2:05:52", "throughput": 2724.64, "total_tokens": 922137664} {"current_steps": 5109, "total_steps": 9134, "loss": 0.6233, "learning_rate": 2.0366492962386563e-05, "epoch": 0.5592928104217412, "percentage": 55.93, "elapsed_time": "3 days, 22:01:52", "remaining_time": "3 days, 2:04:48", "throughput": 2724.7, "total_tokens": 922345312} {"current_steps": 5110, "total_steps": 9134, "loss": 0.6916, "learning_rate": 2.0358043590568215e-05, "epoch": 0.5594022824926791, "percentage": 55.94, "elapsed_time": "3 days, 22:02:58", "remaining_time": "3 days, 2:03:42", "throughput": 2724.72, "total_tokens": 922530560} {"current_steps": 5111, "total_steps": 9134, "loss": 0.6966, "learning_rate": 2.034959476788445e-05, "epoch": 0.5595117545636169, "percentage": 55.96, "elapsed_time": "3 days, 22:04:02", "remaining_time": "3 days, 2:02:34", "throughput": 2724.68, "total_tokens": 922694752} {"current_steps": 5112, "total_steps": 9134, "loss": 0.9519, "learning_rate": 2.034114649533472e-05, "epoch": 0.5596212266345548, "percentage": 55.97, "elapsed_time": "3 days, 22:05:08", "remaining_time": "3 days, 2:01:28", "throughput": 2724.73, "total_tokens": 922889632} {"current_steps": 5113, "total_steps": 9134, "loss": 0.7289, "learning_rate": 2.033269877391846e-05, "epoch": 0.5597306987054927, "percentage": 55.98, "elapsed_time": "3 days, 22:06:16", "remaining_time": "3 days, 2:00:22", "throughput": 2724.76, "total_tokens": 923084736} {"current_steps": 5114, "total_steps": 9134, "loss": 0.6876, "learning_rate": 2.032425160463501e-05, "epoch": 0.5598401707764307, "percentage": 55.99, "elapsed_time": "3 days, 22:07:19", "remaining_time": "3 days, 1:59:13", "throughput": 2724.69, "total_tokens": 923232800} {"current_steps": 5115, "total_steps": 9134, "loss": 0.7089, "learning_rate": 2.0315804988483665e-05, "epoch": 0.5599496428473686, "percentage": 56.0, "elapsed_time": "3 days, 22:08:21", "remaining_time": "3 days, 1:58:04", "throughput": 2724.66, "total_tokens": 923392288} {"current_steps": 5116, "total_steps": 9134, "loss": 0.5511, "learning_rate": 2.030735892646362e-05, "epoch": 0.5600591149183065, "percentage": 56.01, "elapsed_time": "3 days, 22:09:27", "remaining_time": "3 days, 1:56:58", "throughput": 2724.61, "total_tokens": 923554240} {"current_steps": 5117, "total_steps": 9134, "loss": 0.9287, "learning_rate": 2.029891341957405e-05, "epoch": 0.5601685869892443, "percentage": 56.02, "elapsed_time": "3 days, 22:10:30", "remaining_time": "3 days, 1:55:48", "throughput": 2724.58, "total_tokens": 923715296} {"current_steps": 5118, "total_steps": 9134, "loss": 0.8578, "learning_rate": 2.0290468468814045e-05, "epoch": 0.5602780590601822, "percentage": 56.03, "elapsed_time": "3 days, 22:11:35", "remaining_time": "3 days, 1:54:41", "throughput": 2724.59, "total_tokens": 923896736} {"current_steps": 5119, "total_steps": 9134, "loss": 0.7242, "learning_rate": 2.0282024075182603e-05, "epoch": 0.5603875311311202, "percentage": 56.04, "elapsed_time": "3 days, 22:12:41", "remaining_time": "3 days, 1:53:35", "throughput": 2724.58, "total_tokens": 924071680} {"current_steps": 5120, "total_steps": 9134, "loss": 0.6784, "learning_rate": 2.0273580239678706e-05, "epoch": 0.5604970032020581, "percentage": 56.05, "elapsed_time": "3 days, 22:13:48", "remaining_time": "3 days, 1:52:29", "throughput": 2724.55, "total_tokens": 924244608} {"current_steps": 5121, "total_steps": 9134, "loss": 0.7525, "learning_rate": 2.0265136963301225e-05, "epoch": 0.560606475272996, "percentage": 56.07, "elapsed_time": "3 days, 22:14:53", "remaining_time": "3 days, 1:51:22", "throughput": 2724.5, "total_tokens": 924404544} {"current_steps": 5122, "total_steps": 9134, "loss": 0.72, "learning_rate": 2.025669424704899e-05, "epoch": 0.5607159473439339, "percentage": 56.08, "elapsed_time": "3 days, 22:16:00", "remaining_time": "3 days, 1:50:16", "throughput": 2724.47, "total_tokens": 924576800} {"current_steps": 5123, "total_steps": 9134, "loss": 0.6505, "learning_rate": 2.0248252091920757e-05, "epoch": 0.5608254194148717, "percentage": 56.09, "elapsed_time": "3 days, 22:17:09", "remaining_time": "3 days, 1:49:12", "throughput": 2724.5, "total_tokens": 924776608} {"current_steps": 5124, "total_steps": 9134, "loss": 0.6875, "learning_rate": 2.0239810498915213e-05, "epoch": 0.5609348914858097, "percentage": 56.1, "elapsed_time": "3 days, 22:18:12", "remaining_time": "3 days, 1:48:04", "throughput": 2724.43, "total_tokens": 924922880} {"current_steps": 5125, "total_steps": 9134, "loss": 0.6832, "learning_rate": 2.0231369469030996e-05, "epoch": 0.5610443635567476, "percentage": 56.11, "elapsed_time": "3 days, 22:19:20", "remaining_time": "3 days, 1:46:59", "throughput": 2724.44, "total_tokens": 925113280} {"current_steps": 5126, "total_steps": 9134, "loss": 0.6811, "learning_rate": 2.0222929003266645e-05, "epoch": 0.5611538356276855, "percentage": 56.12, "elapsed_time": "3 days, 22:20:27", "remaining_time": "3 days, 1:45:53", "throughput": 2724.45, "total_tokens": 925296064} {"current_steps": 5127, "total_steps": 9134, "loss": 0.6185, "learning_rate": 2.0214489102620675e-05, "epoch": 0.5612633076986234, "percentage": 56.13, "elapsed_time": "3 days, 22:21:33", "remaining_time": "3 days, 1:44:47", "throughput": 2724.46, "total_tokens": 925482656} {"current_steps": 5128, "total_steps": 9134, "loss": 0.8353, "learning_rate": 2.0206049768091482e-05, "epoch": 0.5613727797695612, "percentage": 56.14, "elapsed_time": "3 days, 22:22:39", "remaining_time": "3 days, 1:43:40", "throughput": 2724.44, "total_tokens": 925655136} {"current_steps": 5129, "total_steps": 9134, "loss": 0.8278, "learning_rate": 2.019761100067745e-05, "epoch": 0.5614822518404992, "percentage": 56.15, "elapsed_time": "3 days, 22:23:49", "remaining_time": "3 days, 1:42:37", "throughput": 2724.42, "total_tokens": 925840384} {"current_steps": 5130, "total_steps": 9134, "loss": 0.6623, "learning_rate": 2.0189172801376845e-05, "epoch": 0.5615917239114371, "percentage": 56.16, "elapsed_time": "3 days, 22:24:59", "remaining_time": "3 days, 1:41:33", "throughput": 2724.46, "total_tokens": 926042656} {"current_steps": 5131, "total_steps": 9134, "loss": 0.7527, "learning_rate": 2.01807351711879e-05, "epoch": 0.561701195982375, "percentage": 56.17, "elapsed_time": "3 days, 22:26:07", "remaining_time": "3 days, 1:40:29", "throughput": 2724.52, "total_tokens": 926250080} {"current_steps": 5132, "total_steps": 9134, "loss": 0.6741, "learning_rate": 2.0172298111108782e-05, "epoch": 0.5618106680533129, "percentage": 56.19, "elapsed_time": "3 days, 22:27:14", "remaining_time": "3 days, 1:39:23", "throughput": 2724.54, "total_tokens": 926436000} {"current_steps": 5133, "total_steps": 9134, "loss": 0.657, "learning_rate": 2.016386162213756e-05, "epoch": 0.5619201401242508, "percentage": 56.2, "elapsed_time": "3 days, 22:28:20", "remaining_time": "3 days, 1:38:17", "throughput": 2724.59, "total_tokens": 926636928} {"current_steps": 5134, "total_steps": 9134, "loss": 0.8948, "learning_rate": 2.0155425705272268e-05, "epoch": 0.5620296121951887, "percentage": 56.21, "elapsed_time": "3 days, 22:29:27", "remaining_time": "3 days, 1:37:11", "throughput": 2724.62, "total_tokens": 926828672} {"current_steps": 5135, "total_steps": 9134, "loss": 0.6581, "learning_rate": 2.0146990361510844e-05, "epoch": 0.5621390842661266, "percentage": 56.22, "elapsed_time": "3 days, 22:30:30", "remaining_time": "3 days, 1:36:02", "throughput": 2724.6, "total_tokens": 926991520} {"current_steps": 5136, "total_steps": 9134, "loss": 0.7163, "learning_rate": 2.0138555591851198e-05, "epoch": 0.5622485563370645, "percentage": 56.23, "elapsed_time": "3 days, 22:31:37", "remaining_time": "3 days, 1:34:56", "throughput": 2724.55, "total_tokens": 927157056} {"current_steps": 5137, "total_steps": 9134, "loss": 0.7373, "learning_rate": 2.013012139729112e-05, "epoch": 0.5623580284080024, "percentage": 56.24, "elapsed_time": "3 days, 22:32:44", "remaining_time": "3 days, 1:33:51", "throughput": 2724.58, "total_tokens": 927351040} {"current_steps": 5138, "total_steps": 9134, "loss": 0.7935, "learning_rate": 2.0121687778828372e-05, "epoch": 0.5624675004789403, "percentage": 56.25, "elapsed_time": "3 days, 22:33:53", "remaining_time": "3 days, 1:32:46", "throughput": 2724.63, "total_tokens": 927555104} {"current_steps": 5139, "total_steps": 9134, "loss": 0.7021, "learning_rate": 2.0113254737460643e-05, "epoch": 0.5625769725498783, "percentage": 56.26, "elapsed_time": "3 days, 22:34:55", "remaining_time": "3 days, 1:31:37", "throughput": 2724.53, "total_tokens": 927690176} {"current_steps": 5140, "total_steps": 9134, "loss": 0.7872, "learning_rate": 2.0104822274185525e-05, "epoch": 0.5626864446208161, "percentage": 56.27, "elapsed_time": "3 days, 22:35:59", "remaining_time": "3 days, 1:30:29", "throughput": 2724.51, "total_tokens": 927858400} {"current_steps": 5141, "total_steps": 9134, "loss": 0.7356, "learning_rate": 2.009639039000059e-05, "epoch": 0.562795916691754, "percentage": 56.28, "elapsed_time": "3 days, 22:37:04", "remaining_time": "3 days, 1:29:22", "throughput": 2724.5, "total_tokens": 928032000} {"current_steps": 5142, "total_steps": 9134, "loss": 0.6888, "learning_rate": 2.0087959085903282e-05, "epoch": 0.5629053887626919, "percentage": 56.3, "elapsed_time": "3 days, 22:38:12", "remaining_time": "3 days, 1:28:17", "throughput": 2724.51, "total_tokens": 928218816} {"current_steps": 5143, "total_steps": 9134, "loss": 0.8143, "learning_rate": 2.0079528362891032e-05, "epoch": 0.5630148608336298, "percentage": 56.31, "elapsed_time": "3 days, 22:39:19", "remaining_time": "3 days, 1:27:11", "throughput": 2724.53, "total_tokens": 928408096} {"current_steps": 5144, "total_steps": 9134, "loss": 0.8208, "learning_rate": 2.0071098221961168e-05, "epoch": 0.5631243329045678, "percentage": 56.32, "elapsed_time": "3 days, 22:40:26", "remaining_time": "3 days, 1:26:06", "throughput": 2724.58, "total_tokens": 928609472} {"current_steps": 5145, "total_steps": 9134, "loss": 0.7201, "learning_rate": 2.0062668664110957e-05, "epoch": 0.5632338049755056, "percentage": 56.33, "elapsed_time": "3 days, 22:41:36", "remaining_time": "3 days, 1:25:02", "throughput": 2724.65, "total_tokens": 928823168} {"current_steps": 5146, "total_steps": 9134, "loss": 0.5968, "learning_rate": 2.005423969033761e-05, "epoch": 0.5633432770464435, "percentage": 56.34, "elapsed_time": "3 days, 22:42:38", "remaining_time": "3 days, 1:23:52", "throughput": 2724.62, "total_tokens": 928981536} {"current_steps": 5147, "total_steps": 9134, "loss": 0.6834, "learning_rate": 2.004581130163825e-05, "epoch": 0.5634527491173814, "percentage": 56.35, "elapsed_time": "3 days, 22:43:46", "remaining_time": "3 days, 1:22:48", "throughput": 2724.63, "total_tokens": 929173280} {"current_steps": 5148, "total_steps": 9134, "loss": 0.6464, "learning_rate": 2.0037383499009948e-05, "epoch": 0.5635622211883193, "percentage": 56.36, "elapsed_time": "3 days, 22:44:51", "remaining_time": "3 days, 1:21:40", "throughput": 2724.61, "total_tokens": 929341952} {"current_steps": 5149, "total_steps": 9134, "loss": 0.6408, "learning_rate": 2.0028956283449686e-05, "epoch": 0.5636716932592573, "percentage": 56.37, "elapsed_time": "3 days, 22:46:00", "remaining_time": "3 days, 1:20:36", "throughput": 2724.66, "total_tokens": 929548256} {"current_steps": 5150, "total_steps": 9134, "loss": 0.91, "learning_rate": 2.00205296559544e-05, "epoch": 0.5637811653301952, "percentage": 56.38, "elapsed_time": "3 days, 22:47:09", "remaining_time": "3 days, 1:19:32", "throughput": 2724.72, "total_tokens": 929753216} {"current_steps": 5151, "total_steps": 9134, "loss": 0.525, "learning_rate": 2.0012103617520926e-05, "epoch": 0.563890637401133, "percentage": 56.39, "elapsed_time": "3 days, 22:48:13", "remaining_time": "3 days, 1:18:24", "throughput": 2724.65, "total_tokens": 929905984} {"current_steps": 5152, "total_steps": 9134, "loss": 0.6845, "learning_rate": 2.000367816914606e-05, "epoch": 0.5640001094720709, "percentage": 56.4, "elapsed_time": "3 days, 22:49:17", "remaining_time": "3 days, 1:17:16", "throughput": 2724.6, "total_tokens": 930061216} {"current_steps": 5153, "total_steps": 9134, "loss": 0.5558, "learning_rate": 1.9995253311826526e-05, "epoch": 0.5641095815430088, "percentage": 56.42, "elapsed_time": "3 days, 22:50:26", "remaining_time": "3 days, 1:16:12", "throughput": 2724.69, "total_tokens": 930281184} {"current_steps": 5154, "total_steps": 9134, "loss": 0.56, "learning_rate": 1.9986829046558944e-05, "epoch": 0.5642190536139468, "percentage": 56.43, "elapsed_time": "3 days, 22:51:30", "remaining_time": "3 days, 1:15:04", "throughput": 2724.71, "total_tokens": 930460832} {"current_steps": 5155, "total_steps": 9134, "loss": 0.9095, "learning_rate": 1.997840537433991e-05, "epoch": 0.5643285256848847, "percentage": 56.44, "elapsed_time": "3 days, 22:52:39", "remaining_time": "3 days, 1:14:00", "throughput": 2724.74, "total_tokens": 930661088} {"current_steps": 5156, "total_steps": 9134, "loss": 0.5955, "learning_rate": 1.9969982296165915e-05, "epoch": 0.5644379977558226, "percentage": 56.45, "elapsed_time": "3 days, 22:53:47", "remaining_time": "3 days, 1:12:55", "throughput": 2724.73, "total_tokens": 930841856} {"current_steps": 5157, "total_steps": 9134, "loss": 0.639, "learning_rate": 1.996155981303341e-05, "epoch": 0.5645474698267604, "percentage": 56.46, "elapsed_time": "3 days, 22:54:48", "remaining_time": "3 days, 1:11:44", "throughput": 2724.69, "total_tokens": 930995520} {"current_steps": 5158, "total_steps": 9134, "loss": 0.6926, "learning_rate": 1.9953137925938737e-05, "epoch": 0.5646569418976983, "percentage": 56.47, "elapsed_time": "3 days, 22:55:53", "remaining_time": "3 days, 1:10:38", "throughput": 2724.71, "total_tokens": 931182112} {"current_steps": 5159, "total_steps": 9134, "loss": 0.7113, "learning_rate": 1.9944716635878197e-05, "epoch": 0.5647664139686362, "percentage": 56.48, "elapsed_time": "3 days, 22:56:58", "remaining_time": "3 days, 1:09:30", "throughput": 2724.68, "total_tokens": 931346752} {"current_steps": 5160, "total_steps": 9134, "loss": 0.6718, "learning_rate": 1.9936295943848028e-05, "epoch": 0.5648758860395742, "percentage": 56.49, "elapsed_time": "3 days, 22:58:04", "remaining_time": "3 days, 1:08:23", "throughput": 2724.64, "total_tokens": 931512064} {"current_steps": 5161, "total_steps": 9134, "loss": 0.6866, "learning_rate": 1.9927875850844356e-05, "epoch": 0.5649853581105121, "percentage": 56.5, "elapsed_time": "3 days, 22:59:12", "remaining_time": "3 days, 1:07:19", "throughput": 2724.61, "total_tokens": 931686784} {"current_steps": 5162, "total_steps": 9134, "loss": 0.6033, "learning_rate": 1.9919456357863286e-05, "epoch": 0.5650948301814499, "percentage": 56.51, "elapsed_time": "3 days, 23:00:13", "remaining_time": "3 days, 1:06:08", "throughput": 2724.56, "total_tokens": 931836640} {"current_steps": 5163, "total_steps": 9134, "loss": 0.6833, "learning_rate": 1.9911037465900807e-05, "epoch": 0.5652043022523878, "percentage": 56.53, "elapsed_time": "3 days, 23:01:14", "remaining_time": "3 days, 1:04:58", "throughput": 2724.55, "total_tokens": 932000608} {"current_steps": 5164, "total_steps": 9134, "loss": 0.7289, "learning_rate": 1.990261917595287e-05, "epoch": 0.5653137743233257, "percentage": 56.54, "elapsed_time": "3 days, 23:02:22", "remaining_time": "3 days, 1:03:53", "throughput": 2724.54, "total_tokens": 932180928} {"current_steps": 5165, "total_steps": 9134, "loss": 0.6289, "learning_rate": 1.9894201489015342e-05, "epoch": 0.5654232463942637, "percentage": 56.55, "elapsed_time": "3 days, 23:03:27", "remaining_time": "3 days, 1:02:46", "throughput": 2724.51, "total_tokens": 932348480} {"current_steps": 5166, "total_steps": 9134, "loss": 0.7782, "learning_rate": 1.9885784406084012e-05, "epoch": 0.5655327184652016, "percentage": 56.56, "elapsed_time": "3 days, 23:04:36", "remaining_time": "3 days, 1:01:42", "throughput": 2724.54, "total_tokens": 932545824} {"current_steps": 5167, "total_steps": 9134, "loss": 0.8401, "learning_rate": 1.9877367928154618e-05, "epoch": 0.5656421905361395, "percentage": 56.57, "elapsed_time": "3 days, 23:05:46", "remaining_time": "3 days, 1:00:38", "throughput": 2724.61, "total_tokens": 932760192} {"current_steps": 5168, "total_steps": 9134, "loss": 0.6959, "learning_rate": 1.9868952056222795e-05, "epoch": 0.5657516626070773, "percentage": 56.58, "elapsed_time": "3 days, 23:06:51", "remaining_time": "3 days, 0:59:31", "throughput": 2724.64, "total_tokens": 932947456} {"current_steps": 5169, "total_steps": 9134, "loss": 0.7142, "learning_rate": 1.9860536791284148e-05, "epoch": 0.5658611346780152, "percentage": 56.59, "elapsed_time": "3 days, 23:07:57", "remaining_time": "3 days, 0:58:25", "throughput": 2724.64, "total_tokens": 933128896} {"current_steps": 5170, "total_steps": 9134, "loss": 0.7648, "learning_rate": 1.985212213433416e-05, "epoch": 0.5659706067489532, "percentage": 56.6, "elapsed_time": "3 days, 23:09:07", "remaining_time": "3 days, 0:57:21", "throughput": 2724.69, "total_tokens": 933336768} {"current_steps": 5171, "total_steps": 9134, "loss": 0.7751, "learning_rate": 1.9843708086368287e-05, "epoch": 0.5660800788198911, "percentage": 56.61, "elapsed_time": "3 days, 23:10:13", "remaining_time": "3 days, 0:56:15", "throughput": 2724.72, "total_tokens": 933525376} {"current_steps": 5172, "total_steps": 9134, "loss": 0.8413, "learning_rate": 1.9835294648381898e-05, "epoch": 0.566189550890829, "percentage": 56.62, "elapsed_time": "3 days, 23:11:21", "remaining_time": "3 days, 0:55:10", "throughput": 2724.73, "total_tokens": 933713536} {"current_steps": 5173, "total_steps": 9134, "loss": 0.7625, "learning_rate": 1.9826881821370268e-05, "epoch": 0.5662990229617669, "percentage": 56.63, "elapsed_time": "3 days, 23:12:27", "remaining_time": "3 days, 0:54:04", "throughput": 2724.74, "total_tokens": 933899904} {"current_steps": 5174, "total_steps": 9134, "loss": 0.7137, "learning_rate": 1.9818469606328642e-05, "epoch": 0.5664084950327047, "percentage": 56.65, "elapsed_time": "3 days, 23:13:33", "remaining_time": "3 days, 0:52:57", "throughput": 2724.71, "total_tokens": 934067008} {"current_steps": 5175, "total_steps": 9134, "loss": 0.749, "learning_rate": 1.9810058004252146e-05, "epoch": 0.5665179671036427, "percentage": 56.66, "elapsed_time": "3 days, 23:14:41", "remaining_time": "3 days, 0:51:52", "throughput": 2724.67, "total_tokens": 934240384} {"current_steps": 5176, "total_steps": 9134, "loss": 0.8713, "learning_rate": 1.9801647016135868e-05, "epoch": 0.5666274391745806, "percentage": 56.67, "elapsed_time": "3 days, 23:15:44", "remaining_time": "3 days, 0:50:44", "throughput": 2724.63, "total_tokens": 934399200} {"current_steps": 5177, "total_steps": 9134, "loss": 0.8931, "learning_rate": 1.9793236642974806e-05, "epoch": 0.5667369112455185, "percentage": 56.68, "elapsed_time": "3 days, 23:16:54", "remaining_time": "3 days, 0:49:40", "throughput": 2724.62, "total_tokens": 934586240} {"current_steps": 5178, "total_steps": 9134, "loss": 0.5831, "learning_rate": 1.9784826885763903e-05, "epoch": 0.5668463833164564, "percentage": 56.69, "elapsed_time": "3 days, 23:18:01", "remaining_time": "3 days, 0:48:34", "throughput": 2724.65, "total_tokens": 934777088} {"current_steps": 5179, "total_steps": 9134, "loss": 0.6634, "learning_rate": 1.977641774549801e-05, "epoch": 0.5669558553873942, "percentage": 56.7, "elapsed_time": "3 days, 23:19:06", "remaining_time": "3 days, 0:47:27", "throughput": 2724.58, "total_tokens": 934931872} {"current_steps": 5180, "total_steps": 9134, "loss": 0.813, "learning_rate": 1.9768009223171907e-05, "epoch": 0.5670653274583322, "percentage": 56.71, "elapsed_time": "3 days, 23:20:10", "remaining_time": "3 days, 0:46:19", "throughput": 2724.59, "total_tokens": 935108384} {"current_steps": 5181, "total_steps": 9134, "loss": 0.5376, "learning_rate": 1.9759601319780317e-05, "epoch": 0.5671747995292701, "percentage": 56.72, "elapsed_time": "3 days, 23:21:10", "remaining_time": "3 days, 0:45:08", "throughput": 2724.53, "total_tokens": 935251744} {"current_steps": 5182, "total_steps": 9134, "loss": 0.6096, "learning_rate": 1.9751194036317868e-05, "epoch": 0.567284271600208, "percentage": 56.73, "elapsed_time": "3 days, 23:22:13", "remaining_time": "3 days, 0:44:00", "throughput": 2724.49, "total_tokens": 935409888} {"current_steps": 5183, "total_steps": 9134, "loss": 0.7021, "learning_rate": 1.9742787373779137e-05, "epoch": 0.5673937436711459, "percentage": 56.74, "elapsed_time": "3 days, 23:23:23", "remaining_time": "3 days, 0:42:56", "throughput": 2724.5, "total_tokens": 935602752} {"current_steps": 5184, "total_steps": 9134, "loss": 0.8124, "learning_rate": 1.9734381333158604e-05, "epoch": 0.5675032157420838, "percentage": 56.75, "elapsed_time": "3 days, 23:24:28", "remaining_time": "3 days, 0:41:49", "throughput": 2724.49, "total_tokens": 935778368} {"current_steps": 5185, "total_steps": 9134, "loss": 0.7234, "learning_rate": 1.9725975915450687e-05, "epoch": 0.5676126878130217, "percentage": 56.77, "elapsed_time": "3 days, 23:25:32", "remaining_time": "3 days, 0:40:41", "throughput": 2724.49, "total_tokens": 935953312} {"current_steps": 5186, "total_steps": 9134, "loss": 0.8517, "learning_rate": 1.971757112164975e-05, "epoch": 0.5677221598839596, "percentage": 56.78, "elapsed_time": "3 days, 23:26:41", "remaining_time": "3 days, 0:39:36", "throughput": 2724.49, "total_tokens": 936139456} {"current_steps": 5187, "total_steps": 9134, "loss": 0.5732, "learning_rate": 1.970916695275004e-05, "epoch": 0.5678316319548975, "percentage": 56.79, "elapsed_time": "3 days, 23:27:43", "remaining_time": "3 days, 0:38:27", "throughput": 2724.49, "total_tokens": 936308128} {"current_steps": 5188, "total_steps": 9134, "loss": 0.5845, "learning_rate": 1.9700763409745773e-05, "epoch": 0.5679411040258354, "percentage": 56.8, "elapsed_time": "3 days, 23:28:40", "remaining_time": "3 days, 0:37:14", "throughput": 2724.38, "total_tokens": 936423488} {"current_steps": 5189, "total_steps": 9134, "loss": 0.6367, "learning_rate": 1.9692360493631058e-05, "epoch": 0.5680505760967733, "percentage": 56.81, "elapsed_time": "3 days, 23:29:43", "remaining_time": "3 days, 0:36:05", "throughput": 2724.36, "total_tokens": 936588800} {"current_steps": 5190, "total_steps": 9134, "loss": 0.9478, "learning_rate": 1.968395820539996e-05, "epoch": 0.5681600481677113, "percentage": 56.82, "elapsed_time": "3 days, 23:30:50", "remaining_time": "3 days, 0:35:00", "throughput": 2724.36, "total_tokens": 936772480} {"current_steps": 5191, "total_steps": 9134, "loss": 0.7164, "learning_rate": 1.967555654604643e-05, "epoch": 0.5682695202386491, "percentage": 56.83, "elapsed_time": "3 days, 23:31:57", "remaining_time": "3 days, 0:33:54", "throughput": 2724.35, "total_tokens": 936951680} {"current_steps": 5192, "total_steps": 9134, "loss": 0.7618, "learning_rate": 1.9667155516564385e-05, "epoch": 0.568378992309587, "percentage": 56.84, "elapsed_time": "3 days, 23:33:03", "remaining_time": "3 days, 0:32:47", "throughput": 2724.42, "total_tokens": 937154176} {"current_steps": 5193, "total_steps": 9134, "loss": 0.9073, "learning_rate": 1.9658755117947657e-05, "epoch": 0.5684884643805249, "percentage": 56.85, "elapsed_time": "3 days, 23:34:12", "remaining_time": "3 days, 0:31:43", "throughput": 2724.43, "total_tokens": 937346144} {"current_steps": 5194, "total_steps": 9134, "loss": 0.8494, "learning_rate": 1.965035535118998e-05, "epoch": 0.5685979364514628, "percentage": 56.86, "elapsed_time": "3 days, 23:35:20", "remaining_time": "3 days, 0:30:38", "throughput": 2724.45, "total_tokens": 937540128} {"current_steps": 5195, "total_steps": 9134, "loss": 0.866, "learning_rate": 1.9641956217285048e-05, "epoch": 0.5687074085224008, "percentage": 56.88, "elapsed_time": "3 days, 23:36:28", "remaining_time": "3 days, 0:29:33", "throughput": 2724.43, "total_tokens": 937719328} {"current_steps": 5196, "total_steps": 9134, "loss": 0.8548, "learning_rate": 1.9633557717226443e-05, "epoch": 0.5688168805933386, "percentage": 56.89, "elapsed_time": "3 days, 23:37:34", "remaining_time": "3 days, 0:28:27", "throughput": 2724.41, "total_tokens": 937892256} {"current_steps": 5197, "total_steps": 9134, "loss": 0.6422, "learning_rate": 1.96251598520077e-05, "epoch": 0.5689263526642765, "percentage": 56.9, "elapsed_time": "3 days, 23:38:42", "remaining_time": "3 days, 0:27:21", "throughput": 2724.43, "total_tokens": 938082208} {"current_steps": 5198, "total_steps": 9134, "loss": 0.7881, "learning_rate": 1.9616762622622272e-05, "epoch": 0.5690358247352144, "percentage": 56.91, "elapsed_time": "3 days, 23:39:50", "remaining_time": "3 days, 0:26:17", "throughput": 2724.5, "total_tokens": 938291648} {"current_steps": 5199, "total_steps": 9134, "loss": 0.8533, "learning_rate": 1.960836603006354e-05, "epoch": 0.5691452968061523, "percentage": 56.92, "elapsed_time": "3 days, 23:40:55", "remaining_time": "3 days, 0:25:10", "throughput": 2724.42, "total_tokens": 938441728} {"current_steps": 5200, "total_steps": 9134, "loss": 0.5863, "learning_rate": 1.9599970075324797e-05, "epoch": 0.5692547688770903, "percentage": 56.93, "elapsed_time": "3 days, 23:42:03", "remaining_time": "3 days, 0:24:05", "throughput": 2724.39, "total_tokens": 938616448} {"current_steps": 5201, "total_steps": 9134, "loss": 0.6881, "learning_rate": 1.959157475939927e-05, "epoch": 0.5693642409480282, "percentage": 56.94, "elapsed_time": "3 days, 23:43:09", "remaining_time": "3 days, 0:22:58", "throughput": 2724.43, "total_tokens": 938810656} {"current_steps": 5202, "total_steps": 9134, "loss": 0.7814, "learning_rate": 1.9583180083280118e-05, "epoch": 0.569473713018966, "percentage": 56.95, "elapsed_time": "3 days, 23:44:17", "remaining_time": "3 days, 0:21:53", "throughput": 2724.46, "total_tokens": 939003520} {"current_steps": 5203, "total_steps": 9134, "loss": 0.948, "learning_rate": 1.9574786047960394e-05, "epoch": 0.5695831850899039, "percentage": 56.96, "elapsed_time": "3 days, 23:45:23", "remaining_time": "3 days, 0:20:47", "throughput": 2724.47, "total_tokens": 939188992} {"current_steps": 5204, "total_steps": 9134, "loss": 0.581, "learning_rate": 1.9566392654433123e-05, "epoch": 0.5696926571608418, "percentage": 56.97, "elapsed_time": "3 days, 23:46:27", "remaining_time": "3 days, 0:19:39", "throughput": 2724.45, "total_tokens": 939354304} {"current_steps": 5205, "total_steps": 9134, "loss": 0.5946, "learning_rate": 1.95579999036912e-05, "epoch": 0.5698021292317798, "percentage": 56.98, "elapsed_time": "3 days, 23:47:32", "remaining_time": "3 days, 0:18:31", "throughput": 2724.38, "total_tokens": 939508864} {"current_steps": 5206, "total_steps": 9134, "loss": 0.8921, "learning_rate": 1.9549607796727487e-05, "epoch": 0.5699116013027177, "percentage": 57.0, "elapsed_time": "3 days, 23:48:41", "remaining_time": "3 days, 0:17:27", "throughput": 2724.4, "total_tokens": 939702400} {"current_steps": 5207, "total_steps": 9134, "loss": 0.6433, "learning_rate": 1.9541216334534764e-05, "epoch": 0.5700210733736556, "percentage": 57.01, "elapsed_time": "3 days, 23:49:45", "remaining_time": "3 days, 0:16:20", "throughput": 2724.38, "total_tokens": 939870624} {"current_steps": 5208, "total_steps": 9134, "loss": 0.6541, "learning_rate": 1.9532825518105702e-05, "epoch": 0.5701305454445934, "percentage": 57.02, "elapsed_time": "3 days, 23:50:51", "remaining_time": "3 days, 0:15:13", "throughput": 2724.34, "total_tokens": 940038848} {"current_steps": 5209, "total_steps": 9134, "loss": 0.6135, "learning_rate": 1.9524435348432933e-05, "epoch": 0.5702400175155313, "percentage": 57.03, "elapsed_time": "3 days, 23:51:59", "remaining_time": "3 days, 0:14:08", "throughput": 2724.36, "total_tokens": 940228800} {"current_steps": 5210, "total_steps": 9134, "loss": 0.6384, "learning_rate": 1.9516045826508994e-05, "epoch": 0.5703494895864692, "percentage": 57.04, "elapsed_time": "3 days, 23:53:07", "remaining_time": "3 days, 0:13:03", "throughput": 2724.31, "total_tokens": 940396576} {"current_steps": 5211, "total_steps": 9134, "loss": 0.839, "learning_rate": 1.9507656953326355e-05, "epoch": 0.5704589616574072, "percentage": 57.05, "elapsed_time": "3 days, 23:54:14", "remaining_time": "3 days, 0:11:57", "throughput": 2724.35, "total_tokens": 940591680} {"current_steps": 5212, "total_steps": 9134, "loss": 0.7935, "learning_rate": 1.949926872987739e-05, "epoch": 0.5705684337283451, "percentage": 57.06, "elapsed_time": "3 days, 23:55:18", "remaining_time": "3 days, 0:10:49", "throughput": 2724.32, "total_tokens": 940755872} {"current_steps": 5213, "total_steps": 9134, "loss": 0.7336, "learning_rate": 1.9490881157154422e-05, "epoch": 0.5706779057992829, "percentage": 57.07, "elapsed_time": "3 days, 23:56:24", "remaining_time": "3 days, 0:09:43", "throughput": 2724.32, "total_tokens": 940936864} {"current_steps": 5214, "total_steps": 9134, "loss": 0.6243, "learning_rate": 1.948249423614969e-05, "epoch": 0.5707873778702208, "percentage": 57.08, "elapsed_time": "3 days, 23:57:27", "remaining_time": "3 days, 0:08:34", "throughput": 2724.32, "total_tokens": 941108896} {"current_steps": 5215, "total_steps": 9134, "loss": 0.6991, "learning_rate": 1.9474107967855332e-05, "epoch": 0.5708968499411587, "percentage": 57.09, "elapsed_time": "3 days, 23:58:29", "remaining_time": "3 days, 0:07:25", "throughput": 2724.31, "total_tokens": 941273760} {"current_steps": 5216, "total_steps": 9134, "loss": 0.7685, "learning_rate": 1.9465722353263445e-05, "epoch": 0.5710063220120967, "percentage": 57.11, "elapsed_time": "3 days, 23:59:37", "remaining_time": "3 days, 0:06:20", "throughput": 2724.39, "total_tokens": 941485888} {"current_steps": 5217, "total_steps": 9134, "loss": 0.839, "learning_rate": 1.945733739336602e-05, "epoch": 0.5711157940830346, "percentage": 57.12, "elapsed_time": "4 days, 0:00:42", "remaining_time": "3 days, 0:05:13", "throughput": 2724.37, "total_tokens": 941657248} {"current_steps": 5218, "total_steps": 9134, "loss": 0.6621, "learning_rate": 1.9448953089154982e-05, "epoch": 0.5712252661539725, "percentage": 57.13, "elapsed_time": "4 days, 0:01:51", "remaining_time": "3 days, 0:04:09", "throughput": 2724.31, "total_tokens": 941825696} {"current_steps": 5219, "total_steps": 9134, "loss": 0.8085, "learning_rate": 1.9440569441622182e-05, "epoch": 0.5713347382249103, "percentage": 57.14, "elapsed_time": "4 days, 0:02:57", "remaining_time": "3 days, 0:03:03", "throughput": 2724.36, "total_tokens": 942024160} {"current_steps": 5220, "total_steps": 9134, "loss": 0.682, "learning_rate": 1.9432186451759397e-05, "epoch": 0.5714442102958482, "percentage": 57.15, "elapsed_time": "4 days, 0:04:06", "remaining_time": "3 days, 0:01:58", "throughput": 2724.4, "total_tokens": 942222624} {"current_steps": 5221, "total_steps": 9134, "loss": 0.6697, "learning_rate": 1.9423804120558307e-05, "epoch": 0.5715536823667862, "percentage": 57.16, "elapsed_time": "4 days, 0:05:15", "remaining_time": "3 days, 0:00:54", "throughput": 2724.49, "total_tokens": 942443264} {"current_steps": 5222, "total_steps": 9134, "loss": 0.7611, "learning_rate": 1.9415422449010523e-05, "epoch": 0.5716631544377241, "percentage": 57.17, "elapsed_time": "4 days, 0:06:25", "remaining_time": "2 days, 23:59:50", "throughput": 2724.5, "total_tokens": 942636576} {"current_steps": 5223, "total_steps": 9134, "loss": 0.7642, "learning_rate": 1.94070414381076e-05, "epoch": 0.571772626508662, "percentage": 57.18, "elapsed_time": "4 days, 0:07:29", "remaining_time": "2 days, 23:58:42", "throughput": 2724.52, "total_tokens": 942819584} {"current_steps": 5224, "total_steps": 9134, "loss": 0.6555, "learning_rate": 1.9398661088840974e-05, "epoch": 0.5718820985795999, "percentage": 57.19, "elapsed_time": "4 days, 0:08:36", "remaining_time": "2 days, 23:57:37", "throughput": 2724.54, "total_tokens": 943009536} {"current_steps": 5225, "total_steps": 9134, "loss": 0.7859, "learning_rate": 1.9390281402202043e-05, "epoch": 0.5719915706505377, "percentage": 57.2, "elapsed_time": "4 days, 0:09:45", "remaining_time": "2 days, 23:56:33", "throughput": 2724.63, "total_tokens": 943229952} {"current_steps": 5226, "total_steps": 9134, "loss": 0.6229, "learning_rate": 1.9381902379182085e-05, "epoch": 0.5721010427214757, "percentage": 57.21, "elapsed_time": "4 days, 0:10:54", "remaining_time": "2 days, 23:55:28", "throughput": 2724.61, "total_tokens": 943406912} {"current_steps": 5227, "total_steps": 9134, "loss": 0.9615, "learning_rate": 1.9373524020772337e-05, "epoch": 0.5722105147924136, "percentage": 57.23, "elapsed_time": "4 days, 0:12:03", "remaining_time": "2 days, 23:54:25", "throughput": 2724.66, "total_tokens": 943615008} {"current_steps": 5228, "total_steps": 9134, "loss": 0.8624, "learning_rate": 1.9365146327963955e-05, "epoch": 0.5723199868633515, "percentage": 57.24, "elapsed_time": "4 days, 0:13:12", "remaining_time": "2 days, 23:53:20", "throughput": 2724.7, "total_tokens": 943813472} {"current_steps": 5229, "total_steps": 9134, "loss": 0.6925, "learning_rate": 1.9356769301747972e-05, "epoch": 0.5724294589342894, "percentage": 57.25, "elapsed_time": "4 days, 0:14:19", "remaining_time": "2 days, 23:52:14", "throughput": 2724.73, "total_tokens": 944006784} {"current_steps": 5230, "total_steps": 9134, "loss": 0.61, "learning_rate": 1.9348392943115405e-05, "epoch": 0.5725389310052272, "percentage": 57.26, "elapsed_time": "4 days, 0:15:26", "remaining_time": "2 days, 23:51:08", "throughput": 2724.78, "total_tokens": 944207712} {"current_steps": 5231, "total_steps": 9134, "loss": 0.6085, "learning_rate": 1.9340017253057142e-05, "epoch": 0.5726484030761652, "percentage": 57.27, "elapsed_time": "4 days, 0:16:33", "remaining_time": "2 days, 23:50:03", "throughput": 2724.75, "total_tokens": 944378848} {"current_steps": 5232, "total_steps": 9134, "loss": 0.6213, "learning_rate": 1.933164223256403e-05, "epoch": 0.5727578751471031, "percentage": 57.28, "elapsed_time": "4 days, 0:17:40", "remaining_time": "2 days, 23:48:57", "throughput": 2724.79, "total_tokens": 944577760} {"current_steps": 5233, "total_steps": 9134, "loss": 0.6846, "learning_rate": 1.932326788262679e-05, "epoch": 0.572867347218041, "percentage": 57.29, "elapsed_time": "4 days, 0:18:44", "remaining_time": "2 days, 23:47:50", "throughput": 2724.78, "total_tokens": 944750464} {"current_steps": 5234, "total_steps": 9134, "loss": 0.7816, "learning_rate": 1.931489420423611e-05, "epoch": 0.5729768192889789, "percentage": 57.3, "elapsed_time": "4 days, 0:19:47", "remaining_time": "2 days, 23:46:41", "throughput": 2724.74, "total_tokens": 944905248} {"current_steps": 5235, "total_steps": 9134, "loss": 0.6278, "learning_rate": 1.930652119838259e-05, "epoch": 0.5730862913599168, "percentage": 57.31, "elapsed_time": "4 days, 0:20:52", "remaining_time": "2 days, 23:45:33", "throughput": 2724.75, "total_tokens": 945085344} {"current_steps": 5236, "total_steps": 9134, "loss": 0.7355, "learning_rate": 1.9298148866056716e-05, "epoch": 0.5731957634308547, "percentage": 57.32, "elapsed_time": "4 days, 0:21:57", "remaining_time": "2 days, 23:44:26", "throughput": 2724.71, "total_tokens": 945249088} {"current_steps": 5237, "total_steps": 9134, "loss": 0.7272, "learning_rate": 1.9289777208248942e-05, "epoch": 0.5733052355017926, "percentage": 57.34, "elapsed_time": "4 days, 0:23:00", "remaining_time": "2 days, 23:43:18", "throughput": 2724.62, "total_tokens": 945391552} {"current_steps": 5238, "total_steps": 9134, "loss": 0.6367, "learning_rate": 1.92814062259496e-05, "epoch": 0.5734147075727305, "percentage": 57.35, "elapsed_time": "4 days, 0:24:06", "remaining_time": "2 days, 23:42:11", "throughput": 2724.65, "total_tokens": 945579040} {"current_steps": 5239, "total_steps": 9134, "loss": 0.783, "learning_rate": 1.9273035920148966e-05, "epoch": 0.5735241796436684, "percentage": 57.36, "elapsed_time": "4 days, 0:25:06", "remaining_time": "2 days, 23:41:00", "throughput": 2724.6, "total_tokens": 945723968} {"current_steps": 5240, "total_steps": 9134, "loss": 0.7364, "learning_rate": 1.9264666291837242e-05, "epoch": 0.5736336517146063, "percentage": 57.37, "elapsed_time": "4 days, 0:26:10", "remaining_time": "2 days, 23:39:52", "throughput": 2724.59, "total_tokens": 945894656} {"current_steps": 5241, "total_steps": 9134, "loss": 0.8578, "learning_rate": 1.9256297342004527e-05, "epoch": 0.5737431237855443, "percentage": 57.38, "elapsed_time": "4 days, 0:27:18", "remaining_time": "2 days, 23:38:47", "throughput": 2724.57, "total_tokens": 946075200} {"current_steps": 5242, "total_steps": 9134, "loss": 0.9042, "learning_rate": 1.924792907164086e-05, "epoch": 0.5738525958564821, "percentage": 57.39, "elapsed_time": "4 days, 0:28:20", "remaining_time": "2 days, 23:37:38", "throughput": 2724.56, "total_tokens": 946239840} {"current_steps": 5243, "total_steps": 9134, "loss": 0.6339, "learning_rate": 1.9239561481736183e-05, "epoch": 0.57396206792742, "percentage": 57.4, "elapsed_time": "4 days, 0:29:23", "remaining_time": "2 days, 23:36:29", "throughput": 2724.55, "total_tokens": 946408512} {"current_steps": 5244, "total_steps": 9134, "loss": 0.8207, "learning_rate": 1.9231194573280383e-05, "epoch": 0.5740715399983579, "percentage": 57.41, "elapsed_time": "4 days, 0:30:32", "remaining_time": "2 days, 23:35:25", "throughput": 2724.53, "total_tokens": 946589728} {"current_steps": 5245, "total_steps": 9134, "loss": 0.6888, "learning_rate": 1.9222828347263222e-05, "epoch": 0.5741810120692958, "percentage": 57.42, "elapsed_time": "4 days, 0:31:41", "remaining_time": "2 days, 23:34:20", "throughput": 2724.58, "total_tokens": 946794688} {"current_steps": 5246, "total_steps": 9134, "loss": 0.673, "learning_rate": 1.9214462804674425e-05, "epoch": 0.5742904841402338, "percentage": 57.43, "elapsed_time": "4 days, 0:32:48", "remaining_time": "2 days, 23:33:15", "throughput": 2724.62, "total_tokens": 946992032} {"current_steps": 5247, "total_steps": 9134, "loss": 0.8339, "learning_rate": 1.9206097946503625e-05, "epoch": 0.5743999562111716, "percentage": 57.44, "elapsed_time": "4 days, 0:33:52", "remaining_time": "2 days, 23:32:07", "throughput": 2724.6, "total_tokens": 947158688} {"current_steps": 5248, "total_steps": 9134, "loss": 0.7893, "learning_rate": 1.9197733773740356e-05, "epoch": 0.5745094282821095, "percentage": 57.46, "elapsed_time": "4 days, 0:34:59", "remaining_time": "2 days, 23:31:02", "throughput": 2724.56, "total_tokens": 947330048} {"current_steps": 5249, "total_steps": 9134, "loss": 0.6079, "learning_rate": 1.91893702873741e-05, "epoch": 0.5746189003530474, "percentage": 57.47, "elapsed_time": "4 days, 0:36:04", "remaining_time": "2 days, 23:29:54", "throughput": 2724.56, "total_tokens": 947504320} {"current_steps": 5250, "total_steps": 9134, "loss": 0.7136, "learning_rate": 1.918100748839422e-05, "epoch": 0.5747283724239853, "percentage": 57.48, "elapsed_time": "4 days, 0:37:10", "remaining_time": "2 days, 23:28:48", "throughput": 2724.53, "total_tokens": 947674336} {"current_steps": 5251, "total_steps": 9134, "loss": 0.7487, "learning_rate": 1.9172645377790037e-05, "epoch": 0.5748378444949233, "percentage": 57.49, "elapsed_time": "4 days, 0:38:13", "remaining_time": "2 days, 23:27:39", "throughput": 2724.52, "total_tokens": 947841216} {"current_steps": 5252, "total_steps": 9134, "loss": 0.9854, "learning_rate": 1.916428395655076e-05, "epoch": 0.5749473165658612, "percentage": 57.5, "elapsed_time": "4 days, 0:39:16", "remaining_time": "2 days, 23:26:31", "throughput": 2724.53, "total_tokens": 948018848} {"current_steps": 5253, "total_steps": 9134, "loss": 0.7018, "learning_rate": 1.915592322566553e-05, "epoch": 0.575056788636799, "percentage": 57.51, "elapsed_time": "4 days, 0:40:21", "remaining_time": "2 days, 23:25:23", "throughput": 2724.49, "total_tokens": 948181248} {"current_steps": 5254, "total_steps": 9134, "loss": 0.8095, "learning_rate": 1.9147563186123423e-05, "epoch": 0.5751662607077369, "percentage": 57.52, "elapsed_time": "4 days, 0:41:27", "remaining_time": "2 days, 23:24:17", "throughput": 2724.49, "total_tokens": 948360672} {"current_steps": 5255, "total_steps": 9134, "loss": 0.6982, "learning_rate": 1.9139203838913394e-05, "epoch": 0.5752757327786748, "percentage": 57.53, "elapsed_time": "4 days, 0:42:36", "remaining_time": "2 days, 23:23:12", "throughput": 2724.53, "total_tokens": 948560032} {"current_steps": 5256, "total_steps": 9134, "loss": 0.7193, "learning_rate": 1.913084518502436e-05, "epoch": 0.5753852048496128, "percentage": 57.54, "elapsed_time": "4 days, 0:43:41", "remaining_time": "2 days, 23:22:05", "throughput": 2724.46, "total_tokens": 948714368} {"current_steps": 5257, "total_steps": 9134, "loss": 0.7993, "learning_rate": 1.9122487225445107e-05, "epoch": 0.5754946769205507, "percentage": 57.55, "elapsed_time": "4 days, 0:44:49", "remaining_time": "2 days, 23:21:01", "throughput": 2724.47, "total_tokens": 948903648} {"current_steps": 5258, "total_steps": 9134, "loss": 0.9461, "learning_rate": 1.911412996116439e-05, "epoch": 0.5756041489914886, "percentage": 57.57, "elapsed_time": "4 days, 0:45:58", "remaining_time": "2 days, 23:19:56", "throughput": 2724.54, "total_tokens": 949118464} {"current_steps": 5259, "total_steps": 9134, "loss": 0.8147, "learning_rate": 1.9105773393170836e-05, "epoch": 0.5757136210624264, "percentage": 57.58, "elapsed_time": "4 days, 0:47:07", "remaining_time": "2 days, 23:18:52", "throughput": 2724.53, "total_tokens": 949303712} {"current_steps": 5260, "total_steps": 9134, "loss": 0.5687, "learning_rate": 1.9097417522453023e-05, "epoch": 0.5758230931333643, "percentage": 57.59, "elapsed_time": "4 days, 0:48:16", "remaining_time": "2 days, 23:17:48", "throughput": 2724.58, "total_tokens": 949504416} {"current_steps": 5261, "total_steps": 9134, "loss": 0.6587, "learning_rate": 1.9089062349999437e-05, "epoch": 0.5759325652043022, "percentage": 57.6, "elapsed_time": "4 days, 0:49:23", "remaining_time": "2 days, 23:16:42", "throughput": 2724.6, "total_tokens": 949696608} {"current_steps": 5262, "total_steps": 9134, "loss": 0.7386, "learning_rate": 1.9080707876798475e-05, "epoch": 0.5760420372752402, "percentage": 57.61, "elapsed_time": "4 days, 0:50:24", "remaining_time": "2 days, 23:15:32", "throughput": 2724.53, "total_tokens": 949838848} {"current_steps": 5263, "total_steps": 9134, "loss": 0.5829, "learning_rate": 1.9072354103838458e-05, "epoch": 0.5761515093461781, "percentage": 57.62, "elapsed_time": "4 days, 0:51:30", "remaining_time": "2 days, 23:14:25", "throughput": 2724.5, "total_tokens": 950006848} {"current_steps": 5264, "total_steps": 9134, "loss": 0.7869, "learning_rate": 1.9064001032107612e-05, "epoch": 0.5762609814171159, "percentage": 57.63, "elapsed_time": "4 days, 0:52:39", "remaining_time": "2 days, 23:13:22", "throughput": 2724.5, "total_tokens": 950194784} {"current_steps": 5265, "total_steps": 9134, "loss": 0.6898, "learning_rate": 1.9055648662594107e-05, "epoch": 0.5763704534880538, "percentage": 57.64, "elapsed_time": "4 days, 0:53:48", "remaining_time": "2 days, 23:12:17", "throughput": 2724.48, "total_tokens": 950376224} {"current_steps": 5266, "total_steps": 9134, "loss": 0.7049, "learning_rate": 1.904729699628599e-05, "epoch": 0.5764799255589917, "percentage": 57.65, "elapsed_time": "4 days, 0:54:51", "remaining_time": "2 days, 23:11:09", "throughput": 2724.45, "total_tokens": 950536832} {"current_steps": 5267, "total_steps": 9134, "loss": 0.7944, "learning_rate": 1.9038946034171258e-05, "epoch": 0.5765893976299297, "percentage": 57.66, "elapsed_time": "4 days, 0:55:58", "remaining_time": "2 days, 23:10:02", "throughput": 2724.43, "total_tokens": 950711328} {"current_steps": 5268, "total_steps": 9134, "loss": 0.6113, "learning_rate": 1.903059577723783e-05, "epoch": 0.5766988697008676, "percentage": 57.67, "elapsed_time": "4 days, 0:57:03", "remaining_time": "2 days, 23:08:55", "throughput": 2724.38, "total_tokens": 950870816} {"current_steps": 5269, "total_steps": 9134, "loss": 0.6373, "learning_rate": 1.9022246226473494e-05, "epoch": 0.5768083417718055, "percentage": 57.69, "elapsed_time": "4 days, 0:58:06", "remaining_time": "2 days, 23:07:47", "throughput": 2724.33, "total_tokens": 951029184} {"current_steps": 5270, "total_steps": 9134, "loss": 0.6858, "learning_rate": 1.9013897382866013e-05, "epoch": 0.5769178138427433, "percentage": 57.7, "elapsed_time": "4 days, 0:59:15", "remaining_time": "2 days, 23:06:43", "throughput": 2724.31, "total_tokens": 951206816} {"current_steps": 5271, "total_steps": 9134, "loss": 0.7019, "learning_rate": 1.900554924740302e-05, "epoch": 0.5770272859136812, "percentage": 57.71, "elapsed_time": "4 days, 1:00:17", "remaining_time": "2 days, 23:05:33", "throughput": 2724.26, "total_tokens": 951358016} {"current_steps": 5272, "total_steps": 9134, "loss": 0.6708, "learning_rate": 1.8997201821072097e-05, "epoch": 0.5771367579846192, "percentage": 57.72, "elapsed_time": "4 days, 1:01:22", "remaining_time": "2 days, 23:04:26", "throughput": 2724.25, "total_tokens": 951534528} {"current_steps": 5273, "total_steps": 9134, "loss": 0.9943, "learning_rate": 1.8988855104860718e-05, "epoch": 0.5772462300555571, "percentage": 57.73, "elapsed_time": "4 days, 1:02:28", "remaining_time": "2 days, 23:03:20", "throughput": 2724.23, "total_tokens": 951704320} {"current_steps": 5274, "total_steps": 9134, "loss": 0.783, "learning_rate": 1.8980509099756287e-05, "epoch": 0.577355702126495, "percentage": 57.74, "elapsed_time": "4 days, 1:03:34", "remaining_time": "2 days, 23:02:14", "throughput": 2724.26, "total_tokens": 951898752} {"current_steps": 5275, "total_steps": 9134, "loss": 0.7669, "learning_rate": 1.8972163806746132e-05, "epoch": 0.5774651741974329, "percentage": 57.75, "elapsed_time": "4 days, 1:04:42", "remaining_time": "2 days, 23:01:08", "throughput": 2724.32, "total_tokens": 952101920} {"current_steps": 5276, "total_steps": 9134, "loss": 0.5525, "learning_rate": 1.8963819226817468e-05, "epoch": 0.5775746462683707, "percentage": 57.76, "elapsed_time": "4 days, 1:05:52", "remaining_time": "2 days, 23:00:05", "throughput": 2724.36, "total_tokens": 952306880} {"current_steps": 5277, "total_steps": 9134, "loss": 0.5393, "learning_rate": 1.895547536095746e-05, "epoch": 0.5776841183393087, "percentage": 57.77, "elapsed_time": "4 days, 1:06:58", "remaining_time": "2 days, 22:58:58", "throughput": 2724.34, "total_tokens": 952478464} {"current_steps": 5278, "total_steps": 9134, "loss": 0.8122, "learning_rate": 1.8947132210153144e-05, "epoch": 0.5777935904102466, "percentage": 57.78, "elapsed_time": "4 days, 1:08:04", "remaining_time": "2 days, 22:57:52", "throughput": 2724.3, "total_tokens": 952644672} {"current_steps": 5279, "total_steps": 9134, "loss": 0.6977, "learning_rate": 1.8938789775391536e-05, "epoch": 0.5779030624811845, "percentage": 57.8, "elapsed_time": "4 days, 1:09:13", "remaining_time": "2 days, 22:56:48", "throughput": 2724.33, "total_tokens": 952846048} {"current_steps": 5280, "total_steps": 9134, "loss": 0.8444, "learning_rate": 1.8930448057659497e-05, "epoch": 0.5780125345521224, "percentage": 57.81, "elapsed_time": "4 days, 1:10:20", "remaining_time": "2 days, 22:55:42", "throughput": 2724.36, "total_tokens": 953036896} {"current_steps": 5281, "total_steps": 9134, "loss": 0.7312, "learning_rate": 1.892210705794385e-05, "epoch": 0.5781220066230603, "percentage": 57.82, "elapsed_time": "4 days, 1:11:23", "remaining_time": "2 days, 22:54:33", "throughput": 2724.36, "total_tokens": 953207584} {"current_steps": 5282, "total_steps": 9134, "loss": 0.7561, "learning_rate": 1.8913766777231322e-05, "epoch": 0.5782314786939982, "percentage": 57.83, "elapsed_time": "4 days, 1:12:31", "remaining_time": "2 days, 22:53:28", "throughput": 2724.4, "total_tokens": 953407616} {"current_steps": 5283, "total_steps": 9134, "loss": 0.7085, "learning_rate": 1.8905427216508554e-05, "epoch": 0.5783409507649361, "percentage": 57.84, "elapsed_time": "4 days, 1:13:32", "remaining_time": "2 days, 22:52:18", "throughput": 2724.33, "total_tokens": 953551424} {"current_steps": 5284, "total_steps": 9134, "loss": 0.7052, "learning_rate": 1.8897088376762094e-05, "epoch": 0.578450422835874, "percentage": 57.85, "elapsed_time": "4 days, 1:14:38", "remaining_time": "2 days, 22:51:12", "throughput": 2724.35, "total_tokens": 953737792} {"current_steps": 5285, "total_steps": 9134, "loss": 0.8348, "learning_rate": 1.8888750258978404e-05, "epoch": 0.5785598949068119, "percentage": 57.86, "elapsed_time": "4 days, 1:15:43", "remaining_time": "2 days, 22:50:05", "throughput": 2724.33, "total_tokens": 953907808} {"current_steps": 5286, "total_steps": 9134, "loss": 0.852, "learning_rate": 1.8880412864143886e-05, "epoch": 0.5786693669777498, "percentage": 57.87, "elapsed_time": "4 days, 1:16:52", "remaining_time": "2 days, 22:49:01", "throughput": 2724.44, "total_tokens": 954133824} {"current_steps": 5287, "total_steps": 9134, "loss": 0.6797, "learning_rate": 1.887207619324482e-05, "epoch": 0.5787788390486877, "percentage": 57.88, "elapsed_time": "4 days, 1:17:57", "remaining_time": "2 days, 22:47:53", "throughput": 2724.44, "total_tokens": 954309664} {"current_steps": 5288, "total_steps": 9134, "loss": 0.6149, "learning_rate": 1.8863740247267426e-05, "epoch": 0.5788883111196256, "percentage": 57.89, "elapsed_time": "4 days, 1:19:02", "remaining_time": "2 days, 22:46:46", "throughput": 2724.42, "total_tokens": 954479904} {"current_steps": 5289, "total_steps": 9134, "loss": 0.9868, "learning_rate": 1.8855405027197838e-05, "epoch": 0.5789977831905635, "percentage": 57.9, "elapsed_time": "4 days, 1:20:10", "remaining_time": "2 days, 22:45:41", "throughput": 2724.4, "total_tokens": 954656640} {"current_steps": 5290, "total_steps": 9134, "loss": 0.5796, "learning_rate": 1.884707053402208e-05, "epoch": 0.5791072552615014, "percentage": 57.92, "elapsed_time": "4 days, 1:21:17", "remaining_time": "2 days, 22:44:35", "throughput": 2724.4, "total_tokens": 954838976} {"current_steps": 5291, "total_steps": 9134, "loss": 0.7819, "learning_rate": 1.8838736768726125e-05, "epoch": 0.5792167273324393, "percentage": 57.93, "elapsed_time": "4 days, 1:22:21", "remaining_time": "2 days, 22:43:27", "throughput": 2724.38, "total_tokens": 955006752} {"current_steps": 5292, "total_steps": 9134, "loss": 0.9763, "learning_rate": 1.8830403732295823e-05, "epoch": 0.5793261994033773, "percentage": 57.94, "elapsed_time": "4 days, 1:23:28", "remaining_time": "2 days, 22:42:22", "throughput": 2724.4, "total_tokens": 955198048} {"current_steps": 5293, "total_steps": 9134, "loss": 0.85, "learning_rate": 1.8822071425716968e-05, "epoch": 0.5794356714743151, "percentage": 57.95, "elapsed_time": "4 days, 1:24:38", "remaining_time": "2 days, 22:41:18", "throughput": 2724.44, "total_tokens": 955400768} {"current_steps": 5294, "total_steps": 9134, "loss": 0.9957, "learning_rate": 1.881373984997525e-05, "epoch": 0.579545143545253, "percentage": 57.96, "elapsed_time": "4 days, 1:25:45", "remaining_time": "2 days, 22:40:12", "throughput": 2724.44, "total_tokens": 955584896} {"current_steps": 5295, "total_steps": 9134, "loss": 0.9051, "learning_rate": 1.880540900605628e-05, "epoch": 0.5796546156161909, "percentage": 57.97, "elapsed_time": "4 days, 1:26:50", "remaining_time": "2 days, 22:39:05", "throughput": 2724.43, "total_tokens": 955756480} {"current_steps": 5296, "total_steps": 9134, "loss": 0.7964, "learning_rate": 1.8797078894945596e-05, "epoch": 0.5797640876871288, "percentage": 57.98, "elapsed_time": "4 days, 1:27:55", "remaining_time": "2 days, 22:37:58", "throughput": 2724.4, "total_tokens": 955926272} {"current_steps": 5297, "total_steps": 9134, "loss": 0.8012, "learning_rate": 1.8788749517628606e-05, "epoch": 0.5798735597580668, "percentage": 57.99, "elapsed_time": "4 days, 1:29:01", "remaining_time": "2 days, 22:36:52", "throughput": 2724.45, "total_tokens": 956122944} {"current_steps": 5298, "total_steps": 9134, "loss": 0.6837, "learning_rate": 1.878042087509069e-05, "epoch": 0.5799830318290047, "percentage": 58.0, "elapsed_time": "4 days, 1:30:05", "remaining_time": "2 days, 22:35:44", "throughput": 2724.48, "total_tokens": 956307968} {"current_steps": 5299, "total_steps": 9134, "loss": 0.6519, "learning_rate": 1.877209296831708e-05, "epoch": 0.5800925038999425, "percentage": 58.01, "elapsed_time": "4 days, 1:31:12", "remaining_time": "2 days, 22:34:38", "throughput": 2724.48, "total_tokens": 956492544} {"current_steps": 5300, "total_steps": 9134, "loss": 0.6671, "learning_rate": 1.8763765798292966e-05, "epoch": 0.5802019759708804, "percentage": 58.02, "elapsed_time": "4 days, 1:32:20", "remaining_time": "2 days, 22:33:33", "throughput": 2724.47, "total_tokens": 956669280} {"current_steps": 5301, "total_steps": 9134, "loss": 0.71, "learning_rate": 1.8755439366003448e-05, "epoch": 0.5803114480418183, "percentage": 58.04, "elapsed_time": "4 days, 1:33:26", "remaining_time": "2 days, 22:32:27", "throughput": 2724.48, "total_tokens": 956855872} {"current_steps": 5302, "total_steps": 9134, "loss": 0.7924, "learning_rate": 1.8747113672433505e-05, "epoch": 0.5804209201127563, "percentage": 58.05, "elapsed_time": "4 days, 1:34:32", "remaining_time": "2 days, 22:31:20", "throughput": 2724.51, "total_tokens": 957044928} {"current_steps": 5303, "total_steps": 9134, "loss": 0.7529, "learning_rate": 1.8738788718568066e-05, "epoch": 0.5805303921836942, "percentage": 58.06, "elapsed_time": "4 days, 1:35:40", "remaining_time": "2 days, 22:30:15", "throughput": 2724.56, "total_tokens": 957248320} {"current_steps": 5304, "total_steps": 9134, "loss": 0.72, "learning_rate": 1.8730464505391953e-05, "epoch": 0.580639864254632, "percentage": 58.07, "elapsed_time": "4 days, 1:36:41", "remaining_time": "2 days, 22:29:05", "throughput": 2724.54, "total_tokens": 957406688} {"current_steps": 5305, "total_steps": 9134, "loss": 0.7287, "learning_rate": 1.8722141033889904e-05, "epoch": 0.5807493363255699, "percentage": 58.08, "elapsed_time": "4 days, 1:37:47", "remaining_time": "2 days, 22:27:59", "throughput": 2724.53, "total_tokens": 957584320} {"current_steps": 5306, "total_steps": 9134, "loss": 0.8282, "learning_rate": 1.8713818305046566e-05, "epoch": 0.5808588083965078, "percentage": 58.09, "elapsed_time": "4 days, 1:38:54", "remaining_time": "2 days, 22:26:53", "throughput": 2724.5, "total_tokens": 957754560} {"current_steps": 5307, "total_steps": 9134, "loss": 0.8704, "learning_rate": 1.87054963198465e-05, "epoch": 0.5809682804674458, "percentage": 58.1, "elapsed_time": "4 days, 1:40:00", "remaining_time": "2 days, 22:25:47", "throughput": 2724.52, "total_tokens": 957944064} {"current_steps": 5308, "total_steps": 9134, "loss": 0.7101, "learning_rate": 1.86971750792742e-05, "epoch": 0.5810777525383837, "percentage": 58.11, "elapsed_time": "4 days, 1:41:07", "remaining_time": "2 days, 22:24:41", "throughput": 2724.53, "total_tokens": 958129760} {"current_steps": 5309, "total_steps": 9134, "loss": 0.8386, "learning_rate": 1.8688854584314028e-05, "epoch": 0.5811872246093216, "percentage": 58.12, "elapsed_time": "4 days, 1:42:15", "remaining_time": "2 days, 22:23:36", "throughput": 2724.59, "total_tokens": 958335392} {"current_steps": 5310, "total_steps": 9134, "loss": 0.6684, "learning_rate": 1.8680534835950302e-05, "epoch": 0.5812966966802594, "percentage": 58.13, "elapsed_time": "4 days, 1:43:20", "remaining_time": "2 days, 22:22:29", "throughput": 2724.59, "total_tokens": 958512352} {"current_steps": 5311, "total_steps": 9134, "loss": 0.7258, "learning_rate": 1.8672215835167217e-05, "epoch": 0.5814061687511973, "percentage": 58.15, "elapsed_time": "4 days, 1:44:26", "remaining_time": "2 days, 22:21:22", "throughput": 2724.58, "total_tokens": 958689312} {"current_steps": 5312, "total_steps": 9134, "loss": 0.6262, "learning_rate": 1.8663897582948912e-05, "epoch": 0.5815156408221352, "percentage": 58.16, "elapsed_time": "4 days, 1:45:29", "remaining_time": "2 days, 22:20:14", "throughput": 2724.57, "total_tokens": 958854624} {"current_steps": 5313, "total_steps": 9134, "loss": 0.9159, "learning_rate": 1.86555800802794e-05, "epoch": 0.5816251128930732, "percentage": 58.17, "elapsed_time": "4 days, 1:46:34", "remaining_time": "2 days, 22:19:07", "throughput": 2724.58, "total_tokens": 959038976} {"current_steps": 5314, "total_steps": 9134, "loss": 0.7262, "learning_rate": 1.864726332814264e-05, "epoch": 0.5817345849640111, "percentage": 58.18, "elapsed_time": "4 days, 1:47:40", "remaining_time": "2 days, 22:18:00", "throughput": 2724.51, "total_tokens": 959190624} {"current_steps": 5315, "total_steps": 9134, "loss": 0.635, "learning_rate": 1.863894732752248e-05, "epoch": 0.581844057034949, "percentage": 58.19, "elapsed_time": "4 days, 1:48:45", "remaining_time": "2 days, 22:16:53", "throughput": 2724.51, "total_tokens": 959370048} {"current_steps": 5316, "total_steps": 9134, "loss": 0.5877, "learning_rate": 1.8630632079402693e-05, "epoch": 0.5819535291058868, "percentage": 58.2, "elapsed_time": "4 days, 1:49:52", "remaining_time": "2 days, 22:15:47", "throughput": 2724.48, "total_tokens": 959542304} {"current_steps": 5317, "total_steps": 9134, "loss": 0.6888, "learning_rate": 1.8622317584766962e-05, "epoch": 0.5820630011768247, "percentage": 58.21, "elapsed_time": "4 days, 1:51:00", "remaining_time": "2 days, 22:14:42", "throughput": 2724.51, "total_tokens": 959735616} {"current_steps": 5318, "total_steps": 9134, "loss": 0.682, "learning_rate": 1.861400384459886e-05, "epoch": 0.5821724732477627, "percentage": 58.22, "elapsed_time": "4 days, 1:52:06", "remaining_time": "2 days, 22:13:36", "throughput": 2724.46, "total_tokens": 959901376} {"current_steps": 5319, "total_steps": 9134, "loss": 1.0569, "learning_rate": 1.86056908598819e-05, "epoch": 0.5822819453187006, "percentage": 58.23, "elapsed_time": "4 days, 1:53:16", "remaining_time": "2 days, 22:12:32", "throughput": 2724.54, "total_tokens": 960116416} {"current_steps": 5320, "total_steps": 9134, "loss": 0.8573, "learning_rate": 1.8597378631599484e-05, "epoch": 0.5823914173896385, "percentage": 58.24, "elapsed_time": "4 days, 1:54:24", "remaining_time": "2 days, 22:11:27", "throughput": 2724.56, "total_tokens": 960311520} {"current_steps": 5321, "total_steps": 9134, "loss": 0.6862, "learning_rate": 1.8589067160734935e-05, "epoch": 0.5825008894605763, "percentage": 58.25, "elapsed_time": "4 days, 1:55:28", "remaining_time": "2 days, 22:10:19", "throughput": 2724.52, "total_tokens": 960470336} {"current_steps": 5322, "total_steps": 9134, "loss": 0.7469, "learning_rate": 1.8580756448271496e-05, "epoch": 0.5826103615315142, "percentage": 58.27, "elapsed_time": "4 days, 1:56:36", "remaining_time": "2 days, 22:09:14", "throughput": 2724.57, "total_tokens": 960672384} {"current_steps": 5323, "total_steps": 9134, "loss": 0.8786, "learning_rate": 1.8572446495192288e-05, "epoch": 0.5827198336024522, "percentage": 58.28, "elapsed_time": "4 days, 1:57:45", "remaining_time": "2 days, 22:08:10", "throughput": 2724.64, "total_tokens": 960886304} {"current_steps": 5324, "total_steps": 9134, "loss": 0.711, "learning_rate": 1.8564137302480373e-05, "epoch": 0.5828293056733901, "percentage": 58.29, "elapsed_time": "4 days, 1:58:51", "remaining_time": "2 days, 22:07:04", "throughput": 2724.66, "total_tokens": 961071776} {"current_steps": 5325, "total_steps": 9134, "loss": 0.8633, "learning_rate": 1.8555828871118715e-05, "epoch": 0.582938777744328, "percentage": 58.3, "elapsed_time": "4 days, 1:59:54", "remaining_time": "2 days, 22:05:56", "throughput": 2724.62, "total_tokens": 961231040} {"current_steps": 5326, "total_steps": 9134, "loss": 0.8133, "learning_rate": 1.8547521202090178e-05, "epoch": 0.5830482498152659, "percentage": 58.31, "elapsed_time": "4 days, 2:00:58", "remaining_time": "2 days, 22:04:47", "throughput": 2724.64, "total_tokens": 961409792} {"current_steps": 5327, "total_steps": 9134, "loss": 0.7706, "learning_rate": 1.8539214296377545e-05, "epoch": 0.5831577218862037, "percentage": 58.32, "elapsed_time": "4 days, 2:02:00", "remaining_time": "2 days, 22:03:38", "throughput": 2724.62, "total_tokens": 961573760} {"current_steps": 5328, "total_steps": 9134, "loss": 0.702, "learning_rate": 1.853090815496351e-05, "epoch": 0.5832671939571417, "percentage": 58.33, "elapsed_time": "4 days, 2:03:07", "remaining_time": "2 days, 22:02:33", "throughput": 2724.64, "total_tokens": 961764384} {"current_steps": 5329, "total_steps": 9134, "loss": 0.9349, "learning_rate": 1.8522602778830688e-05, "epoch": 0.5833766660280796, "percentage": 58.34, "elapsed_time": "4 days, 2:04:13", "remaining_time": "2 days, 22:01:26", "throughput": 2724.66, "total_tokens": 961950080} {"current_steps": 5330, "total_steps": 9134, "loss": 0.6777, "learning_rate": 1.851429816896156e-05, "epoch": 0.5834861380990175, "percentage": 58.35, "elapsed_time": "4 days, 2:05:20", "remaining_time": "2 days, 22:00:20", "throughput": 2724.68, "total_tokens": 962140256} {"current_steps": 5331, "total_steps": 9134, "loss": 0.6275, "learning_rate": 1.850599432633857e-05, "epoch": 0.5835956101699554, "percentage": 58.36, "elapsed_time": "4 days, 2:06:29", "remaining_time": "2 days, 21:59:16", "throughput": 2724.66, "total_tokens": 962322368} {"current_steps": 5332, "total_steps": 9134, "loss": 0.6795, "learning_rate": 1.8497691251944027e-05, "epoch": 0.5837050822408933, "percentage": 58.38, "elapsed_time": "4 days, 2:07:35", "remaining_time": "2 days, 21:58:10", "throughput": 2724.7, "total_tokens": 962516576} {"current_steps": 5333, "total_steps": 9134, "loss": 0.7046, "learning_rate": 1.848938894676019e-05, "epoch": 0.5838145543118312, "percentage": 58.39, "elapsed_time": "4 days, 2:08:40", "remaining_time": "2 days, 21:57:03", "throughput": 2724.73, "total_tokens": 962704288} {"current_steps": 5334, "total_steps": 9134, "loss": 0.5481, "learning_rate": 1.8481087411769187e-05, "epoch": 0.5839240263827691, "percentage": 58.4, "elapsed_time": "4 days, 2:09:45", "remaining_time": "2 days, 21:55:55", "throughput": 2724.73, "total_tokens": 962881248} {"current_steps": 5335, "total_steps": 9134, "loss": 0.6449, "learning_rate": 1.8472786647953078e-05, "epoch": 0.584033498453707, "percentage": 58.41, "elapsed_time": "4 days, 2:10:48", "remaining_time": "2 days, 21:54:46", "throughput": 2724.68, "total_tokens": 963031552} {"current_steps": 5336, "total_steps": 9134, "loss": 1.0847, "learning_rate": 1.8464486656293834e-05, "epoch": 0.5841429705246449, "percentage": 58.42, "elapsed_time": "4 days, 2:11:51", "remaining_time": "2 days, 21:53:38", "throughput": 2724.69, "total_tokens": 963210528} {"current_steps": 5337, "total_steps": 9134, "loss": 0.6754, "learning_rate": 1.845618743777332e-05, "epoch": 0.5842524425955828, "percentage": 58.43, "elapsed_time": "4 days, 2:12:54", "remaining_time": "2 days, 21:52:30", "throughput": 2724.65, "total_tokens": 963368672} {"current_steps": 5338, "total_steps": 9134, "loss": 0.8798, "learning_rate": 1.8447888993373336e-05, "epoch": 0.5843619146665207, "percentage": 58.44, "elapsed_time": "4 days, 2:14:02", "remaining_time": "2 days, 21:51:24", "throughput": 2724.72, "total_tokens": 963577440} {"current_steps": 5339, "total_steps": 9134, "loss": 0.6739, "learning_rate": 1.8439591324075545e-05, "epoch": 0.5844713867374586, "percentage": 58.45, "elapsed_time": "4 days, 2:15:09", "remaining_time": "2 days, 21:50:19", "throughput": 2724.75, "total_tokens": 963768064} {"current_steps": 5340, "total_steps": 9134, "loss": 0.6251, "learning_rate": 1.8431294430861572e-05, "epoch": 0.5845808588083965, "percentage": 58.46, "elapsed_time": "4 days, 2:16:16", "remaining_time": "2 days, 21:49:13", "throughput": 2724.69, "total_tokens": 963930464} {"current_steps": 5341, "total_steps": 9134, "loss": 0.8172, "learning_rate": 1.8422998314712897e-05, "epoch": 0.5846903308793344, "percentage": 58.47, "elapsed_time": "4 days, 2:17:23", "remaining_time": "2 days, 21:48:07", "throughput": 2724.69, "total_tokens": 964114816} {"current_steps": 5342, "total_steps": 9134, "loss": 0.885, "learning_rate": 1.841470297661095e-05, "epoch": 0.5847998029502723, "percentage": 58.48, "elapsed_time": "4 days, 2:18:31", "remaining_time": "2 days, 21:47:02", "throughput": 2724.74, "total_tokens": 964317984} {"current_steps": 5343, "total_steps": 9134, "loss": 0.9545, "learning_rate": 1.8406408417537064e-05, "epoch": 0.5849092750212103, "percentage": 58.5, "elapsed_time": "4 days, 2:19:41", "remaining_time": "2 days, 21:45:59", "throughput": 2724.82, "total_tokens": 964534816} {"current_steps": 5344, "total_steps": 9134, "loss": 0.5781, "learning_rate": 1.8398114638472444e-05, "epoch": 0.5850187470921481, "percentage": 58.51, "elapsed_time": "4 days, 2:20:43", "remaining_time": "2 days, 21:44:49", "throughput": 2724.79, "total_tokens": 964693632} {"current_steps": 5345, "total_steps": 9134, "loss": 0.9383, "learning_rate": 1.8389821640398245e-05, "epoch": 0.585128219163086, "percentage": 58.52, "elapsed_time": "4 days, 2:21:51", "remaining_time": "2 days, 21:43:45", "throughput": 2724.8, "total_tokens": 964883808} {"current_steps": 5346, "total_steps": 9134, "loss": 0.7277, "learning_rate": 1.8381529424295516e-05, "epoch": 0.5852376912340239, "percentage": 58.53, "elapsed_time": "4 days, 2:22:56", "remaining_time": "2 days, 21:42:37", "throughput": 2724.78, "total_tokens": 965054048} {"current_steps": 5347, "total_steps": 9134, "loss": 0.8436, "learning_rate": 1.8373237991145202e-05, "epoch": 0.5853471633049618, "percentage": 58.54, "elapsed_time": "4 days, 2:24:01", "remaining_time": "2 days, 21:41:30", "throughput": 2724.78, "total_tokens": 965228768} {"current_steps": 5348, "total_steps": 9134, "loss": 0.8186, "learning_rate": 1.8364947341928156e-05, "epoch": 0.5854566353758998, "percentage": 58.55, "elapsed_time": "4 days, 2:25:06", "remaining_time": "2 days, 21:40:23", "throughput": 2724.76, "total_tokens": 965400576} {"current_steps": 5349, "total_steps": 9134, "loss": 0.7624, "learning_rate": 1.8356657477625157e-05, "epoch": 0.5855661074468377, "percentage": 58.56, "elapsed_time": "4 days, 2:26:11", "remaining_time": "2 days, 21:39:16", "throughput": 2724.74, "total_tokens": 965569024} {"current_steps": 5350, "total_steps": 9134, "loss": 0.9171, "learning_rate": 1.8348368399216892e-05, "epoch": 0.5856755795177755, "percentage": 58.57, "elapsed_time": "4 days, 2:27:17", "remaining_time": "2 days, 21:38:09", "throughput": 2724.78, "total_tokens": 965762560} {"current_steps": 5351, "total_steps": 9134, "loss": 0.7223, "learning_rate": 1.8340080107683915e-05, "epoch": 0.5857850515887134, "percentage": 58.58, "elapsed_time": "4 days, 2:28:22", "remaining_time": "2 days, 21:37:02", "throughput": 2724.79, "total_tokens": 965944000} {"current_steps": 5352, "total_steps": 9134, "loss": 0.6672, "learning_rate": 1.833179260400674e-05, "epoch": 0.5858945236596513, "percentage": 58.59, "elapsed_time": "4 days, 2:29:28", "remaining_time": "2 days, 21:35:56", "throughput": 2724.75, "total_tokens": 966109984} {"current_steps": 5353, "total_steps": 9134, "loss": 0.8184, "learning_rate": 1.8323505889165747e-05, "epoch": 0.5860039957305893, "percentage": 58.61, "elapsed_time": "4 days, 2:30:31", "remaining_time": "2 days, 21:34:47", "throughput": 2724.73, "total_tokens": 966275072} {"current_steps": 5354, "total_steps": 9134, "loss": 0.7877, "learning_rate": 1.831521996414125e-05, "epoch": 0.5861134678015272, "percentage": 58.62, "elapsed_time": "4 days, 2:31:34", "remaining_time": "2 days, 21:33:39", "throughput": 2724.71, "total_tokens": 966441056} {"current_steps": 5355, "total_steps": 9134, "loss": 0.6966, "learning_rate": 1.8306934829913448e-05, "epoch": 0.586222939872465, "percentage": 58.63, "elapsed_time": "4 days, 2:32:41", "remaining_time": "2 days, 21:32:33", "throughput": 2724.69, "total_tokens": 966613312} {"current_steps": 5356, "total_steps": 9134, "loss": 0.7099, "learning_rate": 1.8298650487462455e-05, "epoch": 0.5863324119434029, "percentage": 58.64, "elapsed_time": "4 days, 2:33:50", "remaining_time": "2 days, 21:31:29", "throughput": 2724.77, "total_tokens": 966833504} {"current_steps": 5357, "total_steps": 9134, "loss": 1.0304, "learning_rate": 1.8290366937768306e-05, "epoch": 0.5864418840143408, "percentage": 58.65, "elapsed_time": "4 days, 2:34:59", "remaining_time": "2 days, 21:30:25", "throughput": 2724.84, "total_tokens": 967043392} {"current_steps": 5358, "total_steps": 9134, "loss": 0.8782, "learning_rate": 1.8282084181810915e-05, "epoch": 0.5865513560852788, "percentage": 58.66, "elapsed_time": "4 days, 2:36:08", "remaining_time": "2 days, 21:29:21", "throughput": 2724.91, "total_tokens": 967259104} {"current_steps": 5359, "total_steps": 9134, "loss": 0.6825, "learning_rate": 1.827380222057013e-05, "epoch": 0.5866608281562167, "percentage": 58.67, "elapsed_time": "4 days, 2:37:16", "remaining_time": "2 days, 21:28:15", "throughput": 2724.96, "total_tokens": 967461600} {"current_steps": 5360, "total_steps": 9134, "loss": 0.5396, "learning_rate": 1.8265521055025677e-05, "epoch": 0.5867703002271546, "percentage": 58.68, "elapsed_time": "4 days, 2:38:24", "remaining_time": "2 days, 21:27:10", "throughput": 2724.96, "total_tokens": 967644832} {"current_steps": 5361, "total_steps": 9134, "loss": 0.9616, "learning_rate": 1.825724068615721e-05, "epoch": 0.5868797722980924, "percentage": 58.69, "elapsed_time": "4 days, 2:39:31", "remaining_time": "2 days, 21:26:05", "throughput": 2724.99, "total_tokens": 967839264} {"current_steps": 5362, "total_steps": 9134, "loss": 0.6433, "learning_rate": 1.824896111494429e-05, "epoch": 0.5869892443690303, "percentage": 58.7, "elapsed_time": "4 days, 2:40:34", "remaining_time": "2 days, 21:24:56", "throughput": 2724.95, "total_tokens": 967995616} {"current_steps": 5363, "total_steps": 9134, "loss": 0.7917, "learning_rate": 1.8240682342366354e-05, "epoch": 0.5870987164399682, "percentage": 58.71, "elapsed_time": "4 days, 2:41:44", "remaining_time": "2 days, 21:23:52", "throughput": 2724.92, "total_tokens": 968177056} {"current_steps": 5364, "total_steps": 9134, "loss": 0.6896, "learning_rate": 1.8232404369402784e-05, "epoch": 0.5872081885109062, "percentage": 58.73, "elapsed_time": "4 days, 2:42:47", "remaining_time": "2 days, 21:22:44", "throughput": 2724.85, "total_tokens": 968325344} {"current_steps": 5365, "total_steps": 9134, "loss": 0.84, "learning_rate": 1.822412719703283e-05, "epoch": 0.5873176605818441, "percentage": 58.74, "elapsed_time": "4 days, 2:43:55", "remaining_time": "2 days, 21:21:39", "throughput": 2724.85, "total_tokens": 968509248} {"current_steps": 5366, "total_steps": 9134, "loss": 0.7646, "learning_rate": 1.8215850826235682e-05, "epoch": 0.587427132652782, "percentage": 58.75, "elapsed_time": "4 days, 2:45:02", "remaining_time": "2 days, 21:20:33", "throughput": 2724.94, "total_tokens": 968724288} {"current_steps": 5367, "total_steps": 9134, "loss": 0.8142, "learning_rate": 1.820757525799041e-05, "epoch": 0.5875366047237198, "percentage": 58.76, "elapsed_time": "4 days, 2:46:11", "remaining_time": "2 days, 21:19:29", "throughput": 2724.93, "total_tokens": 968907968} {"current_steps": 5368, "total_steps": 9134, "loss": 0.8325, "learning_rate": 1.8199300493275993e-05, "epoch": 0.5876460767946577, "percentage": 58.77, "elapsed_time": "4 days, 2:47:18", "remaining_time": "2 days, 21:18:23", "throughput": 2724.97, "total_tokens": 969105088} {"current_steps": 5369, "total_steps": 9134, "loss": 0.8287, "learning_rate": 1.8191026533071336e-05, "epoch": 0.5877555488655957, "percentage": 58.78, "elapsed_time": "4 days, 2:48:28", "remaining_time": "2 days, 21:17:19", "throughput": 2724.97, "total_tokens": 969294592} {"current_steps": 5370, "total_steps": 9134, "loss": 0.884, "learning_rate": 1.8182753378355218e-05, "epoch": 0.5878650209365336, "percentage": 58.79, "elapsed_time": "4 days, 2:49:28", "remaining_time": "2 days, 21:16:09", "throughput": 2724.93, "total_tokens": 969442880} {"current_steps": 5371, "total_steps": 9134, "loss": 1.0454, "learning_rate": 1.817448103010635e-05, "epoch": 0.5879744930074715, "percentage": 58.8, "elapsed_time": "4 days, 2:50:35", "remaining_time": "2 days, 21:15:03", "throughput": 2724.91, "total_tokens": 969619392} {"current_steps": 5372, "total_steps": 9134, "loss": 0.9974, "learning_rate": 1.816620948930332e-05, "epoch": 0.5880839650784093, "percentage": 58.81, "elapsed_time": "4 days, 2:51:45", "remaining_time": "2 days, 21:13:59", "throughput": 2724.91, "total_tokens": 969809568} {"current_steps": 5373, "total_steps": 9134, "loss": 0.7218, "learning_rate": 1.8157938756924656e-05, "epoch": 0.5881934371493472, "percentage": 58.82, "elapsed_time": "4 days, 2:52:51", "remaining_time": "2 days, 21:12:53", "throughput": 2724.88, "total_tokens": 969978912} {"current_steps": 5374, "total_steps": 9134, "loss": 0.8229, "learning_rate": 1.8149668833948747e-05, "epoch": 0.5883029092202852, "percentage": 58.84, "elapsed_time": "4 days, 2:53:57", "remaining_time": "2 days, 21:11:47", "throughput": 2724.91, "total_tokens": 970169760} {"current_steps": 5375, "total_steps": 9134, "loss": 0.9436, "learning_rate": 1.8141399721353915e-05, "epoch": 0.5884123812912231, "percentage": 58.85, "elapsed_time": "4 days, 2:55:07", "remaining_time": "2 days, 21:10:43", "throughput": 2724.91, "total_tokens": 970359040} {"current_steps": 5376, "total_steps": 9134, "loss": 0.7799, "learning_rate": 1.81331314201184e-05, "epoch": 0.588521853362161, "percentage": 58.86, "elapsed_time": "4 days, 2:56:15", "remaining_time": "2 days, 21:09:38", "throughput": 2724.96, "total_tokens": 970564448} {"current_steps": 5377, "total_steps": 9134, "loss": 0.7778, "learning_rate": 1.8124863931220293e-05, "epoch": 0.5886313254330989, "percentage": 58.87, "elapsed_time": "4 days, 2:57:23", "remaining_time": "2 days, 21:08:33", "throughput": 2724.96, "total_tokens": 970747232} {"current_steps": 5378, "total_steps": 9134, "loss": 0.7139, "learning_rate": 1.811659725563765e-05, "epoch": 0.5887407975040367, "percentage": 58.88, "elapsed_time": "4 days, 2:58:29", "remaining_time": "2 days, 21:07:27", "throughput": 2724.95, "total_tokens": 970927552} {"current_steps": 5379, "total_steps": 9134, "loss": 0.7163, "learning_rate": 1.8108331394348388e-05, "epoch": 0.5888502695749747, "percentage": 58.89, "elapsed_time": "4 days, 2:59:39", "remaining_time": "2 days, 21:06:22", "throughput": 2724.98, "total_tokens": 971126464} {"current_steps": 5380, "total_steps": 9134, "loss": 0.8249, "learning_rate": 1.8100066348330356e-05, "epoch": 0.5889597416459126, "percentage": 58.9, "elapsed_time": "4 days, 3:00:47", "remaining_time": "2 days, 21:05:18", "throughput": 2724.94, "total_tokens": 971299840} {"current_steps": 5381, "total_steps": 9134, "loss": 0.6595, "learning_rate": 1.8091802118561272e-05, "epoch": 0.5890692137168505, "percentage": 58.91, "elapsed_time": "4 days, 3:01:53", "remaining_time": "2 days, 21:04:12", "throughput": 2724.99, "total_tokens": 971497632} {"current_steps": 5382, "total_steps": 9134, "loss": 0.7831, "learning_rate": 1.80835387060188e-05, "epoch": 0.5891786857877884, "percentage": 58.92, "elapsed_time": "4 days, 3:03:02", "remaining_time": "2 days, 21:03:07", "throughput": 2725.03, "total_tokens": 971697664} {"current_steps": 5383, "total_steps": 9134, "loss": 0.8302, "learning_rate": 1.8075276111680478e-05, "epoch": 0.5892881578587263, "percentage": 58.93, "elapsed_time": "4 days, 3:04:11", "remaining_time": "2 days, 21:02:02", "throughput": 2725.03, "total_tokens": 971884928} {"current_steps": 5384, "total_steps": 9134, "loss": 0.7442, "learning_rate": 1.806701433652375e-05, "epoch": 0.5893976299296642, "percentage": 58.94, "elapsed_time": "4 days, 3:05:18", "remaining_time": "2 days, 21:00:57", "throughput": 2725.04, "total_tokens": 972069728} {"current_steps": 5385, "total_steps": 9134, "loss": 0.673, "learning_rate": 1.805875338152598e-05, "epoch": 0.5895071020006021, "percentage": 58.96, "elapsed_time": "4 days, 3:06:24", "remaining_time": "2 days, 20:59:51", "throughput": 2725.1, "total_tokens": 972274688} {"current_steps": 5386, "total_steps": 9134, "loss": 0.8682, "learning_rate": 1.8050493247664404e-05, "epoch": 0.58961657407154, "percentage": 58.97, "elapsed_time": "4 days, 3:07:32", "remaining_time": "2 days, 20:58:46", "throughput": 2725.09, "total_tokens": 972455456} {"current_steps": 5387, "total_steps": 9134, "loss": 1.0582, "learning_rate": 1.80422339359162e-05, "epoch": 0.5897260461424779, "percentage": 58.98, "elapsed_time": "4 days, 3:08:42", "remaining_time": "2 days, 20:57:41", "throughput": 2725.06, "total_tokens": 972633760} {"current_steps": 5388, "total_steps": 9134, "loss": 0.77, "learning_rate": 1.8033975447258416e-05, "epoch": 0.5898355182134158, "percentage": 58.99, "elapsed_time": "4 days, 3:09:41", "remaining_time": "2 days, 20:56:31", "throughput": 2725.0, "total_tokens": 972775104} {"current_steps": 5389, "total_steps": 9134, "loss": 0.5463, "learning_rate": 1.802571778266802e-05, "epoch": 0.5899449902843537, "percentage": 59.0, "elapsed_time": "4 days, 3:10:45", "remaining_time": "2 days, 20:55:23", "throughput": 2724.95, "total_tokens": 972933472} {"current_steps": 5390, "total_steps": 9134, "loss": 0.7448, "learning_rate": 1.8017460943121878e-05, "epoch": 0.5900544623552916, "percentage": 59.01, "elapsed_time": "4 days, 3:11:54", "remaining_time": "2 days, 20:54:18", "throughput": 2724.98, "total_tokens": 973131488} {"current_steps": 5391, "total_steps": 9134, "loss": 0.6134, "learning_rate": 1.8009204929596757e-05, "epoch": 0.5901639344262295, "percentage": 59.02, "elapsed_time": "4 days, 3:13:01", "remaining_time": "2 days, 20:53:12", "throughput": 2724.95, "total_tokens": 973299712} {"current_steps": 5392, "total_steps": 9134, "loss": 0.8962, "learning_rate": 1.8000949743069336e-05, "epoch": 0.5902734064971674, "percentage": 59.03, "elapsed_time": "4 days, 3:14:07", "remaining_time": "2 days, 20:52:06", "throughput": 2725.0, "total_tokens": 973499072} {"current_steps": 5393, "total_steps": 9134, "loss": 0.713, "learning_rate": 1.7992695384516174e-05, "epoch": 0.5903828785681053, "percentage": 59.04, "elapsed_time": "4 days, 3:15:11", "remaining_time": "2 days, 20:50:58", "throughput": 2724.95, "total_tokens": 973654304} {"current_steps": 5394, "total_steps": 9134, "loss": 0.9427, "learning_rate": 1.7984441854913758e-05, "epoch": 0.5904923506390433, "percentage": 59.05, "elapsed_time": "4 days, 3:16:17", "remaining_time": "2 days, 20:49:52", "throughput": 2724.89, "total_tokens": 973814016} {"current_steps": 5395, "total_steps": 9134, "loss": 0.6623, "learning_rate": 1.7976189155238448e-05, "epoch": 0.5906018227099811, "percentage": 59.07, "elapsed_time": "4 days, 3:17:22", "remaining_time": "2 days, 20:48:44", "throughput": 2724.9, "total_tokens": 973995008} {"current_steps": 5396, "total_steps": 9134, "loss": 0.9194, "learning_rate": 1.796793728646654e-05, "epoch": 0.590711294780919, "percentage": 59.08, "elapsed_time": "4 days, 3:18:30", "remaining_time": "2 days, 20:47:40", "throughput": 2724.93, "total_tokens": 974191904} {"current_steps": 5397, "total_steps": 9134, "loss": 0.8079, "learning_rate": 1.7959686249574214e-05, "epoch": 0.5908207668518569, "percentage": 59.09, "elapsed_time": "4 days, 3:19:40", "remaining_time": "2 days, 20:46:36", "throughput": 2724.99, "total_tokens": 974402688} {"current_steps": 5398, "total_steps": 9134, "loss": 0.5146, "learning_rate": 1.7951436045537536e-05, "epoch": 0.5909302389227948, "percentage": 59.1, "elapsed_time": "4 days, 3:20:43", "remaining_time": "2 days, 20:45:28", "throughput": 2724.95, "total_tokens": 974560160} {"current_steps": 5399, "total_steps": 9134, "loss": 0.9154, "learning_rate": 1.7943186675332504e-05, "epoch": 0.5910397109937328, "percentage": 59.11, "elapsed_time": "4 days, 3:21:50", "remaining_time": "2 days, 20:44:22", "throughput": 2724.94, "total_tokens": 974739360} {"current_steps": 5400, "total_steps": 9134, "loss": 0.7965, "learning_rate": 1.7934938139934993e-05, "epoch": 0.5911491830646707, "percentage": 59.12, "elapsed_time": "4 days, 3:22:50", "remaining_time": "2 days, 20:43:11", "throughput": 2724.85, "total_tokens": 974869504} {"current_steps": 5401, "total_steps": 9134, "loss": 0.6232, "learning_rate": 1.7926690440320803e-05, "epoch": 0.5912586551356085, "percentage": 59.13, "elapsed_time": "4 days, 3:23:56", "remaining_time": "2 days, 20:42:05", "throughput": 2724.82, "total_tokens": 975040640} {"current_steps": 5402, "total_steps": 9134, "loss": 0.7882, "learning_rate": 1.7918443577465605e-05, "epoch": 0.5913681272065464, "percentage": 59.14, "elapsed_time": "4 days, 3:25:00", "remaining_time": "2 days, 20:40:57", "throughput": 2724.82, "total_tokens": 975214464} {"current_steps": 5403, "total_steps": 9134, "loss": 0.8397, "learning_rate": 1.7910197552344993e-05, "epoch": 0.5914775992774843, "percentage": 59.15, "elapsed_time": "4 days, 3:26:06", "remaining_time": "2 days, 20:39:51", "throughput": 2724.83, "total_tokens": 975398368} {"current_steps": 5404, "total_steps": 9134, "loss": 0.854, "learning_rate": 1.7901952365934467e-05, "epoch": 0.5915870713484223, "percentage": 59.16, "elapsed_time": "4 days, 3:27:12", "remaining_time": "2 days, 20:38:44", "throughput": 2724.86, "total_tokens": 975589216} {"current_steps": 5405, "total_steps": 9134, "loss": 0.7249, "learning_rate": 1.78937080192094e-05, "epoch": 0.5916965434193602, "percentage": 59.17, "elapsed_time": "4 days, 3:28:15", "remaining_time": "2 days, 20:37:36", "throughput": 2724.75, "total_tokens": 975723168} {"current_steps": 5406, "total_steps": 9134, "loss": 0.8784, "learning_rate": 1.7885464513145094e-05, "epoch": 0.591806015490298, "percentage": 59.19, "elapsed_time": "4 days, 3:29:20", "remaining_time": "2 days, 20:36:28", "throughput": 2724.72, "total_tokens": 975884896} {"current_steps": 5407, "total_steps": 9134, "loss": 0.7616, "learning_rate": 1.7877221848716726e-05, "epoch": 0.5919154875612359, "percentage": 59.2, "elapsed_time": "4 days, 3:30:28", "remaining_time": "2 days, 20:35:24", "throughput": 2724.78, "total_tokens": 976095232} {"current_steps": 5408, "total_steps": 9134, "loss": 0.8733, "learning_rate": 1.7868980026899405e-05, "epoch": 0.5920249596321738, "percentage": 59.21, "elapsed_time": "4 days, 3:31:31", "remaining_time": "2 days, 20:34:15", "throughput": 2724.75, "total_tokens": 976256512} {"current_steps": 5409, "total_steps": 9134, "loss": 0.7395, "learning_rate": 1.786073904866811e-05, "epoch": 0.5921344317031118, "percentage": 59.22, "elapsed_time": "4 days, 3:32:39", "remaining_time": "2 days, 20:33:10", "throughput": 2724.77, "total_tokens": 976448480} {"current_steps": 5410, "total_steps": 9134, "loss": 0.9165, "learning_rate": 1.785249891499774e-05, "epoch": 0.5922439037740497, "percentage": 59.23, "elapsed_time": "4 days, 3:33:48", "remaining_time": "2 days, 20:32:06", "throughput": 2724.78, "total_tokens": 976637536} {"current_steps": 5411, "total_steps": 9134, "loss": 0.7528, "learning_rate": 1.7844259626863083e-05, "epoch": 0.5923533758449876, "percentage": 59.24, "elapsed_time": "4 days, 3:34:58", "remaining_time": "2 days, 20:31:02", "throughput": 2724.79, "total_tokens": 976831744} {"current_steps": 5412, "total_steps": 9134, "loss": 0.8915, "learning_rate": 1.783602118523883e-05, "epoch": 0.5924628479159254, "percentage": 59.25, "elapsed_time": "4 days, 3:36:05", "remaining_time": "2 days, 20:29:56", "throughput": 2724.77, "total_tokens": 977008928} {"current_steps": 5413, "total_steps": 9134, "loss": 0.6286, "learning_rate": 1.7827783591099583e-05, "epoch": 0.5925723199868633, "percentage": 59.26, "elapsed_time": "4 days, 3:37:12", "remaining_time": "2 days, 20:28:50", "throughput": 2724.76, "total_tokens": 977186784} {"current_steps": 5414, "total_steps": 9134, "loss": 0.6468, "learning_rate": 1.781954684541982e-05, "epoch": 0.5926817920578012, "percentage": 59.27, "elapsed_time": "4 days, 3:38:21", "remaining_time": "2 days, 20:27:46", "throughput": 2724.8, "total_tokens": 977389952} {"current_steps": 5415, "total_steps": 9134, "loss": 0.8473, "learning_rate": 1.7811310949173947e-05, "epoch": 0.5927912641287392, "percentage": 59.28, "elapsed_time": "4 days, 3:39:29", "remaining_time": "2 days, 20:26:41", "throughput": 2724.79, "total_tokens": 977569824} {"current_steps": 5416, "total_steps": 9134, "loss": 0.8091, "learning_rate": 1.7803075903336238e-05, "epoch": 0.5929007361996771, "percentage": 59.29, "elapsed_time": "4 days, 3:40:35", "remaining_time": "2 days, 20:25:35", "throughput": 2724.75, "total_tokens": 977736928} {"current_steps": 5417, "total_steps": 9134, "loss": 0.8207, "learning_rate": 1.7794841708880888e-05, "epoch": 0.593010208270615, "percentage": 59.31, "elapsed_time": "4 days, 3:41:44", "remaining_time": "2 days, 20:24:30", "throughput": 2724.84, "total_tokens": 977954432} {"current_steps": 5418, "total_steps": 9134, "loss": 0.9478, "learning_rate": 1.7786608366782002e-05, "epoch": 0.5931196803415528, "percentage": 59.32, "elapsed_time": "4 days, 3:42:52", "remaining_time": "2 days, 20:23:25", "throughput": 2724.92, "total_tokens": 978171040} {"current_steps": 5419, "total_steps": 9134, "loss": 0.6887, "learning_rate": 1.7778375878013547e-05, "epoch": 0.5932291524124907, "percentage": 59.33, "elapsed_time": "4 days, 3:43:59", "remaining_time": "2 days, 20:22:19", "throughput": 2724.91, "total_tokens": 978349120} {"current_steps": 5420, "total_steps": 9134, "loss": 0.5265, "learning_rate": 1.7770144243549425e-05, "epoch": 0.5933386244834287, "percentage": 59.34, "elapsed_time": "4 days, 3:45:09", "remaining_time": "2 days, 20:21:16", "throughput": 2724.92, "total_tokens": 978545568} {"current_steps": 5421, "total_steps": 9134, "loss": 0.7012, "learning_rate": 1.7761913464363413e-05, "epoch": 0.5934480965543666, "percentage": 59.35, "elapsed_time": "4 days, 3:46:16", "remaining_time": "2 days, 20:20:10", "throughput": 2724.93, "total_tokens": 978732384} {"current_steps": 5422, "total_steps": 9134, "loss": 0.8515, "learning_rate": 1.7753683541429212e-05, "epoch": 0.5935575686253045, "percentage": 59.36, "elapsed_time": "4 days, 3:47:22", "remaining_time": "2 days, 20:19:03", "throughput": 2724.96, "total_tokens": 978922112} {"current_steps": 5423, "total_steps": 9134, "loss": 0.6774, "learning_rate": 1.7745454475720387e-05, "epoch": 0.5936670406962423, "percentage": 59.37, "elapsed_time": "4 days, 3:48:30", "remaining_time": "2 days, 20:17:58", "throughput": 2724.96, "total_tokens": 979108256} {"current_steps": 5424, "total_steps": 9134, "loss": 0.6143, "learning_rate": 1.7737226268210423e-05, "epoch": 0.5937765127671802, "percentage": 59.38, "elapsed_time": "4 days, 3:49:36", "remaining_time": "2 days, 20:16:52", "throughput": 2724.96, "total_tokens": 979285888} {"current_steps": 5425, "total_steps": 9134, "loss": 0.9674, "learning_rate": 1.7728998919872723e-05, "epoch": 0.5938859848381182, "percentage": 59.39, "elapsed_time": "4 days, 3:50:42", "remaining_time": "2 days, 20:15:46", "throughput": 2725.01, "total_tokens": 979485248} {"current_steps": 5426, "total_steps": 9134, "loss": 0.8077, "learning_rate": 1.7720772431680538e-05, "epoch": 0.5939954569090561, "percentage": 59.4, "elapsed_time": "4 days, 3:51:48", "remaining_time": "2 days, 20:14:39", "throughput": 2724.99, "total_tokens": 979658176} {"current_steps": 5427, "total_steps": 9134, "loss": 0.6688, "learning_rate": 1.771254680460707e-05, "epoch": 0.594104928979994, "percentage": 59.42, "elapsed_time": "4 days, 3:52:56", "remaining_time": "2 days, 20:13:34", "throughput": 2725.03, "total_tokens": 979855520} {"current_steps": 5428, "total_steps": 9134, "loss": 0.8152, "learning_rate": 1.770432203962537e-05, "epoch": 0.5942144010509319, "percentage": 59.43, "elapsed_time": "4 days, 3:54:01", "remaining_time": "2 days, 20:12:27", "throughput": 2725.02, "total_tokens": 980028672} {"current_steps": 5429, "total_steps": 9134, "loss": 0.91, "learning_rate": 1.7696098137708434e-05, "epoch": 0.5943238731218697, "percentage": 59.44, "elapsed_time": "4 days, 3:55:10", "remaining_time": "2 days, 20:11:22", "throughput": 2725.09, "total_tokens": 980241024} {"current_steps": 5430, "total_steps": 9134, "loss": 0.6866, "learning_rate": 1.7687875099829127e-05, "epoch": 0.5944333451928077, "percentage": 59.45, "elapsed_time": "4 days, 3:56:16", "remaining_time": "2 days, 20:10:16", "throughput": 2725.07, "total_tokens": 980414624} {"current_steps": 5431, "total_steps": 9134, "loss": 0.6133, "learning_rate": 1.767965292696021e-05, "epoch": 0.5945428172637456, "percentage": 59.46, "elapsed_time": "4 days, 3:57:22", "remaining_time": "2 days, 20:09:09", "throughput": 2725.09, "total_tokens": 980602784} {"current_steps": 5432, "total_steps": 9134, "loss": 0.789, "learning_rate": 1.7671431620074365e-05, "epoch": 0.5946522893346835, "percentage": 59.47, "elapsed_time": "4 days, 3:58:28", "remaining_time": "2 days, 20:08:03", "throughput": 2725.01, "total_tokens": 980753984} {"current_steps": 5433, "total_steps": 9134, "loss": 1.0414, "learning_rate": 1.7663211180144146e-05, "epoch": 0.5947617614056214, "percentage": 59.48, "elapsed_time": "4 days, 3:59:34", "remaining_time": "2 days, 20:06:56", "throughput": 2725.0, "total_tokens": 980930048} {"current_steps": 5434, "total_steps": 9134, "loss": 0.7856, "learning_rate": 1.7654991608142024e-05, "epoch": 0.5948712334765593, "percentage": 59.49, "elapsed_time": "4 days, 4:00:39", "remaining_time": "2 days, 20:05:50", "throughput": 2724.97, "total_tokens": 981098496} {"current_steps": 5435, "total_steps": 9134, "loss": 0.825, "learning_rate": 1.7646772905040347e-05, "epoch": 0.5949807055474972, "percentage": 59.5, "elapsed_time": "4 days, 4:01:46", "remaining_time": "2 days, 20:04:44", "throughput": 2724.97, "total_tokens": 981279264} {"current_steps": 5436, "total_steps": 9134, "loss": 0.8719, "learning_rate": 1.7638555071811373e-05, "epoch": 0.5950901776184351, "percentage": 59.51, "elapsed_time": "4 days, 4:02:51", "remaining_time": "2 days, 20:03:37", "throughput": 2724.95, "total_tokens": 981448384} {"current_steps": 5437, "total_steps": 9134, "loss": 0.6106, "learning_rate": 1.763033810942728e-05, "epoch": 0.595199649689373, "percentage": 59.52, "elapsed_time": "4 days, 4:03:55", "remaining_time": "2 days, 20:02:29", "throughput": 2724.95, "total_tokens": 981624672} {"current_steps": 5438, "total_steps": 9134, "loss": 0.7378, "learning_rate": 1.7622122018860082e-05, "epoch": 0.5953091217603109, "percentage": 59.54, "elapsed_time": "4 days, 4:04:57", "remaining_time": "2 days, 20:01:20", "throughput": 2724.91, "total_tokens": 981779008} {"current_steps": 5439, "total_steps": 9134, "loss": 0.6691, "learning_rate": 1.761390680108176e-05, "epoch": 0.5954185938312488, "percentage": 59.55, "elapsed_time": "4 days, 4:06:03", "remaining_time": "2 days, 20:00:13", "throughput": 2724.88, "total_tokens": 981948128} {"current_steps": 5440, "total_steps": 9134, "loss": 0.6119, "learning_rate": 1.7605692457064133e-05, "epoch": 0.5955280659021867, "percentage": 59.56, "elapsed_time": "4 days, 4:07:11", "remaining_time": "2 days, 19:59:08", "throughput": 2724.88, "total_tokens": 982133600} {"current_steps": 5441, "total_steps": 9134, "loss": 0.7315, "learning_rate": 1.7597478987778956e-05, "epoch": 0.5956375379731246, "percentage": 59.57, "elapsed_time": "4 days, 4:08:19", "remaining_time": "2 days, 19:58:03", "throughput": 2724.88, "total_tokens": 982314816} {"current_steps": 5442, "total_steps": 9134, "loss": 0.8267, "learning_rate": 1.758926639419786e-05, "epoch": 0.5957470100440625, "percentage": 59.58, "elapsed_time": "4 days, 4:09:25", "remaining_time": "2 days, 19:56:57", "throughput": 2724.91, "total_tokens": 982511040} {"current_steps": 5443, "total_steps": 9134, "loss": 0.7293, "learning_rate": 1.7581054677292387e-05, "epoch": 0.5958564821150004, "percentage": 59.59, "elapsed_time": "4 days, 4:10:31", "remaining_time": "2 days, 19:55:50", "throughput": 2724.93, "total_tokens": 982694272} {"current_steps": 5444, "total_steps": 9134, "loss": 0.8918, "learning_rate": 1.7572843838033964e-05, "epoch": 0.5959659541859383, "percentage": 59.6, "elapsed_time": "4 days, 4:11:40", "remaining_time": "2 days, 19:54:46", "throughput": 2724.95, "total_tokens": 982891840} {"current_steps": 5445, "total_steps": 9134, "loss": 0.8333, "learning_rate": 1.756463387739391e-05, "epoch": 0.5960754262568763, "percentage": 59.61, "elapsed_time": "4 days, 4:12:48", "remaining_time": "2 days, 19:53:41", "throughput": 2724.94, "total_tokens": 983074176} {"current_steps": 5446, "total_steps": 9134, "loss": 0.6789, "learning_rate": 1.7556424796343462e-05, "epoch": 0.5961848983278141, "percentage": 59.62, "elapsed_time": "4 days, 4:13:57", "remaining_time": "2 days, 19:52:36", "throughput": 2724.86, "total_tokens": 983230976} {"current_steps": 5447, "total_steps": 9134, "loss": 0.8542, "learning_rate": 1.754821659585373e-05, "epoch": 0.596294370398752, "percentage": 59.63, "elapsed_time": "4 days, 4:15:03", "remaining_time": "2 days, 19:51:30", "throughput": 2724.84, "total_tokens": 983404800} {"current_steps": 5448, "total_steps": 9134, "loss": 0.7352, "learning_rate": 1.754000927689573e-05, "epoch": 0.5964038424696899, "percentage": 59.65, "elapsed_time": "4 days, 4:16:13", "remaining_time": "2 days, 19:50:26", "throughput": 2724.88, "total_tokens": 983607296} {"current_steps": 5449, "total_steps": 9134, "loss": 0.5752, "learning_rate": 1.7531802840440364e-05, "epoch": 0.5965133145406278, "percentage": 59.66, "elapsed_time": "4 days, 4:17:19", "remaining_time": "2 days, 19:49:20", "throughput": 2724.9, "total_tokens": 983796352} {"current_steps": 5450, "total_steps": 9134, "loss": 0.8487, "learning_rate": 1.7523597287458447e-05, "epoch": 0.5966227866115658, "percentage": 59.67, "elapsed_time": "4 days, 4:18:25", "remaining_time": "2 days, 19:48:14", "throughput": 2724.84, "total_tokens": 983955616} {"current_steps": 5451, "total_steps": 9134, "loss": 0.7848, "learning_rate": 1.7515392618920686e-05, "epoch": 0.5967322586825037, "percentage": 59.68, "elapsed_time": "4 days, 4:19:29", "remaining_time": "2 days, 19:47:06", "throughput": 2724.84, "total_tokens": 984128768} {"current_steps": 5452, "total_steps": 9134, "loss": 0.751, "learning_rate": 1.750718883579766e-05, "epoch": 0.5968417307534415, "percentage": 59.69, "elapsed_time": "4 days, 4:20:35", "remaining_time": "2 days, 19:45:59", "throughput": 2724.83, "total_tokens": 984304832} {"current_steps": 5453, "total_steps": 9134, "loss": 0.5144, "learning_rate": 1.749898593905988e-05, "epoch": 0.5969512028243794, "percentage": 59.7, "elapsed_time": "4 days, 4:21:41", "remaining_time": "2 days, 19:44:53", "throughput": 2724.84, "total_tokens": 984487616} {"current_steps": 5454, "total_steps": 9134, "loss": 0.6408, "learning_rate": 1.7490783929677714e-05, "epoch": 0.5970606748953173, "percentage": 59.71, "elapsed_time": "4 days, 4:22:46", "remaining_time": "2 days, 19:43:46", "throughput": 2724.82, "total_tokens": 984659424} {"current_steps": 5455, "total_steps": 9134, "loss": 0.6533, "learning_rate": 1.748258280862147e-05, "epoch": 0.5971701469662553, "percentage": 59.72, "elapsed_time": "4 days, 4:23:53", "remaining_time": "2 days, 19:42:40", "throughput": 2724.84, "total_tokens": 984848928} {"current_steps": 5456, "total_steps": 9134, "loss": 0.7597, "learning_rate": 1.7474382576861293e-05, "epoch": 0.5972796190371932, "percentage": 59.73, "elapsed_time": "4 days, 4:24:52", "remaining_time": "2 days, 19:41:29", "throughput": 2724.75, "total_tokens": 984977280} {"current_steps": 5457, "total_steps": 9134, "loss": 0.8465, "learning_rate": 1.7466183235367274e-05, "epoch": 0.597389091108131, "percentage": 59.74, "elapsed_time": "4 days, 4:25:58", "remaining_time": "2 days, 19:40:23", "throughput": 2724.74, "total_tokens": 985152000} {"current_steps": 5458, "total_steps": 9134, "loss": 0.9797, "learning_rate": 1.745798478510938e-05, "epoch": 0.5974985631790689, "percentage": 59.75, "elapsed_time": "4 days, 4:27:03", "remaining_time": "2 days, 19:39:15", "throughput": 2724.76, "total_tokens": 985338592} {"current_steps": 5459, "total_steps": 9134, "loss": 0.9235, "learning_rate": 1.744978722705747e-05, "epoch": 0.5976080352500068, "percentage": 59.77, "elapsed_time": "4 days, 4:28:12", "remaining_time": "2 days, 19:38:11", "throughput": 2724.78, "total_tokens": 985530784} {"current_steps": 5460, "total_steps": 9134, "loss": 0.6718, "learning_rate": 1.74415905621813e-05, "epoch": 0.5977175073209448, "percentage": 59.78, "elapsed_time": "4 days, 4:29:20", "remaining_time": "2 days, 19:37:06", "throughput": 2724.79, "total_tokens": 985720288} {"current_steps": 5461, "total_steps": 9134, "loss": 0.7027, "learning_rate": 1.74333947914505e-05, "epoch": 0.5978269793918827, "percentage": 59.79, "elapsed_time": "4 days, 4:30:23", "remaining_time": "2 days, 19:35:58", "throughput": 2724.8, "total_tokens": 985897920} {"current_steps": 5462, "total_steps": 9134, "loss": 0.7748, "learning_rate": 1.7425199915834646e-05, "epoch": 0.5979364514628206, "percentage": 59.8, "elapsed_time": "4 days, 4:31:27", "remaining_time": "2 days, 19:34:49", "throughput": 2724.81, "total_tokens": 986072416} {"current_steps": 5463, "total_steps": 9134, "loss": 0.7614, "learning_rate": 1.7417005936303155e-05, "epoch": 0.5980459235337584, "percentage": 59.81, "elapsed_time": "4 days, 4:32:36", "remaining_time": "2 days, 19:33:45", "throughput": 2724.86, "total_tokens": 986280064} {"current_steps": 5464, "total_steps": 9134, "loss": 0.5321, "learning_rate": 1.740881285382537e-05, "epoch": 0.5981553956046963, "percentage": 59.82, "elapsed_time": "4 days, 4:33:40", "remaining_time": "2 days, 19:32:37", "throughput": 2724.86, "total_tokens": 986455008} {"current_steps": 5465, "total_steps": 9134, "loss": 0.7024, "learning_rate": 1.7400620669370513e-05, "epoch": 0.5982648676756342, "percentage": 59.83, "elapsed_time": "4 days, 4:34:47", "remaining_time": "2 days, 19:31:32", "throughput": 2724.89, "total_tokens": 986648768} {"current_steps": 5466, "total_steps": 9134, "loss": 0.7324, "learning_rate": 1.7392429383907698e-05, "epoch": 0.5983743397465722, "percentage": 59.84, "elapsed_time": "4 days, 4:35:54", "remaining_time": "2 days, 19:30:26", "throughput": 2724.9, "total_tokens": 986835808} {"current_steps": 5467, "total_steps": 9134, "loss": 0.8376, "learning_rate": 1.7384238998405954e-05, "epoch": 0.5984838118175101, "percentage": 59.85, "elapsed_time": "4 days, 4:37:02", "remaining_time": "2 days, 19:29:21", "throughput": 2724.92, "total_tokens": 987027104} {"current_steps": 5468, "total_steps": 9134, "loss": 0.9533, "learning_rate": 1.7376049513834165e-05, "epoch": 0.598593283888448, "percentage": 59.86, "elapsed_time": "4 days, 4:38:08", "remaining_time": "2 days, 19:28:14", "throughput": 2724.97, "total_tokens": 987226912} {"current_steps": 5469, "total_steps": 9134, "loss": 0.5967, "learning_rate": 1.7367860931161155e-05, "epoch": 0.5987027559593858, "percentage": 59.88, "elapsed_time": "4 days, 4:39:14", "remaining_time": "2 days, 19:27:08", "throughput": 2724.95, "total_tokens": 987399616} {"current_steps": 5470, "total_steps": 9134, "loss": 0.8264, "learning_rate": 1.73596732513556e-05, "epoch": 0.5988122280303237, "percentage": 59.89, "elapsed_time": "4 days, 4:40:19", "remaining_time": "2 days, 19:26:01", "throughput": 2724.95, "total_tokens": 987573664} {"current_steps": 5471, "total_steps": 9134, "loss": 0.6711, "learning_rate": 1.7351486475386088e-05, "epoch": 0.5989217001012617, "percentage": 59.9, "elapsed_time": "4 days, 4:41:27", "remaining_time": "2 days, 19:24:56", "throughput": 2725.04, "total_tokens": 987790720} {"current_steps": 5472, "total_steps": 9134, "loss": 0.8188, "learning_rate": 1.7343300604221118e-05, "epoch": 0.5990311721721996, "percentage": 59.91, "elapsed_time": "4 days, 4:42:32", "remaining_time": "2 days, 19:23:48", "throughput": 2724.99, "total_tokens": 987949984} {"current_steps": 5473, "total_steps": 9134, "loss": 0.7175, "learning_rate": 1.733511563882904e-05, "epoch": 0.5991406442431375, "percentage": 59.92, "elapsed_time": "4 days, 4:43:41", "remaining_time": "2 days, 19:22:44", "throughput": 2725.01, "total_tokens": 988148000} {"current_steps": 5474, "total_steps": 9134, "loss": 0.8653, "learning_rate": 1.732693158017813e-05, "epoch": 0.5992501163140753, "percentage": 59.93, "elapsed_time": "4 days, 4:44:49", "remaining_time": "2 days, 19:21:39", "throughput": 2725.1, "total_tokens": 988364608} {"current_steps": 5475, "total_steps": 9134, "loss": 0.5839, "learning_rate": 1.7318748429236547e-05, "epoch": 0.5993595883850132, "percentage": 59.94, "elapsed_time": "4 days, 4:45:55", "remaining_time": "2 days, 19:20:33", "throughput": 2725.12, "total_tokens": 988550976} {"current_steps": 5476, "total_steps": 9134, "loss": 0.83, "learning_rate": 1.7310566186972345e-05, "epoch": 0.5994690604559512, "percentage": 59.95, "elapsed_time": "4 days, 4:46:58", "remaining_time": "2 days, 19:19:24", "throughput": 2725.07, "total_tokens": 988704416} {"current_steps": 5477, "total_steps": 9134, "loss": 1.0223, "learning_rate": 1.7302384854353455e-05, "epoch": 0.5995785325268891, "percentage": 59.96, "elapsed_time": "4 days, 4:48:05", "remaining_time": "2 days, 19:18:19", "throughput": 2725.02, "total_tokens": 988870848} {"current_steps": 5478, "total_steps": 9134, "loss": 0.7546, "learning_rate": 1.7294204432347723e-05, "epoch": 0.599688004597827, "percentage": 59.97, "elapsed_time": "4 days, 4:49:10", "remaining_time": "2 days, 19:17:12", "throughput": 2725.05, "total_tokens": 989056992} {"current_steps": 5479, "total_steps": 9134, "loss": 0.7647, "learning_rate": 1.7286024921922887e-05, "epoch": 0.5997974766687649, "percentage": 59.98, "elapsed_time": "4 days, 4:50:17", "remaining_time": "2 days, 19:16:06", "throughput": 2725.04, "total_tokens": 989236864} {"current_steps": 5480, "total_steps": 9134, "loss": 0.8436, "learning_rate": 1.7277846324046544e-05, "epoch": 0.5999069487397027, "percentage": 60.0, "elapsed_time": "4 days, 4:51:22", "remaining_time": "2 days, 19:14:59", "throughput": 2725.04, "total_tokens": 989414272} {"current_steps": 5481, "total_steps": 9134, "loss": 1.1026, "learning_rate": 1.7269668639686225e-05, "epoch": 0.6000164208106407, "percentage": 60.01, "elapsed_time": "4 days, 4:52:32", "remaining_time": "2 days, 19:13:55", "throughput": 2725.08, "total_tokens": 989620800} {"current_steps": 5482, "total_steps": 9134, "loss": 1.0973, "learning_rate": 1.7261491869809327e-05, "epoch": 0.6001258928815786, "percentage": 60.02, "elapsed_time": "4 days, 4:53:38", "remaining_time": "2 days, 19:12:49", "throughput": 2725.09, "total_tokens": 989802688} {"current_steps": 5483, "total_steps": 9134, "loss": 0.6267, "learning_rate": 1.7253316015383145e-05, "epoch": 0.6002353649525165, "percentage": 60.03, "elapsed_time": "4 days, 4:54:40", "remaining_time": "2 days, 19:11:40", "throughput": 2725.08, "total_tokens": 989968000} {"current_steps": 5484, "total_steps": 9134, "loss": 0.842, "learning_rate": 1.7245141077374865e-05, "epoch": 0.6003448370234544, "percentage": 60.04, "elapsed_time": "4 days, 4:55:50", "remaining_time": "2 days, 19:10:36", "throughput": 2725.09, "total_tokens": 990164448} {"current_steps": 5485, "total_steps": 9134, "loss": 0.7046, "learning_rate": 1.723696705675158e-05, "epoch": 0.6004543090943923, "percentage": 60.05, "elapsed_time": "4 days, 4:56:59", "remaining_time": "2 days, 19:09:31", "throughput": 2725.04, "total_tokens": 990334464} {"current_steps": 5486, "total_steps": 9134, "loss": 0.7015, "learning_rate": 1.7228793954480246e-05, "epoch": 0.6005637811653302, "percentage": 60.06, "elapsed_time": "4 days, 4:58:01", "remaining_time": "2 days, 19:08:22", "throughput": 2725.0, "total_tokens": 990489696} {"current_steps": 5487, "total_steps": 9134, "loss": 0.7332, "learning_rate": 1.722062177152773e-05, "epoch": 0.6006732532362681, "percentage": 60.07, "elapsed_time": "4 days, 4:59:06", "remaining_time": "2 days, 19:07:15", "throughput": 2725.01, "total_tokens": 990666656} {"current_steps": 5488, "total_steps": 9134, "loss": 0.6961, "learning_rate": 1.7212450508860794e-05, "epoch": 0.600782725307206, "percentage": 60.08, "elapsed_time": "4 days, 5:00:09", "remaining_time": "2 days, 19:06:07", "throughput": 2724.92, "total_tokens": 990806656} {"current_steps": 5489, "total_steps": 9134, "loss": 0.9414, "learning_rate": 1.720428016744607e-05, "epoch": 0.6008921973781439, "percentage": 60.09, "elapsed_time": "4 days, 5:01:17", "remaining_time": "2 days, 19:05:02", "throughput": 2724.92, "total_tokens": 990993696} {"current_steps": 5490, "total_steps": 9134, "loss": 0.8922, "learning_rate": 1.7196110748250095e-05, "epoch": 0.6010016694490818, "percentage": 60.11, "elapsed_time": "4 days, 5:02:23", "remaining_time": "2 days, 19:03:55", "throughput": 2724.88, "total_tokens": 991158784} {"current_steps": 5491, "total_steps": 9134, "loss": 0.7054, "learning_rate": 1.718794225223931e-05, "epoch": 0.6011111415200197, "percentage": 60.12, "elapsed_time": "4 days, 5:03:28", "remaining_time": "2 days, 19:02:48", "throughput": 2724.87, "total_tokens": 991330592} {"current_steps": 5492, "total_steps": 9134, "loss": 0.8146, "learning_rate": 1.7179774680380014e-05, "epoch": 0.6012206135909576, "percentage": 60.13, "elapsed_time": "4 days, 5:04:35", "remaining_time": "2 days, 19:01:42", "throughput": 2724.87, "total_tokens": 991511584} {"current_steps": 5493, "total_steps": 9134, "loss": 0.7095, "learning_rate": 1.7171608033638435e-05, "epoch": 0.6013300856618955, "percentage": 60.14, "elapsed_time": "4 days, 5:05:38", "remaining_time": "2 days, 19:00:34", "throughput": 2724.86, "total_tokens": 991679808} {"current_steps": 5494, "total_steps": 9134, "loss": 0.9056, "learning_rate": 1.716344231298065e-05, "epoch": 0.6014395577328334, "percentage": 60.15, "elapsed_time": "4 days, 5:06:48", "remaining_time": "2 days, 18:59:30", "throughput": 2724.89, "total_tokens": 991882304} {"current_steps": 5495, "total_steps": 9134, "loss": 0.9579, "learning_rate": 1.715527751937266e-05, "epoch": 0.6015490298037713, "percentage": 60.16, "elapsed_time": "4 days, 5:07:50", "remaining_time": "2 days, 18:58:21", "throughput": 2724.84, "total_tokens": 992036416} {"current_steps": 5496, "total_steps": 9134, "loss": 0.9317, "learning_rate": 1.714711365378034e-05, "epoch": 0.6016585018747093, "percentage": 60.17, "elapsed_time": "4 days, 5:08:53", "remaining_time": "2 days, 18:57:13", "throughput": 2724.81, "total_tokens": 992193888} {"current_steps": 5497, "total_steps": 9134, "loss": 0.6919, "learning_rate": 1.713895071716946e-05, "epoch": 0.6017679739456471, "percentage": 60.18, "elapsed_time": "4 days, 5:10:01", "remaining_time": "2 days, 18:56:07", "throughput": 2724.83, "total_tokens": 992388096} {"current_steps": 5498, "total_steps": 9134, "loss": 0.6749, "learning_rate": 1.7130788710505696e-05, "epoch": 0.601877446016585, "percentage": 60.19, "elapsed_time": "4 days, 5:11:09", "remaining_time": "2 days, 18:55:02", "throughput": 2724.86, "total_tokens": 992584992} {"current_steps": 5499, "total_steps": 9134, "loss": 0.6773, "learning_rate": 1.7122627634754573e-05, "epoch": 0.6019869180875229, "percentage": 60.2, "elapsed_time": "4 days, 5:12:12", "remaining_time": "2 days, 18:53:54", "throughput": 2724.83, "total_tokens": 992744704} {"current_steps": 5500, "total_steps": 9134, "loss": 0.8476, "learning_rate": 1.7114467490881553e-05, "epoch": 0.6020963901584608, "percentage": 60.21, "elapsed_time": "4 days, 5:13:19", "remaining_time": "2 days, 18:52:48", "throughput": 2724.82, "total_tokens": 992923008} {"current_steps": 5501, "total_steps": 9134, "loss": 0.6068, "learning_rate": 1.7106308279851945e-05, "epoch": 0.6022058622293988, "percentage": 60.23, "elapsed_time": "4 days, 5:14:27", "remaining_time": "2 days, 18:51:43", "throughput": 2724.88, "total_tokens": 993128864} {"current_steps": 5502, "total_steps": 9134, "loss": 0.6729, "learning_rate": 1.7098150002630988e-05, "epoch": 0.6023153343003367, "percentage": 60.24, "elapsed_time": "4 days, 5:15:34", "remaining_time": "2 days, 18:50:37", "throughput": 2724.88, "total_tokens": 993310976} {"current_steps": 5503, "total_steps": 9134, "loss": 0.6883, "learning_rate": 1.7089992660183766e-05, "epoch": 0.6024248063712745, "percentage": 60.25, "elapsed_time": "4 days, 5:16:42", "remaining_time": "2 days, 18:49:32", "throughput": 2724.91, "total_tokens": 993510336} {"current_steps": 5504, "total_steps": 9134, "loss": 0.7234, "learning_rate": 1.7081836253475292e-05, "epoch": 0.6025342784422124, "percentage": 60.26, "elapsed_time": "4 days, 5:17:51", "remaining_time": "2 days, 18:48:28", "throughput": 2724.94, "total_tokens": 993709248} {"current_steps": 5505, "total_steps": 9134, "loss": 0.6737, "learning_rate": 1.7073680783470457e-05, "epoch": 0.6026437505131503, "percentage": 60.27, "elapsed_time": "4 days, 5:19:01", "remaining_time": "2 days, 18:47:24", "throughput": 2724.95, "total_tokens": 993902560} {"current_steps": 5506, "total_steps": 9134, "loss": 0.6561, "learning_rate": 1.7065526251134033e-05, "epoch": 0.6027532225840883, "percentage": 60.28, "elapsed_time": "4 days, 5:20:07", "remaining_time": "2 days, 18:46:18", "throughput": 2724.9, "total_tokens": 994063392} {"current_steps": 5507, "total_steps": 9134, "loss": 0.8774, "learning_rate": 1.7057372657430687e-05, "epoch": 0.6028626946550262, "percentage": 60.29, "elapsed_time": "4 days, 5:21:10", "remaining_time": "2 days, 18:45:09", "throughput": 2724.84, "total_tokens": 994213696} {"current_steps": 5508, "total_steps": 9134, "loss": 0.7296, "learning_rate": 1.7049220003324964e-05, "epoch": 0.602972166725964, "percentage": 60.3, "elapsed_time": "4 days, 5:22:14", "remaining_time": "2 days, 18:44:02", "throughput": 2724.82, "total_tokens": 994381472} {"current_steps": 5509, "total_steps": 9134, "loss": 0.6512, "learning_rate": 1.7041068289781326e-05, "epoch": 0.6030816387969019, "percentage": 60.31, "elapsed_time": "4 days, 5:23:20", "remaining_time": "2 days, 18:42:55", "throughput": 2724.83, "total_tokens": 994562912} {"current_steps": 5510, "total_steps": 9134, "loss": 1.0969, "learning_rate": 1.7032917517764085e-05, "epoch": 0.6031911108678398, "percentage": 60.32, "elapsed_time": "4 days, 5:24:29", "remaining_time": "2 days, 18:41:51", "throughput": 2724.93, "total_tokens": 994788928} {"current_steps": 5511, "total_steps": 9134, "loss": 0.6186, "learning_rate": 1.7024767688237475e-05, "epoch": 0.6033005829387778, "percentage": 60.34, "elapsed_time": "4 days, 5:25:35", "remaining_time": "2 days, 18:40:44", "throughput": 2724.87, "total_tokens": 994947520} {"current_steps": 5512, "total_steps": 9134, "loss": 0.8869, "learning_rate": 1.7016618802165607e-05, "epoch": 0.6034100550097157, "percentage": 60.35, "elapsed_time": "4 days, 5:26:37", "remaining_time": "2 days, 18:39:35", "throughput": 2724.83, "total_tokens": 995099392} {"current_steps": 5513, "total_steps": 9134, "loss": 0.6334, "learning_rate": 1.7008470860512466e-05, "epoch": 0.6035195270806536, "percentage": 60.36, "elapsed_time": "4 days, 5:27:43", "remaining_time": "2 days, 18:38:29", "throughput": 2724.83, "total_tokens": 995279936} {"current_steps": 5514, "total_steps": 9134, "loss": 0.5778, "learning_rate": 1.7000323864241953e-05, "epoch": 0.6036289991515914, "percentage": 60.37, "elapsed_time": "4 days, 5:28:47", "remaining_time": "2 days, 18:37:21", "throughput": 2724.8, "total_tokens": 995445472} {"current_steps": 5515, "total_steps": 9134, "loss": 0.7222, "learning_rate": 1.699217781431782e-05, "epoch": 0.6037384712225293, "percentage": 60.38, "elapsed_time": "4 days, 5:29:54", "remaining_time": "2 days, 18:36:15", "throughput": 2724.79, "total_tokens": 995621312} {"current_steps": 5516, "total_steps": 9134, "loss": 0.9345, "learning_rate": 1.6984032711703753e-05, "epoch": 0.6038479432934672, "percentage": 60.39, "elapsed_time": "4 days, 5:31:03", "remaining_time": "2 days, 18:35:10", "throughput": 2724.83, "total_tokens": 995824480} {"current_steps": 5517, "total_steps": 9134, "loss": 0.6892, "learning_rate": 1.697588855736329e-05, "epoch": 0.6039574153644052, "percentage": 60.4, "elapsed_time": "4 days, 5:32:09", "remaining_time": "2 days, 18:34:05", "throughput": 2724.84, "total_tokens": 996008832} {"current_steps": 5518, "total_steps": 9134, "loss": 0.9348, "learning_rate": 1.6967745352259868e-05, "epoch": 0.6040668874353431, "percentage": 60.41, "elapsed_time": "4 days, 5:33:15", "remaining_time": "2 days, 18:32:58", "throughput": 2724.76, "total_tokens": 996161152} {"current_steps": 5519, "total_steps": 9134, "loss": 0.7976, "learning_rate": 1.6959603097356823e-05, "epoch": 0.604176359506281, "percentage": 60.42, "elapsed_time": "4 days, 5:34:22", "remaining_time": "2 days, 18:31:52", "throughput": 2724.76, "total_tokens": 996343264} {"current_steps": 5520, "total_steps": 9134, "loss": 0.6922, "learning_rate": 1.6951461793617354e-05, "epoch": 0.6042858315772188, "percentage": 60.43, "elapsed_time": "4 days, 5:35:27", "remaining_time": "2 days, 18:30:45", "throughput": 2724.76, "total_tokens": 996519552} {"current_steps": 5521, "total_steps": 9134, "loss": 0.6488, "learning_rate": 1.694332144200458e-05, "epoch": 0.6043953036481567, "percentage": 60.44, "elapsed_time": "4 days, 5:36:30", "remaining_time": "2 days, 18:29:37", "throughput": 2724.72, "total_tokens": 996677248} {"current_steps": 5522, "total_steps": 9134, "loss": 1.0386, "learning_rate": 1.693518204348146e-05, "epoch": 0.6045047757190947, "percentage": 60.46, "elapsed_time": "4 days, 5:37:35", "remaining_time": "2 days, 18:28:30", "throughput": 2724.73, "total_tokens": 996856224} {"current_steps": 5523, "total_steps": 9134, "loss": 0.8737, "learning_rate": 1.6927043599010906e-05, "epoch": 0.6046142477900326, "percentage": 60.47, "elapsed_time": "4 days, 5:38:37", "remaining_time": "2 days, 18:27:21", "throughput": 2724.65, "total_tokens": 996998912} {"current_steps": 5524, "total_steps": 9134, "loss": 0.8438, "learning_rate": 1.691890610955565e-05, "epoch": 0.6047237198609705, "percentage": 60.48, "elapsed_time": "4 days, 5:39:46", "remaining_time": "2 days, 18:26:16", "throughput": 2724.72, "total_tokens": 997210368} {"current_steps": 5525, "total_steps": 9134, "loss": 0.6916, "learning_rate": 1.691076957607835e-05, "epoch": 0.6048331919319083, "percentage": 60.49, "elapsed_time": "4 days, 5:40:54", "remaining_time": "2 days, 18:25:11", "throughput": 2724.68, "total_tokens": 997382400} {"current_steps": 5526, "total_steps": 9134, "loss": 0.6764, "learning_rate": 1.690263399954155e-05, "epoch": 0.6049426640028462, "percentage": 60.5, "elapsed_time": "4 days, 5:42:03", "remaining_time": "2 days, 18:24:06", "throughput": 2724.66, "total_tokens": 997560256} {"current_steps": 5527, "total_steps": 9134, "loss": 1.0718, "learning_rate": 1.689449938090767e-05, "epoch": 0.6050521360737842, "percentage": 60.51, "elapsed_time": "4 days, 5:43:12", "remaining_time": "2 days, 18:23:02", "throughput": 2724.66, "total_tokens": 997747968} {"current_steps": 5528, "total_steps": 9134, "loss": 0.8101, "learning_rate": 1.688636572113902e-05, "epoch": 0.6051616081447221, "percentage": 60.52, "elapsed_time": "4 days, 5:44:20", "remaining_time": "2 days, 18:21:57", "throughput": 2724.69, "total_tokens": 997946208} {"current_steps": 5529, "total_steps": 9134, "loss": 0.5713, "learning_rate": 1.6878233021197783e-05, "epoch": 0.60527108021566, "percentage": 60.53, "elapsed_time": "4 days, 5:45:25", "remaining_time": "2 days, 18:20:50", "throughput": 2724.64, "total_tokens": 998106816} {"current_steps": 5530, "total_steps": 9134, "loss": 0.7715, "learning_rate": 1.687010128204607e-05, "epoch": 0.6053805522865979, "percentage": 60.54, "elapsed_time": "4 days, 5:46:30", "remaining_time": "2 days, 18:19:43", "throughput": 2724.61, "total_tokens": 998271904} {"current_steps": 5531, "total_steps": 9134, "loss": 0.6131, "learning_rate": 1.6861970504645818e-05, "epoch": 0.6054900243575357, "percentage": 60.55, "elapsed_time": "4 days, 5:47:37", "remaining_time": "2 days, 18:18:37", "throughput": 2724.64, "total_tokens": 998465440} {"current_steps": 5532, "total_steps": 9134, "loss": 0.7166, "learning_rate": 1.6853840689958904e-05, "epoch": 0.6055994964284737, "percentage": 60.56, "elapsed_time": "4 days, 5:48:38", "remaining_time": "2 days, 18:17:28", "throughput": 2724.56, "total_tokens": 998603424} {"current_steps": 5533, "total_steps": 9134, "loss": 0.5986, "learning_rate": 1.684571183894707e-05, "epoch": 0.6057089684994116, "percentage": 60.58, "elapsed_time": "4 days, 5:49:47", "remaining_time": "2 days, 18:16:23", "throughput": 2724.58, "total_tokens": 998796960} {"current_steps": 5534, "total_steps": 9134, "loss": 0.7069, "learning_rate": 1.6837583952571927e-05, "epoch": 0.6058184405703495, "percentage": 60.59, "elapsed_time": "4 days, 5:50:55", "remaining_time": "2 days, 18:15:18", "throughput": 2724.57, "total_tokens": 998978848} {"current_steps": 5535, "total_steps": 9134, "loss": 0.6636, "learning_rate": 1.682945703179501e-05, "epoch": 0.6059279126412874, "percentage": 60.6, "elapsed_time": "4 days, 5:51:59", "remaining_time": "2 days, 18:14:10", "throughput": 2724.52, "total_tokens": 999136096} {"current_steps": 5536, "total_steps": 9134, "loss": 0.716, "learning_rate": 1.6821331077577697e-05, "epoch": 0.6060373847122253, "percentage": 60.61, "elapsed_time": "4 days, 5:53:03", "remaining_time": "2 days, 18:13:02", "throughput": 2724.53, "total_tokens": 999311488} {"current_steps": 5537, "total_steps": 9134, "loss": 0.8667, "learning_rate": 1.6813206090881285e-05, "epoch": 0.6061468567831632, "percentage": 60.62, "elapsed_time": "4 days, 5:54:12", "remaining_time": "2 days, 18:11:58", "throughput": 2724.51, "total_tokens": 999493824} {"current_steps": 5538, "total_steps": 9134, "loss": 0.8186, "learning_rate": 1.680508207266694e-05, "epoch": 0.6062563288541011, "percentage": 60.63, "elapsed_time": "4 days, 5:55:16", "remaining_time": "2 days, 18:10:50", "throughput": 2724.46, "total_tokens": 999650176} {"current_steps": 5539, "total_steps": 9134, "loss": 0.6468, "learning_rate": 1.6796959023895717e-05, "epoch": 0.606365800925039, "percentage": 60.64, "elapsed_time": "4 days, 5:56:22", "remaining_time": "2 days, 18:09:44", "throughput": 2724.45, "total_tokens": 999826912} {"current_steps": 5540, "total_steps": 9134, "loss": 0.8095, "learning_rate": 1.678883694552857e-05, "epoch": 0.6064752729959769, "percentage": 60.65, "elapsed_time": "4 days, 5:57:27", "remaining_time": "2 days, 18:08:37", "throughput": 2724.43, "total_tokens": 999996928} {"current_steps": 5541, "total_steps": 9134, "loss": 0.8928, "learning_rate": 1.678071583852631e-05, "epoch": 0.6065847450669148, "percentage": 60.66, "elapsed_time": "4 days, 5:58:36", "remaining_time": "2 days, 18:07:32", "throughput": 2724.51, "total_tokens": 1000215104} {"current_steps": 5542, "total_steps": 9134, "loss": 1.0532, "learning_rate": 1.677259570384966e-05, "epoch": 0.6066942171378527, "percentage": 60.67, "elapsed_time": "4 days, 5:59:45", "remaining_time": "2 days, 18:06:28", "throughput": 2724.59, "total_tokens": 1000430144} {"current_steps": 5543, "total_steps": 9134, "loss": 0.5697, "learning_rate": 1.67644765424592e-05, "epoch": 0.6068036892087906, "percentage": 60.69, "elapsed_time": "4 days, 6:00:49", "remaining_time": "2 days, 18:05:20", "throughput": 2724.56, "total_tokens": 1000591424} {"current_steps": 5544, "total_steps": 9134, "loss": 0.7783, "learning_rate": 1.6756358355315433e-05, "epoch": 0.6069131612797285, "percentage": 60.7, "elapsed_time": "4 days, 6:01:56", "remaining_time": "2 days, 18:04:14", "throughput": 2724.59, "total_tokens": 1000786528} {"current_steps": 5545, "total_steps": 9134, "loss": 0.8278, "learning_rate": 1.6748241143378702e-05, "epoch": 0.6070226333506664, "percentage": 60.71, "elapsed_time": "4 days, 6:03:02", "remaining_time": "2 days, 18:03:08", "throughput": 2724.56, "total_tokens": 1000958112} {"current_steps": 5546, "total_steps": 9134, "loss": 0.8167, "learning_rate": 1.6740124907609266e-05, "epoch": 0.6071321054216043, "percentage": 60.72, "elapsed_time": "4 days, 6:04:11", "remaining_time": "2 days, 18:02:03", "throughput": 2724.59, "total_tokens": 1001154784} {"current_steps": 5547, "total_steps": 9134, "loss": 0.7418, "learning_rate": 1.6732009648967272e-05, "epoch": 0.6072415774925423, "percentage": 60.73, "elapsed_time": "4 days, 6:05:18", "remaining_time": "2 days, 18:00:58", "throughput": 2724.56, "total_tokens": 1001326592} {"current_steps": 5548, "total_steps": 9134, "loss": 0.6757, "learning_rate": 1.6723895368412732e-05, "epoch": 0.6073510495634801, "percentage": 60.74, "elapsed_time": "4 days, 6:06:25", "remaining_time": "2 days, 17:59:51", "throughput": 2724.57, "total_tokens": 1001510496} {"current_steps": 5549, "total_steps": 9134, "loss": 0.7962, "learning_rate": 1.6715782066905544e-05, "epoch": 0.607460521634418, "percentage": 60.75, "elapsed_time": "4 days, 6:07:30", "remaining_time": "2 days, 17:58:45", "throughput": 2724.55, "total_tokens": 1001681856} {"current_steps": 5550, "total_steps": 9134, "loss": 0.9985, "learning_rate": 1.6707669745405502e-05, "epoch": 0.6075699937053559, "percentage": 60.76, "elapsed_time": "4 days, 6:08:39", "remaining_time": "2 days, 17:57:40", "throughput": 2724.62, "total_tokens": 1001895104} {"current_steps": 5551, "total_steps": 9134, "loss": 0.9074, "learning_rate": 1.6699558404872272e-05, "epoch": 0.6076794657762938, "percentage": 60.77, "elapsed_time": "4 days, 6:09:46", "remaining_time": "2 days, 17:56:35", "throughput": 2724.67, "total_tokens": 1002098048} {"current_steps": 5552, "total_steps": 9134, "loss": 0.7959, "learning_rate": 1.6691448046265426e-05, "epoch": 0.6077889378472318, "percentage": 60.78, "elapsed_time": "4 days, 6:10:50", "remaining_time": "2 days, 17:55:26", "throughput": 2724.66, "total_tokens": 1002267840} {"current_steps": 5553, "total_steps": 9134, "loss": 0.6694, "learning_rate": 1.6683338670544384e-05, "epoch": 0.6078984099181697, "percentage": 60.79, "elapsed_time": "4 days, 6:11:58", "remaining_time": "2 days, 17:54:21", "throughput": 2724.66, "total_tokens": 1002453984} {"current_steps": 5554, "total_steps": 9134, "loss": 0.9039, "learning_rate": 1.6675230278668484e-05, "epoch": 0.6080078819891075, "percentage": 60.81, "elapsed_time": "4 days, 6:13:04", "remaining_time": "2 days, 17:53:15", "throughput": 2724.67, "total_tokens": 1002635648} {"current_steps": 5555, "total_steps": 9134, "loss": 0.5707, "learning_rate": 1.6667122871596925e-05, "epoch": 0.6081173540600454, "percentage": 60.82, "elapsed_time": "4 days, 6:14:14", "remaining_time": "2 days, 17:52:11", "throughput": 2724.72, "total_tokens": 1002845760} {"current_steps": 5556, "total_steps": 9134, "loss": 0.8132, "learning_rate": 1.6659016450288805e-05, "epoch": 0.6082268261309833, "percentage": 60.83, "elapsed_time": "4 days, 6:15:21", "remaining_time": "2 days, 17:51:05", "throughput": 2724.73, "total_tokens": 1003031904} {"current_steps": 5557, "total_steps": 9134, "loss": 0.6512, "learning_rate": 1.665091101570309e-05, "epoch": 0.6083362982019213, "percentage": 60.84, "elapsed_time": "4 days, 6:16:25", "remaining_time": "2 days, 17:49:58", "throughput": 2724.74, "total_tokens": 1003211776} {"current_steps": 5558, "total_steps": 9134, "loss": 0.5813, "learning_rate": 1.6642806568798635e-05, "epoch": 0.6084457702728592, "percentage": 60.85, "elapsed_time": "4 days, 6:17:29", "remaining_time": "2 days, 17:48:50", "throughput": 2724.72, "total_tokens": 1003377536} {"current_steps": 5559, "total_steps": 9134, "loss": 0.7503, "learning_rate": 1.6634703110534195e-05, "epoch": 0.608555242343797, "percentage": 60.86, "elapsed_time": "4 days, 6:18:39", "remaining_time": "2 days, 17:47:46", "throughput": 2724.73, "total_tokens": 1003571072} {"current_steps": 5560, "total_steps": 9134, "loss": 0.5809, "learning_rate": 1.662660064186838e-05, "epoch": 0.6086647144147349, "percentage": 60.87, "elapsed_time": "4 days, 6:19:45", "remaining_time": "2 days, 17:46:40", "throughput": 2724.75, "total_tokens": 1003759904} {"current_steps": 5561, "total_steps": 9134, "loss": 0.7881, "learning_rate": 1.661849916375971e-05, "epoch": 0.6087741864856728, "percentage": 60.88, "elapsed_time": "4 days, 6:20:51", "remaining_time": "2 days, 17:45:33", "throughput": 2724.74, "total_tokens": 1003934624} {"current_steps": 5562, "total_steps": 9134, "loss": 0.554, "learning_rate": 1.6610398677166555e-05, "epoch": 0.6088836585566108, "percentage": 60.89, "elapsed_time": "4 days, 6:21:51", "remaining_time": "2 days, 17:44:23", "throughput": 2724.69, "total_tokens": 1004079104} {"current_steps": 5563, "total_steps": 9134, "loss": 0.6521, "learning_rate": 1.660229918304721e-05, "epoch": 0.6089931306275487, "percentage": 60.9, "elapsed_time": "4 days, 6:22:58", "remaining_time": "2 days, 17:43:17", "throughput": 2724.71, "total_tokens": 1004269504} {"current_steps": 5564, "total_steps": 9134, "loss": 0.705, "learning_rate": 1.659420068235981e-05, "epoch": 0.6091026026984866, "percentage": 60.92, "elapsed_time": "4 days, 6:24:05", "remaining_time": "2 days, 17:42:11", "throughput": 2724.76, "total_tokens": 1004470880} {"current_steps": 5565, "total_steps": 9134, "loss": 0.5571, "learning_rate": 1.6586103176062397e-05, "epoch": 0.6092120747694244, "percentage": 60.93, "elapsed_time": "4 days, 6:25:05", "remaining_time": "2 days, 17:41:01", "throughput": 2724.73, "total_tokens": 1004621184} {"current_steps": 5566, "total_steps": 9134, "loss": 0.8197, "learning_rate": 1.6578006665112906e-05, "epoch": 0.6093215468403623, "percentage": 60.94, "elapsed_time": "4 days, 6:26:13", "remaining_time": "2 days, 17:39:56", "throughput": 2724.78, "total_tokens": 1004827712} {"current_steps": 5567, "total_steps": 9134, "loss": 0.5778, "learning_rate": 1.6569911150469113e-05, "epoch": 0.6094310189113002, "percentage": 60.95, "elapsed_time": "4 days, 6:27:20", "remaining_time": "2 days, 17:38:51", "throughput": 2724.81, "total_tokens": 1005021024} {"current_steps": 5568, "total_steps": 9134, "loss": 0.8989, "learning_rate": 1.6561816633088723e-05, "epoch": 0.6095404909822382, "percentage": 60.96, "elapsed_time": "4 days, 6:28:29", "remaining_time": "2 days, 17:37:46", "throughput": 2724.79, "total_tokens": 1005199552} {"current_steps": 5569, "total_steps": 9134, "loss": 0.9195, "learning_rate": 1.6553723113929296e-05, "epoch": 0.6096499630531761, "percentage": 60.97, "elapsed_time": "4 days, 6:29:34", "remaining_time": "2 days, 17:36:39", "throughput": 2724.76, "total_tokens": 1005363968} {"current_steps": 5570, "total_steps": 9134, "loss": 0.7277, "learning_rate": 1.6545630593948276e-05, "epoch": 0.609759435124114, "percentage": 60.98, "elapsed_time": "4 days, 6:30:41", "remaining_time": "2 days, 17:35:33", "throughput": 2724.77, "total_tokens": 1005554368} {"current_steps": 5571, "total_steps": 9134, "loss": 0.6542, "learning_rate": 1.6537539074102988e-05, "epoch": 0.6098689071950518, "percentage": 60.99, "elapsed_time": "4 days, 6:31:47", "remaining_time": "2 days, 17:34:27", "throughput": 2724.77, "total_tokens": 1005733568} {"current_steps": 5572, "total_steps": 9134, "loss": 0.6329, "learning_rate": 1.6529448555350653e-05, "epoch": 0.6099783792659897, "percentage": 61.0, "elapsed_time": "4 days, 6:32:55", "remaining_time": "2 days, 17:33:21", "throughput": 2724.8, "total_tokens": 1005929344} {"current_steps": 5573, "total_steps": 9134, "loss": 0.6468, "learning_rate": 1.652135903864837e-05, "epoch": 0.6100878513369277, "percentage": 61.01, "elapsed_time": "4 days, 6:34:02", "remaining_time": "2 days, 17:32:16", "throughput": 2724.82, "total_tokens": 1006120192} {"current_steps": 5574, "total_steps": 9134, "loss": 0.8085, "learning_rate": 1.6513270524953092e-05, "epoch": 0.6101973234078656, "percentage": 61.02, "elapsed_time": "4 days, 6:35:09", "remaining_time": "2 days, 17:31:10", "throughput": 2724.79, "total_tokens": 1006292672} {"current_steps": 5575, "total_steps": 9134, "loss": 0.9803, "learning_rate": 1.65051830152217e-05, "epoch": 0.6103067954788035, "percentage": 61.04, "elapsed_time": "4 days, 6:36:18", "remaining_time": "2 days, 17:30:06", "throughput": 2724.81, "total_tokens": 1006487104} {"current_steps": 5576, "total_steps": 9134, "loss": 0.7258, "learning_rate": 1.6497096510410908e-05, "epoch": 0.6104162675497413, "percentage": 61.05, "elapsed_time": "4 days, 6:37:23", "remaining_time": "2 days, 17:28:59", "throughput": 2724.83, "total_tokens": 1006673696} {"current_steps": 5577, "total_steps": 9134, "loss": 0.9891, "learning_rate": 1.648901101147735e-05, "epoch": 0.6105257396206792, "percentage": 61.06, "elapsed_time": "4 days, 6:38:33", "remaining_time": "2 days, 17:27:54", "throughput": 2724.81, "total_tokens": 1006853344} {"current_steps": 5578, "total_steps": 9134, "loss": 0.7626, "learning_rate": 1.6480926519377514e-05, "epoch": 0.6106352116916172, "percentage": 61.07, "elapsed_time": "4 days, 6:39:36", "remaining_time": "2 days, 17:26:46", "throughput": 2724.79, "total_tokens": 1007018656} {"current_steps": 5579, "total_steps": 9134, "loss": 1.0454, "learning_rate": 1.6472843035067784e-05, "epoch": 0.6107446837625551, "percentage": 61.08, "elapsed_time": "4 days, 6:40:45", "remaining_time": "2 days, 17:25:42", "throughput": 2724.82, "total_tokens": 1007218240} {"current_steps": 5580, "total_steps": 9134, "loss": 0.7578, "learning_rate": 1.6464760559504424e-05, "epoch": 0.610854155833493, "percentage": 61.09, "elapsed_time": "4 days, 6:41:54", "remaining_time": "2 days, 17:24:37", "throughput": 2724.85, "total_tokens": 1007417152} {"current_steps": 5581, "total_steps": 9134, "loss": 0.8691, "learning_rate": 1.6456679093643572e-05, "epoch": 0.6109636279044309, "percentage": 61.1, "elapsed_time": "4 days, 6:43:02", "remaining_time": "2 days, 17:23:32", "throughput": 2724.88, "total_tokens": 1007611584} {"current_steps": 5582, "total_steps": 9134, "loss": 0.6419, "learning_rate": 1.644859863844126e-05, "epoch": 0.6110730999753687, "percentage": 61.11, "elapsed_time": "4 days, 6:44:07", "remaining_time": "2 days, 17:22:25", "throughput": 2724.82, "total_tokens": 1007767712} {"current_steps": 5583, "total_steps": 9134, "loss": 0.6541, "learning_rate": 1.644051919485337e-05, "epoch": 0.6111825720463067, "percentage": 61.12, "elapsed_time": "4 days, 6:45:14", "remaining_time": "2 days, 17:21:19", "throughput": 2724.85, "total_tokens": 1007960800} {"current_steps": 5584, "total_steps": 9134, "loss": 0.6812, "learning_rate": 1.643244076383571e-05, "epoch": 0.6112920441172446, "percentage": 61.13, "elapsed_time": "4 days, 6:46:19", "remaining_time": "2 days, 17:20:12", "throughput": 2724.84, "total_tokens": 1008135072} {"current_steps": 5585, "total_steps": 9134, "loss": 0.9242, "learning_rate": 1.6424363346343912e-05, "epoch": 0.6114015161881825, "percentage": 61.15, "elapsed_time": "4 days, 6:47:27", "remaining_time": "2 days, 17:19:07", "throughput": 2724.83, "total_tokens": 1008317408} {"current_steps": 5586, "total_steps": 9134, "loss": 0.7242, "learning_rate": 1.641628694333354e-05, "epoch": 0.6115109882591204, "percentage": 61.16, "elapsed_time": "4 days, 6:48:30", "remaining_time": "2 days, 17:17:59", "throughput": 2724.8, "total_tokens": 1008475776} {"current_steps": 5587, "total_steps": 9134, "loss": 0.656, "learning_rate": 1.6408211555760028e-05, "epoch": 0.6116204603300583, "percentage": 61.17, "elapsed_time": "4 days, 6:49:36", "remaining_time": "2 days, 17:16:52", "throughput": 2724.77, "total_tokens": 1008647136} {"current_steps": 5588, "total_steps": 9134, "loss": 0.6507, "learning_rate": 1.6400137184578647e-05, "epoch": 0.6117299324009962, "percentage": 61.18, "elapsed_time": "4 days, 6:50:42", "remaining_time": "2 days, 17:15:46", "throughput": 2724.73, "total_tokens": 1008812896} {"current_steps": 5589, "total_steps": 9134, "loss": 0.7057, "learning_rate": 1.639206383074461e-05, "epoch": 0.6118394044719341, "percentage": 61.19, "elapsed_time": "4 days, 6:51:50", "remaining_time": "2 days, 17:14:41", "throughput": 2724.73, "total_tokens": 1008995680} {"current_steps": 5590, "total_steps": 9134, "loss": 0.8946, "learning_rate": 1.6383991495212957e-05, "epoch": 0.611948876542872, "percentage": 61.2, "elapsed_time": "4 days, 6:52:58", "remaining_time": "2 days, 17:13:36", "throughput": 2724.8, "total_tokens": 1009209600} {"current_steps": 5591, "total_steps": 9134, "loss": 0.6025, "learning_rate": 1.6375920178938646e-05, "epoch": 0.6120583486138099, "percentage": 61.21, "elapsed_time": "4 days, 6:54:05", "remaining_time": "2 days, 17:12:30", "throughput": 2724.73, "total_tokens": 1009361696} {"current_steps": 5592, "total_steps": 9134, "loss": 0.7432, "learning_rate": 1.6367849882876485e-05, "epoch": 0.6121678206847478, "percentage": 61.22, "elapsed_time": "4 days, 6:55:13", "remaining_time": "2 days, 17:11:25", "throughput": 2724.73, "total_tokens": 1009551200} {"current_steps": 5593, "total_steps": 9134, "loss": 0.937, "learning_rate": 1.635978060798118e-05, "epoch": 0.6122772927556857, "percentage": 61.23, "elapsed_time": "4 days, 6:56:20", "remaining_time": "2 days, 17:10:19", "throughput": 2724.77, "total_tokens": 1009746976} {"current_steps": 5594, "total_steps": 9134, "loss": 0.8917, "learning_rate": 1.6351712355207323e-05, "epoch": 0.6123867648266236, "percentage": 61.24, "elapsed_time": "4 days, 6:57:26", "remaining_time": "2 days, 17:09:12", "throughput": 2724.78, "total_tokens": 1009928192} {"current_steps": 5595, "total_steps": 9134, "loss": 0.8546, "learning_rate": 1.6343645125509348e-05, "epoch": 0.6124962368975615, "percentage": 61.25, "elapsed_time": "4 days, 6:58:35", "remaining_time": "2 days, 17:08:08", "throughput": 2724.77, "total_tokens": 1010113216} {"current_steps": 5596, "total_steps": 9134, "loss": 0.7644, "learning_rate": 1.633557891984162e-05, "epoch": 0.6126057089684994, "percentage": 61.27, "elapsed_time": "4 days, 6:59:39", "remaining_time": "2 days, 17:07:00", "throughput": 2724.75, "total_tokens": 1010279648} {"current_steps": 5597, "total_steps": 9134, "loss": 0.551, "learning_rate": 1.632751373915833e-05, "epoch": 0.6127151810394373, "percentage": 61.28, "elapsed_time": "4 days, 7:00:47", "remaining_time": "2 days, 17:05:55", "throughput": 2724.77, "total_tokens": 1010474976} {"current_steps": 5598, "total_steps": 9134, "loss": 0.7171, "learning_rate": 1.6319449584413596e-05, "epoch": 0.6128246531103753, "percentage": 61.29, "elapsed_time": "4 days, 7:01:56", "remaining_time": "2 days, 17:04:51", "throughput": 2724.79, "total_tokens": 1010668960} {"current_steps": 5599, "total_steps": 9134, "loss": 0.7969, "learning_rate": 1.6311386456561373e-05, "epoch": 0.6129341251813131, "percentage": 61.3, "elapsed_time": "4 days, 7:03:06", "remaining_time": "2 days, 17:03:46", "throughput": 2724.85, "total_tokens": 1010881760} {"current_steps": 5600, "total_steps": 9134, "loss": 0.8477, "learning_rate": 1.6303324356555523e-05, "epoch": 0.613043597252251, "percentage": 61.31, "elapsed_time": "4 days, 7:04:10", "remaining_time": "2 days, 17:02:39", "throughput": 2724.83, "total_tokens": 1011052224} {"current_steps": 5601, "total_steps": 9134, "loss": 0.7495, "learning_rate": 1.6295263285349776e-05, "epoch": 0.6131530693231889, "percentage": 61.32, "elapsed_time": "4 days, 7:05:17", "remaining_time": "2 days, 17:01:33", "throughput": 2724.83, "total_tokens": 1011230752} {"current_steps": 5602, "total_steps": 9134, "loss": 0.5814, "learning_rate": 1.628720324389774e-05, "epoch": 0.6132625413941268, "percentage": 61.33, "elapsed_time": "4 days, 7:06:21", "remaining_time": "2 days, 17:00:25", "throughput": 2724.8, "total_tokens": 1011392704} {"current_steps": 5603, "total_steps": 9134, "loss": 0.9052, "learning_rate": 1.6279144233152922e-05, "epoch": 0.6133720134650648, "percentage": 61.34, "elapsed_time": "4 days, 7:07:28", "remaining_time": "2 days, 16:59:19", "throughput": 2724.76, "total_tokens": 1011561376} {"current_steps": 5604, "total_steps": 9134, "loss": 0.7543, "learning_rate": 1.6271086254068653e-05, "epoch": 0.6134814855360027, "percentage": 61.35, "elapsed_time": "4 days, 7:08:36", "remaining_time": "2 days, 16:58:14", "throughput": 2724.8, "total_tokens": 1011760512} {"current_steps": 5605, "total_steps": 9134, "loss": 0.8816, "learning_rate": 1.6263029307598198e-05, "epoch": 0.6135909576069405, "percentage": 61.36, "elapsed_time": "4 days, 7:09:44", "remaining_time": "2 days, 16:57:09", "throughput": 2724.79, "total_tokens": 1011946208} {"current_steps": 5606, "total_steps": 9134, "loss": 0.8905, "learning_rate": 1.6254973394694672e-05, "epoch": 0.6137004296778784, "percentage": 61.38, "elapsed_time": "4 days, 7:10:53", "remaining_time": "2 days, 16:56:04", "throughput": 2724.81, "total_tokens": 1012138624} {"current_steps": 5607, "total_steps": 9134, "loss": 0.633, "learning_rate": 1.6246918516311072e-05, "epoch": 0.6138099017488163, "percentage": 61.39, "elapsed_time": "4 days, 7:11:59", "remaining_time": "2 days, 16:54:58", "throughput": 2724.81, "total_tokens": 1012319840} {"current_steps": 5608, "total_steps": 9134, "loss": 0.9574, "learning_rate": 1.623886467340029e-05, "epoch": 0.6139193738197543, "percentage": 61.4, "elapsed_time": "4 days, 7:13:09", "remaining_time": "2 days, 16:53:54", "throughput": 2724.85, "total_tokens": 1012523456} {"current_steps": 5609, "total_steps": 9134, "loss": 0.9073, "learning_rate": 1.6230811866915057e-05, "epoch": 0.6140288458906922, "percentage": 61.41, "elapsed_time": "4 days, 7:14:17", "remaining_time": "2 days, 16:52:49", "throughput": 2724.81, "total_tokens": 1012695264} {"current_steps": 5610, "total_steps": 9134, "loss": 0.5939, "learning_rate": 1.622276009780802e-05, "epoch": 0.61413831796163, "percentage": 61.42, "elapsed_time": "4 days, 7:15:21", "remaining_time": "2 days, 16:51:42", "throughput": 2724.76, "total_tokens": 1012852288} {"current_steps": 5611, "total_steps": 9134, "loss": 0.8305, "learning_rate": 1.621470936703169e-05, "epoch": 0.6142477900325679, "percentage": 61.43, "elapsed_time": "4 days, 7:16:26", "remaining_time": "2 days, 16:50:34", "throughput": 2724.71, "total_tokens": 1013010432} {"current_steps": 5612, "total_steps": 9134, "loss": 0.6938, "learning_rate": 1.6206659675538445e-05, "epoch": 0.6143572621035058, "percentage": 61.44, "elapsed_time": "4 days, 7:17:33", "remaining_time": "2 days, 16:49:29", "throughput": 2724.71, "total_tokens": 1013190976} {"current_steps": 5613, "total_steps": 9134, "loss": 0.8629, "learning_rate": 1.6198611024280543e-05, "epoch": 0.6144667341744438, "percentage": 61.45, "elapsed_time": "4 days, 7:18:36", "remaining_time": "2 days, 16:48:21", "throughput": 2724.66, "total_tokens": 1013346432} {"current_steps": 5614, "total_steps": 9134, "loss": 0.5833, "learning_rate": 1.6190563414210132e-05, "epoch": 0.6145762062453817, "percentage": 61.46, "elapsed_time": "4 days, 7:19:41", "remaining_time": "2 days, 16:47:14", "throughput": 2724.63, "total_tokens": 1013514432} {"current_steps": 5615, "total_steps": 9134, "loss": 1.0842, "learning_rate": 1.6182516846279237e-05, "epoch": 0.6146856783163196, "percentage": 61.47, "elapsed_time": "4 days, 7:20:48", "remaining_time": "2 days, 16:46:07", "throughput": 2724.59, "total_tokens": 1013679296} {"current_steps": 5616, "total_steps": 9134, "loss": 0.8542, "learning_rate": 1.6174471321439737e-05, "epoch": 0.6147951503872574, "percentage": 61.48, "elapsed_time": "4 days, 7:21:55", "remaining_time": "2 days, 16:45:02", "throughput": 2724.58, "total_tokens": 1013856928} {"current_steps": 5617, "total_steps": 9134, "loss": 0.7794, "learning_rate": 1.6166426840643415e-05, "epoch": 0.6149046224581953, "percentage": 61.5, "elapsed_time": "4 days, 7:23:00", "remaining_time": "2 days, 16:43:55", "throughput": 2724.59, "total_tokens": 1014039040} {"current_steps": 5618, "total_steps": 9134, "loss": 0.8752, "learning_rate": 1.6158383404841902e-05, "epoch": 0.6150140945291332, "percentage": 61.51, "elapsed_time": "4 days, 7:24:09", "remaining_time": "2 days, 16:42:50", "throughput": 2724.68, "total_tokens": 1014261472} {"current_steps": 5619, "total_steps": 9134, "loss": 0.6257, "learning_rate": 1.615034101498673e-05, "epoch": 0.6151235666000712, "percentage": 61.52, "elapsed_time": "4 days, 7:25:16", "remaining_time": "2 days, 16:41:44", "throughput": 2724.66, "total_tokens": 1014436192} {"current_steps": 5620, "total_steps": 9134, "loss": 0.7707, "learning_rate": 1.6142299672029307e-05, "epoch": 0.6152330386710091, "percentage": 61.53, "elapsed_time": "4 days, 7:26:24", "remaining_time": "2 days, 16:40:39", "throughput": 2724.66, "total_tokens": 1014618752} {"current_steps": 5621, "total_steps": 9134, "loss": 0.9942, "learning_rate": 1.613425937692089e-05, "epoch": 0.615342510741947, "percentage": 61.54, "elapsed_time": "4 days, 7:27:33", "remaining_time": "2 days, 16:39:35", "throughput": 2724.63, "total_tokens": 1014798848} {"current_steps": 5622, "total_steps": 9134, "loss": 0.788, "learning_rate": 1.6126220130612646e-05, "epoch": 0.6154519828128848, "percentage": 61.55, "elapsed_time": "4 days, 7:28:39", "remaining_time": "2 days, 16:38:28", "throughput": 2724.65, "total_tokens": 1014986560} {"current_steps": 5623, "total_steps": 9134, "loss": 0.5454, "learning_rate": 1.6118181934055593e-05, "epoch": 0.6155614548838227, "percentage": 61.56, "elapsed_time": "4 days, 7:29:44", "remaining_time": "2 days, 16:37:21", "throughput": 2724.64, "total_tokens": 1015159264} {"current_steps": 5624, "total_steps": 9134, "loss": 0.8409, "learning_rate": 1.611014478820064e-05, "epoch": 0.6156709269547607, "percentage": 61.57, "elapsed_time": "4 days, 7:30:53", "remaining_time": "2 days, 16:36:17", "throughput": 2724.64, "total_tokens": 1015347872} {"current_steps": 5625, "total_steps": 9134, "loss": 0.7603, "learning_rate": 1.6102108693998568e-05, "epoch": 0.6157803990256986, "percentage": 61.58, "elapsed_time": "4 days, 7:31:58", "remaining_time": "2 days, 16:35:10", "throughput": 2724.57, "total_tokens": 1015498400} {"current_steps": 5626, "total_steps": 9134, "loss": 0.652, "learning_rate": 1.6094073652400014e-05, "epoch": 0.6158898710966365, "percentage": 61.59, "elapsed_time": "4 days, 7:33:04", "remaining_time": "2 days, 16:34:03", "throughput": 2724.6, "total_tokens": 1015688576} {"current_steps": 5627, "total_steps": 9134, "loss": 0.8421, "learning_rate": 1.608603966435554e-05, "epoch": 0.6159993431675743, "percentage": 61.6, "elapsed_time": "4 days, 7:34:11", "remaining_time": "2 days, 16:32:57", "throughput": 2724.59, "total_tokens": 1015868448} {"current_steps": 5628, "total_steps": 9134, "loss": 0.6916, "learning_rate": 1.607800673081552e-05, "epoch": 0.6161088152385122, "percentage": 61.62, "elapsed_time": "4 days, 7:35:19", "remaining_time": "2 days, 16:31:52", "throughput": 2724.59, "total_tokens": 1016054816} {"current_steps": 5629, "total_steps": 9134, "loss": 0.7484, "learning_rate": 1.6069974852730263e-05, "epoch": 0.6162182873094502, "percentage": 61.63, "elapsed_time": "4 days, 7:36:25", "remaining_time": "2 days, 16:30:46", "throughput": 2724.59, "total_tokens": 1016232224} {"current_steps": 5630, "total_steps": 9134, "loss": 0.6238, "learning_rate": 1.6061944031049893e-05, "epoch": 0.6163277593803881, "percentage": 61.64, "elapsed_time": "4 days, 7:37:32", "remaining_time": "2 days, 16:29:40", "throughput": 2724.6, "total_tokens": 1016420384} {"current_steps": 5631, "total_steps": 9134, "loss": 0.8591, "learning_rate": 1.605391426672447e-05, "epoch": 0.616437231451326, "percentage": 61.65, "elapsed_time": "4 days, 7:38:41", "remaining_time": "2 days, 16:28:36", "throughput": 2724.69, "total_tokens": 1016639904} {"current_steps": 5632, "total_steps": 9134, "loss": 0.8722, "learning_rate": 1.604588556070388e-05, "epoch": 0.6165467035222639, "percentage": 61.66, "elapsed_time": "4 days, 7:39:46", "remaining_time": "2 days, 16:27:29", "throughput": 2724.65, "total_tokens": 1016802976} {"current_steps": 5633, "total_steps": 9134, "loss": 0.7539, "learning_rate": 1.6037857913937908e-05, "epoch": 0.6166561755932017, "percentage": 61.67, "elapsed_time": "4 days, 7:40:50", "remaining_time": "2 days, 16:26:21", "throughput": 2724.61, "total_tokens": 1016962688} {"current_steps": 5634, "total_steps": 9134, "loss": 0.7009, "learning_rate": 1.6029831327376217e-05, "epoch": 0.6167656476641397, "percentage": 61.68, "elapsed_time": "4 days, 7:41:55", "remaining_time": "2 days, 16:25:14", "throughput": 2724.61, "total_tokens": 1017139424} {"current_steps": 5635, "total_steps": 9134, "loss": 0.8175, "learning_rate": 1.6021805801968325e-05, "epoch": 0.6168751197350776, "percentage": 61.69, "elapsed_time": "4 days, 7:43:01", "remaining_time": "2 days, 16:24:07", "throughput": 2724.61, "total_tokens": 1017316384} {"current_steps": 5636, "total_steps": 9134, "loss": 0.7916, "learning_rate": 1.6013781338663654e-05, "epoch": 0.6169845918060155, "percentage": 61.7, "elapsed_time": "4 days, 7:44:10", "remaining_time": "2 days, 16:23:02", "throughput": 2724.64, "total_tokens": 1017518656} {"current_steps": 5637, "total_steps": 9134, "loss": 0.6901, "learning_rate": 1.6005757938411466e-05, "epoch": 0.6170940638769534, "percentage": 61.71, "elapsed_time": "4 days, 7:45:15", "remaining_time": "2 days, 16:21:56", "throughput": 2724.62, "total_tokens": 1017689792} {"current_steps": 5638, "total_steps": 9134, "loss": 0.7235, "learning_rate": 1.5997735602160923e-05, "epoch": 0.6172035359478913, "percentage": 61.73, "elapsed_time": "4 days, 7:46:16", "remaining_time": "2 days, 16:20:46", "throughput": 2724.54, "total_tokens": 1017823296} {"current_steps": 5639, "total_steps": 9134, "loss": 0.7091, "learning_rate": 1.5989714330861043e-05, "epoch": 0.6173130080188292, "percentage": 61.74, "elapsed_time": "4 days, 7:47:24", "remaining_time": "2 days, 16:19:41", "throughput": 2724.56, "total_tokens": 1018016832} {"current_steps": 5640, "total_steps": 9134, "loss": 0.6641, "learning_rate": 1.5981694125460735e-05, "epoch": 0.6174224800897671, "percentage": 61.75, "elapsed_time": "4 days, 7:48:31", "remaining_time": "2 days, 16:18:35", "throughput": 2724.59, "total_tokens": 1018210816} {"current_steps": 5641, "total_steps": 9134, "loss": 0.7093, "learning_rate": 1.5973674986908778e-05, "epoch": 0.617531952160705, "percentage": 61.76, "elapsed_time": "4 days, 7:49:38", "remaining_time": "2 days, 16:17:29", "throughput": 2724.63, "total_tokens": 1018406144} {"current_steps": 5642, "total_steps": 9134, "loss": 0.5434, "learning_rate": 1.596565691615381e-05, "epoch": 0.6176414242316429, "percentage": 61.77, "elapsed_time": "4 days, 7:50:44", "remaining_time": "2 days, 16:16:23", "throughput": 2724.62, "total_tokens": 1018583776} {"current_steps": 5643, "total_steps": 9134, "loss": 1.1702, "learning_rate": 1.5957639914144358e-05, "epoch": 0.6177508963025808, "percentage": 61.78, "elapsed_time": "4 days, 7:51:52", "remaining_time": "2 days, 16:15:18", "throughput": 2724.66, "total_tokens": 1018783808} {"current_steps": 5644, "total_steps": 9134, "loss": 0.6512, "learning_rate": 1.5949623981828815e-05, "epoch": 0.6178603683735187, "percentage": 61.79, "elapsed_time": "4 days, 7:53:00", "remaining_time": "2 days, 16:14:13", "throughput": 2724.65, "total_tokens": 1018968608} {"current_steps": 5645, "total_steps": 9134, "loss": 0.866, "learning_rate": 1.594160912015546e-05, "epoch": 0.6179698404444566, "percentage": 61.8, "elapsed_time": "4 days, 7:54:09", "remaining_time": "2 days, 16:13:08", "throughput": 2724.65, "total_tokens": 1019151392} {"current_steps": 5646, "total_steps": 9134, "loss": 0.755, "learning_rate": 1.5933595330072425e-05, "epoch": 0.6180793125153945, "percentage": 61.81, "elapsed_time": "4 days, 7:55:07", "remaining_time": "2 days, 16:11:57", "throughput": 2724.58, "total_tokens": 1019284896} {"current_steps": 5647, "total_steps": 9134, "loss": 0.8724, "learning_rate": 1.5925582612527728e-05, "epoch": 0.6181887845863324, "percentage": 61.82, "elapsed_time": "4 days, 7:56:15", "remaining_time": "2 days, 16:10:51", "throughput": 2724.51, "total_tokens": 1019443936} {"current_steps": 5648, "total_steps": 9134, "loss": 0.588, "learning_rate": 1.591757096846927e-05, "epoch": 0.6182982566572703, "percentage": 61.83, "elapsed_time": "4 days, 7:57:21", "remaining_time": "2 days, 16:09:45", "throughput": 2724.52, "total_tokens": 1019630528} {"current_steps": 5649, "total_steps": 9134, "loss": 0.6737, "learning_rate": 1.590956039884479e-05, "epoch": 0.6184077287282083, "percentage": 61.85, "elapsed_time": "4 days, 7:58:26", "remaining_time": "2 days, 16:08:38", "throughput": 2724.54, "total_tokens": 1019815552} {"current_steps": 5650, "total_steps": 9134, "loss": 1.056, "learning_rate": 1.5901550904601952e-05, "epoch": 0.6185172007991461, "percentage": 61.86, "elapsed_time": "4 days, 7:59:29", "remaining_time": "2 days, 16:07:30", "throughput": 2724.53, "total_tokens": 1019979744} {"current_steps": 5651, "total_steps": 9134, "loss": 0.8429, "learning_rate": 1.589354248668824e-05, "epoch": 0.618626672870084, "percentage": 61.87, "elapsed_time": "4 days, 8:00:35", "remaining_time": "2 days, 16:06:23", "throughput": 2724.54, "total_tokens": 1020164992} {"current_steps": 5652, "total_steps": 9134, "loss": 0.6074, "learning_rate": 1.5885535146051046e-05, "epoch": 0.6187361449410219, "percentage": 61.88, "elapsed_time": "4 days, 8:01:41", "remaining_time": "2 days, 16:05:17", "throughput": 2724.54, "total_tokens": 1020344416} {"current_steps": 5653, "total_steps": 9134, "loss": 1.0089, "learning_rate": 1.587752888363762e-05, "epoch": 0.6188456170119598, "percentage": 61.89, "elapsed_time": "4 days, 8:02:49", "remaining_time": "2 days, 16:04:12", "throughput": 2724.58, "total_tokens": 1020546688} {"current_steps": 5654, "total_steps": 9134, "loss": 0.9002, "learning_rate": 1.5869523700395085e-05, "epoch": 0.6189550890828978, "percentage": 61.9, "elapsed_time": "4 days, 8:03:53", "remaining_time": "2 days, 16:03:04", "throughput": 2724.51, "total_tokens": 1020694080} {"current_steps": 5655, "total_steps": 9134, "loss": 0.7451, "learning_rate": 1.5861519597270442e-05, "epoch": 0.6190645611538357, "percentage": 61.91, "elapsed_time": "4 days, 8:04:57", "remaining_time": "2 days, 16:01:56", "throughput": 2724.52, "total_tokens": 1020870368} {"current_steps": 5656, "total_steps": 9134, "loss": 0.8295, "learning_rate": 1.5853516575210558e-05, "epoch": 0.6191740332247735, "percentage": 61.92, "elapsed_time": "4 days, 8:06:03", "remaining_time": "2 days, 16:00:50", "throughput": 2724.54, "total_tokens": 1021055392} {"current_steps": 5657, "total_steps": 9134, "loss": 0.5985, "learning_rate": 1.5845514635162188e-05, "epoch": 0.6192835052957114, "percentage": 61.93, "elapsed_time": "4 days, 8:07:04", "remaining_time": "2 days, 15:59:40", "throughput": 2724.51, "total_tokens": 1021213088} {"current_steps": 5658, "total_steps": 9134, "loss": 0.7283, "learning_rate": 1.5837513778071927e-05, "epoch": 0.6193929773666493, "percentage": 61.94, "elapsed_time": "4 days, 8:08:09", "remaining_time": "2 days, 15:58:33", "throughput": 2724.49, "total_tokens": 1021382880} {"current_steps": 5659, "total_steps": 9134, "loss": 0.6655, "learning_rate": 1.5829514004886282e-05, "epoch": 0.6195024494375873, "percentage": 61.96, "elapsed_time": "4 days, 8:09:15", "remaining_time": "2 days, 15:57:27", "throughput": 2724.5, "total_tokens": 1021566112} {"current_steps": 5660, "total_steps": 9134, "loss": 1.0023, "learning_rate": 1.582151531655159e-05, "epoch": 0.6196119215085252, "percentage": 61.97, "elapsed_time": "4 days, 8:10:18", "remaining_time": "2 days, 15:56:19", "throughput": 2724.46, "total_tokens": 1021722464} {"current_steps": 5661, "total_steps": 9134, "loss": 0.9385, "learning_rate": 1.5813517714014087e-05, "epoch": 0.619721393579463, "percentage": 61.98, "elapsed_time": "4 days, 8:11:28", "remaining_time": "2 days, 15:55:15", "throughput": 2724.52, "total_tokens": 1021934816} {"current_steps": 5662, "total_steps": 9134, "loss": 0.8711, "learning_rate": 1.5805521198219886e-05, "epoch": 0.6198308656504009, "percentage": 61.99, "elapsed_time": "4 days, 8:12:30", "remaining_time": "2 days, 15:54:06", "throughput": 2724.45, "total_tokens": 1022080192} {"current_steps": 5663, "total_steps": 9134, "loss": 0.6519, "learning_rate": 1.579752577011494e-05, "epoch": 0.6199403377213388, "percentage": 62.0, "elapsed_time": "4 days, 8:13:36", "remaining_time": "2 days, 15:52:59", "throughput": 2724.45, "total_tokens": 1022259840} {"current_steps": 5664, "total_steps": 9134, "loss": 0.9084, "learning_rate": 1.578953143064511e-05, "epoch": 0.6200498097922768, "percentage": 62.01, "elapsed_time": "4 days, 8:14:45", "remaining_time": "2 days, 15:51:55", "throughput": 2724.45, "total_tokens": 1022446208} {"current_steps": 5665, "total_steps": 9134, "loss": 0.7223, "learning_rate": 1.57815381807561e-05, "epoch": 0.6201592818632147, "percentage": 62.02, "elapsed_time": "4 days, 8:15:53", "remaining_time": "2 days, 15:50:50", "throughput": 2724.5, "total_tokens": 1022652064} {"current_steps": 5666, "total_steps": 9134, "loss": 0.6946, "learning_rate": 1.577354602139351e-05, "epoch": 0.6202687539341526, "percentage": 62.03, "elapsed_time": "4 days, 8:16:52", "remaining_time": "2 days, 15:49:39", "throughput": 2724.44, "total_tokens": 1022787808} {"current_steps": 5667, "total_steps": 9134, "loss": 0.7203, "learning_rate": 1.5765554953502777e-05, "epoch": 0.6203782260050904, "percentage": 62.04, "elapsed_time": "4 days, 8:17:59", "remaining_time": "2 days, 15:48:33", "throughput": 2724.41, "total_tokens": 1022960512} {"current_steps": 5668, "total_steps": 9134, "loss": 0.726, "learning_rate": 1.575756497802924e-05, "epoch": 0.6204876980760283, "percentage": 62.05, "elapsed_time": "4 days, 8:19:05", "remaining_time": "2 days, 15:47:27", "throughput": 2724.41, "total_tokens": 1023137248} {"current_steps": 5669, "total_steps": 9134, "loss": 0.8754, "learning_rate": 1.574957609591811e-05, "epoch": 0.6205971701469662, "percentage": 62.06, "elapsed_time": "4 days, 8:20:12", "remaining_time": "2 days, 15:46:21", "throughput": 2724.39, "total_tokens": 1023316224} {"current_steps": 5670, "total_steps": 9134, "loss": 0.7545, "learning_rate": 1.574158830811443e-05, "epoch": 0.6207066422179042, "percentage": 62.08, "elapsed_time": "4 days, 8:21:19", "remaining_time": "2 days, 15:45:15", "throughput": 2724.44, "total_tokens": 1023516480} {"current_steps": 5671, "total_steps": 9134, "loss": 0.7692, "learning_rate": 1.5733601615563163e-05, "epoch": 0.6208161142888421, "percentage": 62.09, "elapsed_time": "4 days, 8:22:26", "remaining_time": "2 days, 15:44:09", "throughput": 2724.51, "total_tokens": 1023724128} {"current_steps": 5672, "total_steps": 9134, "loss": 0.7723, "learning_rate": 1.5725616019209106e-05, "epoch": 0.62092558635978, "percentage": 62.1, "elapsed_time": "4 days, 8:23:34", "remaining_time": "2 days, 15:43:04", "throughput": 2724.49, "total_tokens": 1023901984} {"current_steps": 5673, "total_steps": 9134, "loss": 0.8368, "learning_rate": 1.5717631519996947e-05, "epoch": 0.6210350584307178, "percentage": 62.11, "elapsed_time": "4 days, 8:24:40", "remaining_time": "2 days, 15:41:57", "throughput": 2724.48, "total_tokens": 1024076928} {"current_steps": 5674, "total_steps": 9134, "loss": 0.8955, "learning_rate": 1.5709648118871232e-05, "epoch": 0.6211445305016557, "percentage": 62.12, "elapsed_time": "4 days, 8:25:45", "remaining_time": "2 days, 15:40:51", "throughput": 2724.5, "total_tokens": 1024263968} {"current_steps": 5675, "total_steps": 9134, "loss": 0.7904, "learning_rate": 1.5701665816776385e-05, "epoch": 0.6212540025725937, "percentage": 62.13, "elapsed_time": "4 days, 8:26:49", "remaining_time": "2 days, 15:39:43", "throughput": 2724.49, "total_tokens": 1024433760} {"current_steps": 5676, "total_steps": 9134, "loss": 0.8252, "learning_rate": 1.5693684614656697e-05, "epoch": 0.6213634746435316, "percentage": 62.14, "elapsed_time": "4 days, 8:27:56", "remaining_time": "2 days, 15:38:37", "throughput": 2724.48, "total_tokens": 1024613856} {"current_steps": 5677, "total_steps": 9134, "loss": 0.6227, "learning_rate": 1.568570451345632e-05, "epoch": 0.6214729467144695, "percentage": 62.15, "elapsed_time": "4 days, 8:29:03", "remaining_time": "2 days, 15:37:32", "throughput": 2724.49, "total_tokens": 1024800672} {"current_steps": 5678, "total_steps": 9134, "loss": 0.9248, "learning_rate": 1.567772551411931e-05, "epoch": 0.6215824187854073, "percentage": 62.16, "elapsed_time": "4 days, 8:30:10", "remaining_time": "2 days, 15:36:26", "throughput": 2724.49, "total_tokens": 1024983232} {"current_steps": 5679, "total_steps": 9134, "loss": 0.7289, "learning_rate": 1.5669747617589535e-05, "epoch": 0.6216918908563452, "percentage": 62.17, "elapsed_time": "4 days, 8:31:17", "remaining_time": "2 days, 15:35:20", "throughput": 2724.52, "total_tokens": 1025174528} {"current_steps": 5680, "total_steps": 9134, "loss": 0.6663, "learning_rate": 1.5661770824810785e-05, "epoch": 0.6218013629272832, "percentage": 62.19, "elapsed_time": "4 days, 8:32:23", "remaining_time": "2 days, 15:34:13", "throughput": 2724.51, "total_tokens": 1025353056} {"current_steps": 5681, "total_steps": 9134, "loss": 0.6899, "learning_rate": 1.5653795136726705e-05, "epoch": 0.6219108349982211, "percentage": 62.2, "elapsed_time": "4 days, 8:33:30", "remaining_time": "2 days, 15:33:08", "throughput": 2724.53, "total_tokens": 1025542784} {"current_steps": 5682, "total_steps": 9134, "loss": 0.8408, "learning_rate": 1.5645820554280783e-05, "epoch": 0.622020307069159, "percentage": 62.21, "elapsed_time": "4 days, 8:34:37", "remaining_time": "2 days, 15:32:02", "throughput": 2724.49, "total_tokens": 1025711456} {"current_steps": 5683, "total_steps": 9134, "loss": 0.8344, "learning_rate": 1.5637847078416413e-05, "epoch": 0.6221297791400969, "percentage": 62.22, "elapsed_time": "4 days, 8:35:47", "remaining_time": "2 days, 15:30:58", "throughput": 2724.54, "total_tokens": 1025916640} {"current_steps": 5684, "total_steps": 9134, "loss": 0.9935, "learning_rate": 1.562987471007683e-05, "epoch": 0.6222392512110347, "percentage": 62.23, "elapsed_time": "4 days, 8:36:52", "remaining_time": "2 days, 15:29:51", "throughput": 2724.57, "total_tokens": 1026105696} {"current_steps": 5685, "total_steps": 9134, "loss": 0.8621, "learning_rate": 1.5621903450205162e-05, "epoch": 0.6223487232819727, "percentage": 62.24, "elapsed_time": "4 days, 8:37:57", "remaining_time": "2 days, 15:28:44", "throughput": 2724.57, "total_tokens": 1026285792} {"current_steps": 5686, "total_steps": 9134, "loss": 0.8591, "learning_rate": 1.561393329974438e-05, "epoch": 0.6224581953529106, "percentage": 62.25, "elapsed_time": "4 days, 8:39:00", "remaining_time": "2 days, 15:27:35", "throughput": 2724.53, "total_tokens": 1026441472} {"current_steps": 5687, "total_steps": 9134, "loss": 0.8509, "learning_rate": 1.560596425963735e-05, "epoch": 0.6225676674238485, "percentage": 62.26, "elapsed_time": "4 days, 8:40:04", "remaining_time": "2 days, 15:26:28", "throughput": 2724.48, "total_tokens": 1026596032} {"current_steps": 5688, "total_steps": 9134, "loss": 0.9961, "learning_rate": 1.559799633082679e-05, "epoch": 0.6226771394947864, "percentage": 62.27, "elapsed_time": "4 days, 8:41:07", "remaining_time": "2 days, 15:25:20", "throughput": 2724.46, "total_tokens": 1026760448} {"current_steps": 5689, "total_steps": 9134, "loss": 0.6539, "learning_rate": 1.559002951425529e-05, "epoch": 0.6227866115657243, "percentage": 62.28, "elapsed_time": "4 days, 8:42:15", "remaining_time": "2 days, 15:24:15", "throughput": 2724.45, "total_tokens": 1026942336} {"current_steps": 5690, "total_steps": 9134, "loss": 0.6516, "learning_rate": 1.5582063810865315e-05, "epoch": 0.6228960836366622, "percentage": 62.29, "elapsed_time": "4 days, 8:43:18", "remaining_time": "2 days, 15:23:06", "throughput": 2724.43, "total_tokens": 1027104736} {"current_steps": 5691, "total_steps": 9134, "loss": 0.752, "learning_rate": 1.557409922159918e-05, "epoch": 0.6230055557076001, "percentage": 62.31, "elapsed_time": "4 days, 8:44:19", "remaining_time": "2 days, 15:21:57", "throughput": 2724.4, "total_tokens": 1027262208} {"current_steps": 5692, "total_steps": 9134, "loss": 0.7543, "learning_rate": 1.5566135747399097e-05, "epoch": 0.623115027778538, "percentage": 62.32, "elapsed_time": "4 days, 8:45:22", "remaining_time": "2 days, 15:20:48", "throughput": 2724.34, "total_tokens": 1027408032} {"current_steps": 5693, "total_steps": 9134, "loss": 0.7811, "learning_rate": 1.555817338920711e-05, "epoch": 0.6232244998494759, "percentage": 62.33, "elapsed_time": "4 days, 8:46:25", "remaining_time": "2 days, 15:19:41", "throughput": 2724.33, "total_tokens": 1027578720} {"current_steps": 5694, "total_steps": 9134, "loss": 0.6918, "learning_rate": 1.555021214796516e-05, "epoch": 0.6233339719204138, "percentage": 62.34, "elapsed_time": "4 days, 8:47:34", "remaining_time": "2 days, 15:18:36", "throughput": 2724.34, "total_tokens": 1027769792} {"current_steps": 5695, "total_steps": 9134, "loss": 0.9691, "learning_rate": 1.5542252024615056e-05, "epoch": 0.6234434439913517, "percentage": 62.35, "elapsed_time": "4 days, 8:48:43", "remaining_time": "2 days, 15:17:31", "throughput": 2724.42, "total_tokens": 1027987968} {"current_steps": 5696, "total_steps": 9134, "loss": 0.7457, "learning_rate": 1.5534293020098454e-05, "epoch": 0.6235529160622896, "percentage": 62.36, "elapsed_time": "4 days, 8:49:47", "remaining_time": "2 days, 15:16:24", "throughput": 2724.41, "total_tokens": 1028158656} {"current_steps": 5697, "total_steps": 9134, "loss": 0.8696, "learning_rate": 1.5526335135356895e-05, "epoch": 0.6236623881332275, "percentage": 62.37, "elapsed_time": "4 days, 8:50:53", "remaining_time": "2 days, 15:15:17", "throughput": 2724.39, "total_tokens": 1028331136} {"current_steps": 5698, "total_steps": 9134, "loss": 0.8051, "learning_rate": 1.551837837133177e-05, "epoch": 0.6237718602041654, "percentage": 62.38, "elapsed_time": "4 days, 8:52:00", "remaining_time": "2 days, 15:14:12", "throughput": 2724.45, "total_tokens": 1028536096} {"current_steps": 5699, "total_steps": 9134, "loss": 0.6651, "learning_rate": 1.5510422728964374e-05, "epoch": 0.6238813322751033, "percentage": 62.39, "elapsed_time": "4 days, 8:53:02", "remaining_time": "2 days, 15:13:03", "throughput": 2724.41, "total_tokens": 1028689536} {"current_steps": 5700, "total_steps": 9134, "loss": 0.6841, "learning_rate": 1.5502468209195815e-05, "epoch": 0.6239908043460413, "percentage": 62.4, "elapsed_time": "4 days, 8:54:07", "remaining_time": "2 days, 15:11:55", "throughput": 2724.39, "total_tokens": 1028858880} {"current_steps": 5701, "total_steps": 9134, "loss": 1.0211, "learning_rate": 1.549451481296711e-05, "epoch": 0.6241002764169791, "percentage": 62.42, "elapsed_time": "4 days, 8:55:16", "remaining_time": "2 days, 15:10:51", "throughput": 2724.39, "total_tokens": 1029048608} {"current_steps": 5702, "total_steps": 9134, "loss": 0.8262, "learning_rate": 1.548656254121914e-05, "epoch": 0.624209748487917, "percentage": 62.43, "elapsed_time": "4 days, 8:56:23", "remaining_time": "2 days, 15:09:45", "throughput": 2724.45, "total_tokens": 1029253120} {"current_steps": 5703, "total_steps": 9134, "loss": 0.6913, "learning_rate": 1.547861139489263e-05, "epoch": 0.6243192205588549, "percentage": 62.44, "elapsed_time": "4 days, 8:57:31", "remaining_time": "2 days, 15:08:40", "throughput": 2724.4, "total_tokens": 1029417312} {"current_steps": 5704, "total_steps": 9134, "loss": 0.8695, "learning_rate": 1.5470661374928198e-05, "epoch": 0.6244286926297928, "percentage": 62.45, "elapsed_time": "4 days, 8:58:38", "remaining_time": "2 days, 15:07:34", "throughput": 2724.41, "total_tokens": 1029605472} {"current_steps": 5705, "total_steps": 9134, "loss": 0.8171, "learning_rate": 1.5462712482266296e-05, "epoch": 0.6245381647007308, "percentage": 62.46, "elapsed_time": "4 days, 8:59:45", "remaining_time": "2 days, 15:06:29", "throughput": 2724.47, "total_tokens": 1029813120} {"current_steps": 5706, "total_steps": 9134, "loss": 0.7275, "learning_rate": 1.545476471784728e-05, "epoch": 0.6246476367716687, "percentage": 62.47, "elapsed_time": "4 days, 9:00:52", "remaining_time": "2 days, 15:05:23", "throughput": 2724.48, "total_tokens": 1029999264} {"current_steps": 5707, "total_steps": 9134, "loss": 0.8385, "learning_rate": 1.544681808261135e-05, "epoch": 0.6247571088426065, "percentage": 62.48, "elapsed_time": "4 days, 9:02:02", "remaining_time": "2 days, 15:04:18", "throughput": 2724.47, "total_tokens": 1030182048} {"current_steps": 5708, "total_steps": 9134, "loss": 0.6031, "learning_rate": 1.5438872577498575e-05, "epoch": 0.6248665809135444, "percentage": 62.49, "elapsed_time": "4 days, 9:03:07", "remaining_time": "2 days, 15:03:12", "throughput": 2724.39, "total_tokens": 1030331680} {"current_steps": 5709, "total_steps": 9134, "loss": 0.6648, "learning_rate": 1.5430928203448903e-05, "epoch": 0.6249760529844823, "percentage": 62.5, "elapsed_time": "4 days, 9:04:13", "remaining_time": "2 days, 15:02:05", "throughput": 2724.32, "total_tokens": 1030484000} {"current_steps": 5710, "total_steps": 9134, "loss": 0.8431, "learning_rate": 1.5422984961402125e-05, "epoch": 0.6250855250554203, "percentage": 62.51, "elapsed_time": "4 days, 9:05:20", "remaining_time": "2 days, 15:00:59", "throughput": 2724.33, "total_tokens": 1030670592} {"current_steps": 5711, "total_steps": 9134, "loss": 0.8321, "learning_rate": 1.541504285229793e-05, "epoch": 0.6251949971263582, "percentage": 62.52, "elapsed_time": "4 days, 9:06:26", "remaining_time": "2 days, 14:59:53", "throughput": 2724.33, "total_tokens": 1030849344} {"current_steps": 5712, "total_steps": 9134, "loss": 0.8123, "learning_rate": 1.5407101877075827e-05, "epoch": 0.625304469197296, "percentage": 62.54, "elapsed_time": "4 days, 9:07:30", "remaining_time": "2 days, 14:58:45", "throughput": 2724.31, "total_tokens": 1031015552} {"current_steps": 5713, "total_steps": 9134, "loss": 0.7077, "learning_rate": 1.5399162036675245e-05, "epoch": 0.6254139412682339, "percentage": 62.55, "elapsed_time": "4 days, 9:08:39", "remaining_time": "2 days, 14:57:40", "throughput": 2724.3, "total_tokens": 1031200800} {"current_steps": 5714, "total_steps": 9134, "loss": 0.6698, "learning_rate": 1.5391223332035434e-05, "epoch": 0.6255234133391718, "percentage": 62.56, "elapsed_time": "4 days, 9:09:42", "remaining_time": "2 days, 14:56:32", "throughput": 2724.27, "total_tokens": 1031360064} {"current_steps": 5715, "total_steps": 9134, "loss": 0.8364, "learning_rate": 1.5383285764095534e-05, "epoch": 0.6256328854101098, "percentage": 62.57, "elapsed_time": "4 days, 9:10:47", "remaining_time": "2 days, 14:55:25", "throughput": 2724.3, "total_tokens": 1031548896} {"current_steps": 5716, "total_steps": 9134, "loss": 0.739, "learning_rate": 1.5375349333794545e-05, "epoch": 0.6257423574810477, "percentage": 62.58, "elapsed_time": "4 days, 9:11:50", "remaining_time": "2 days, 14:54:17", "throughput": 2724.26, "total_tokens": 1031703456} {"current_steps": 5717, "total_steps": 9134, "loss": 0.8619, "learning_rate": 1.5367414042071333e-05, "epoch": 0.6258518295519856, "percentage": 62.59, "elapsed_time": "4 days, 9:12:50", "remaining_time": "2 days, 14:53:08", "throughput": 2724.21, "total_tokens": 1031851968} {"current_steps": 5718, "total_steps": 9134, "loss": 0.9245, "learning_rate": 1.5359479889864625e-05, "epoch": 0.6259613016229234, "percentage": 62.6, "elapsed_time": "4 days, 9:13:57", "remaining_time": "2 days, 14:52:01", "throughput": 2724.21, "total_tokens": 1032032512} {"current_steps": 5719, "total_steps": 9134, "loss": 0.7887, "learning_rate": 1.535154687811301e-05, "epoch": 0.6260707736938613, "percentage": 62.61, "elapsed_time": "4 days, 9:15:06", "remaining_time": "2 days, 14:50:57", "throughput": 2724.25, "total_tokens": 1032238592} {"current_steps": 5720, "total_steps": 9134, "loss": 0.6371, "learning_rate": 1.534361500775497e-05, "epoch": 0.6261802457647992, "percentage": 62.62, "elapsed_time": "4 days, 9:16:14", "remaining_time": "2 days, 14:49:52", "throughput": 2724.29, "total_tokens": 1032438848} {"current_steps": 5721, "total_steps": 9134, "loss": 0.8898, "learning_rate": 1.5335684279728798e-05, "epoch": 0.6262897178357372, "percentage": 62.63, "elapsed_time": "4 days, 9:17:20", "remaining_time": "2 days, 14:48:45", "throughput": 2724.3, "total_tokens": 1032620736} {"current_steps": 5722, "total_steps": 9134, "loss": 0.8825, "learning_rate": 1.5327754694972705e-05, "epoch": 0.6263991899066751, "percentage": 62.65, "elapsed_time": "4 days, 9:18:23", "remaining_time": "2 days, 14:47:37", "throughput": 2724.28, "total_tokens": 1032786720} {"current_steps": 5723, "total_steps": 9134, "loss": 0.8472, "learning_rate": 1.531982625442475e-05, "epoch": 0.626508661977613, "percentage": 62.66, "elapsed_time": "4 days, 9:19:28", "remaining_time": "2 days, 14:46:30", "throughput": 2724.26, "total_tokens": 1032952032} {"current_steps": 5724, "total_steps": 9134, "loss": 0.7449, "learning_rate": 1.5311898959022832e-05, "epoch": 0.6266181340485508, "percentage": 62.67, "elapsed_time": "4 days, 9:20:30", "remaining_time": "2 days, 14:45:21", "throughput": 2724.21, "total_tokens": 1033103904} {"current_steps": 5725, "total_steps": 9134, "loss": 0.6532, "learning_rate": 1.530397280970476e-05, "epoch": 0.6267276061194887, "percentage": 62.68, "elapsed_time": "4 days, 9:21:31", "remaining_time": "2 days, 14:44:12", "throughput": 2724.15, "total_tokens": 1033247936} {"current_steps": 5726, "total_steps": 9134, "loss": 0.5987, "learning_rate": 1.5296047807408152e-05, "epoch": 0.6268370781904267, "percentage": 62.69, "elapsed_time": "4 days, 9:22:39", "remaining_time": "2 days, 14:43:07", "throughput": 2724.11, "total_tokens": 1033415936} {"current_steps": 5727, "total_steps": 9134, "loss": 0.626, "learning_rate": 1.5288123953070552e-05, "epoch": 0.6269465502613646, "percentage": 62.7, "elapsed_time": "4 days, 9:23:38", "remaining_time": "2 days, 14:41:56", "throughput": 2724.02, "total_tokens": 1033545184} {"current_steps": 5728, "total_steps": 9134, "loss": 0.5331, "learning_rate": 1.5280201247629312e-05, "epoch": 0.6270560223323025, "percentage": 62.71, "elapsed_time": "4 days, 9:24:45", "remaining_time": "2 days, 14:40:50", "throughput": 2723.98, "total_tokens": 1033710496} {"current_steps": 5729, "total_steps": 9134, "loss": 0.8359, "learning_rate": 1.527227969202169e-05, "epoch": 0.6271654944032403, "percentage": 62.72, "elapsed_time": "4 days, 9:25:47", "remaining_time": "2 days, 14:39:41", "throughput": 2723.96, "total_tokens": 1033872224} {"current_steps": 5730, "total_steps": 9134, "loss": 0.7496, "learning_rate": 1.5264359287184783e-05, "epoch": 0.6272749664741782, "percentage": 62.73, "elapsed_time": "4 days, 9:26:51", "remaining_time": "2 days, 14:38:34", "throughput": 2724.0, "total_tokens": 1034061952} {"current_steps": 5731, "total_steps": 9134, "loss": 0.7454, "learning_rate": 1.5256440034055557e-05, "epoch": 0.6273844385451162, "percentage": 62.74, "elapsed_time": "4 days, 9:27:57", "remaining_time": "2 days, 14:37:28", "throughput": 2724.03, "total_tokens": 1034254816} {"current_steps": 5732, "total_steps": 9134, "loss": 0.7045, "learning_rate": 1.5248521933570858e-05, "epoch": 0.6274939106160541, "percentage": 62.75, "elapsed_time": "4 days, 9:29:04", "remaining_time": "2 days, 14:36:22", "throughput": 2724.02, "total_tokens": 1034429536} {"current_steps": 5733, "total_steps": 9134, "loss": 0.6308, "learning_rate": 1.5240604986667362e-05, "epoch": 0.627603382686992, "percentage": 62.77, "elapsed_time": "4 days, 9:30:11", "remaining_time": "2 days, 14:35:16", "throughput": 2724.04, "total_tokens": 1034622624} {"current_steps": 5734, "total_steps": 9134, "loss": 0.5376, "learning_rate": 1.5232689194281652e-05, "epoch": 0.6277128547579299, "percentage": 62.78, "elapsed_time": "4 days, 9:31:19", "remaining_time": "2 days, 14:34:10", "throughput": 2723.99, "total_tokens": 1034785024} {"current_steps": 5735, "total_steps": 9134, "loss": 0.8973, "learning_rate": 1.5224774557350125e-05, "epoch": 0.6278223268288677, "percentage": 62.79, "elapsed_time": "4 days, 9:32:26", "remaining_time": "2 days, 14:33:05", "throughput": 2724.0, "total_tokens": 1034974304} {"current_steps": 5736, "total_steps": 9134, "loss": 0.7951, "learning_rate": 1.5216861076809083e-05, "epoch": 0.6279317988998057, "percentage": 62.8, "elapsed_time": "4 days, 9:33:33", "remaining_time": "2 days, 14:31:59", "throughput": 2724.0, "total_tokens": 1035155520} {"current_steps": 5737, "total_steps": 9134, "loss": 0.7006, "learning_rate": 1.5208948753594677e-05, "epoch": 0.6280412709707436, "percentage": 62.81, "elapsed_time": "4 days, 9:34:39", "remaining_time": "2 days, 14:30:53", "throughput": 2723.95, "total_tokens": 1035318368} {"current_steps": 5738, "total_steps": 9134, "loss": 0.7764, "learning_rate": 1.5201037588642916e-05, "epoch": 0.6281507430416815, "percentage": 62.82, "elapsed_time": "4 days, 9:35:45", "remaining_time": "2 days, 14:29:46", "throughput": 2723.95, "total_tokens": 1035498240} {"current_steps": 5739, "total_steps": 9134, "loss": 0.8466, "learning_rate": 1.5193127582889677e-05, "epoch": 0.6282602151126194, "percentage": 62.83, "elapsed_time": "4 days, 9:36:54", "remaining_time": "2 days, 14:28:42", "throughput": 2723.97, "total_tokens": 1035694240} {"current_steps": 5740, "total_steps": 9134, "loss": 0.7353, "learning_rate": 1.5185218737270694e-05, "epoch": 0.6283696871835573, "percentage": 62.84, "elapsed_time": "4 days, 9:38:00", "remaining_time": "2 days, 14:27:35", "throughput": 2723.99, "total_tokens": 1035879936} {"current_steps": 5741, "total_steps": 9134, "loss": 0.9621, "learning_rate": 1.5177311052721568e-05, "epoch": 0.6284791592544952, "percentage": 62.85, "elapsed_time": "4 days, 9:39:09", "remaining_time": "2 days, 14:26:31", "throughput": 2723.96, "total_tokens": 1036058464} {"current_steps": 5742, "total_steps": 9134, "loss": 0.8621, "learning_rate": 1.5169404530177778e-05, "epoch": 0.6285886313254331, "percentage": 62.86, "elapsed_time": "4 days, 9:40:19", "remaining_time": "2 days, 14:25:27", "throughput": 2724.0, "total_tokens": 1036263200} {"current_steps": 5743, "total_steps": 9134, "loss": 0.7314, "learning_rate": 1.5161499170574629e-05, "epoch": 0.628698103396371, "percentage": 62.87, "elapsed_time": "4 days, 9:41:27", "remaining_time": "2 days, 14:24:22", "throughput": 2723.98, "total_tokens": 1036439264} {"current_steps": 5744, "total_steps": 9134, "loss": 0.8541, "learning_rate": 1.515359497484733e-05, "epoch": 0.6288075754673089, "percentage": 62.89, "elapsed_time": "4 days, 9:42:34", "remaining_time": "2 days, 14:23:15", "throughput": 2723.95, "total_tokens": 1036611968} {"current_steps": 5745, "total_steps": 9134, "loss": 0.6829, "learning_rate": 1.5145691943930914e-05, "epoch": 0.6289170475382468, "percentage": 62.9, "elapsed_time": "4 days, 9:43:37", "remaining_time": "2 days, 14:22:08", "throughput": 2723.91, "total_tokens": 1036769216} {"current_steps": 5746, "total_steps": 9134, "loss": 0.8594, "learning_rate": 1.513779007876031e-05, "epoch": 0.6290265196091847, "percentage": 62.91, "elapsed_time": "4 days, 9:44:45", "remaining_time": "2 days, 14:21:02", "throughput": 2723.95, "total_tokens": 1036967008} {"current_steps": 5747, "total_steps": 9134, "loss": 0.9295, "learning_rate": 1.5129889380270279e-05, "epoch": 0.6291359916801226, "percentage": 62.92, "elapsed_time": "4 days, 9:45:52", "remaining_time": "2 days, 14:19:56", "throughput": 2724.02, "total_tokens": 1037176672} {"current_steps": 5748, "total_steps": 9134, "loss": 0.8273, "learning_rate": 1.5121989849395465e-05, "epoch": 0.6292454637510605, "percentage": 62.93, "elapsed_time": "4 days, 9:47:01", "remaining_time": "2 days, 14:18:52", "throughput": 2724.06, "total_tokens": 1037380288} {"current_steps": 5749, "total_steps": 9134, "loss": 0.8229, "learning_rate": 1.5114091487070376e-05, "epoch": 0.6293549358219984, "percentage": 62.94, "elapsed_time": "4 days, 9:48:10", "remaining_time": "2 days, 14:17:47", "throughput": 2724.08, "total_tokens": 1037576512} {"current_steps": 5750, "total_steps": 9134, "loss": 0.6341, "learning_rate": 1.5106194294229359e-05, "epoch": 0.6294644078929363, "percentage": 62.95, "elapsed_time": "4 days, 9:49:17", "remaining_time": "2 days, 14:16:42", "throughput": 2724.04, "total_tokens": 1037746304} {"current_steps": 5751, "total_steps": 9134, "loss": 1.0341, "learning_rate": 1.5098298271806649e-05, "epoch": 0.6295738799638743, "percentage": 62.96, "elapsed_time": "4 days, 9:50:26", "remaining_time": "2 days, 14:15:37", "throughput": 2724.09, "total_tokens": 1037949920} {"current_steps": 5752, "total_steps": 9134, "loss": 0.6469, "learning_rate": 1.5090403420736315e-05, "epoch": 0.6296833520348121, "percentage": 62.97, "elapsed_time": "4 days, 9:51:31", "remaining_time": "2 days, 14:14:30", "throughput": 2724.07, "total_tokens": 1038119936} {"current_steps": 5753, "total_steps": 9134, "loss": 0.6648, "learning_rate": 1.5082509741952328e-05, "epoch": 0.62979282410575, "percentage": 62.98, "elapsed_time": "4 days, 9:52:40", "remaining_time": "2 days, 14:13:25", "throughput": 2724.05, "total_tokens": 1038300480} {"current_steps": 5754, "total_steps": 9134, "loss": 1.0703, "learning_rate": 1.5074617236388467e-05, "epoch": 0.6299022961766879, "percentage": 63.0, "elapsed_time": "4 days, 9:53:47", "remaining_time": "2 days, 14:12:19", "throughput": 2724.11, "total_tokens": 1038505440} {"current_steps": 5755, "total_steps": 9134, "loss": 0.8052, "learning_rate": 1.506672590497841e-05, "epoch": 0.6300117682476258, "percentage": 63.01, "elapsed_time": "4 days, 9:54:53", "remaining_time": "2 days, 14:11:13", "throughput": 2724.09, "total_tokens": 1038677696} {"current_steps": 5756, "total_steps": 9134, "loss": 0.8284, "learning_rate": 1.5058835748655703e-05, "epoch": 0.6301212403185638, "percentage": 63.02, "elapsed_time": "4 days, 9:56:02", "remaining_time": "2 days, 14:10:08", "throughput": 2724.18, "total_tokens": 1038899456} {"current_steps": 5757, "total_steps": 9134, "loss": 0.852, "learning_rate": 1.5050946768353708e-05, "epoch": 0.6302307123895017, "percentage": 63.03, "elapsed_time": "4 days, 9:57:06", "remaining_time": "2 days, 14:09:01", "throughput": 2724.18, "total_tokens": 1039074624} {"current_steps": 5758, "total_steps": 9134, "loss": 0.8474, "learning_rate": 1.5043058965005702e-05, "epoch": 0.6303401844604395, "percentage": 63.04, "elapsed_time": "4 days, 9:58:14", "remaining_time": "2 days, 14:07:55", "throughput": 2724.22, "total_tokens": 1039276896} {"current_steps": 5759, "total_steps": 9134, "loss": 0.8027, "learning_rate": 1.5035172339544781e-05, "epoch": 0.6304496565313774, "percentage": 63.05, "elapsed_time": "4 days, 9:59:18", "remaining_time": "2 days, 14:06:48", "throughput": 2724.23, "total_tokens": 1039453856} {"current_steps": 5760, "total_steps": 9134, "loss": 0.7073, "learning_rate": 1.5027286892903924e-05, "epoch": 0.6305591286023153, "percentage": 63.06, "elapsed_time": "4 days, 10:00:26", "remaining_time": "2 days, 14:05:42", "throughput": 2724.29, "total_tokens": 1039662176} {"current_steps": 5761, "total_steps": 9134, "loss": 0.5238, "learning_rate": 1.501940262601596e-05, "epoch": 0.6306686006732533, "percentage": 63.07, "elapsed_time": "4 days, 10:01:31", "remaining_time": "2 days, 14:04:36", "throughput": 2724.28, "total_tokens": 1039833536} {"current_steps": 5762, "total_steps": 9134, "loss": 0.8213, "learning_rate": 1.5011519539813584e-05, "epoch": 0.6307780727441912, "percentage": 63.08, "elapsed_time": "4 days, 10:02:41", "remaining_time": "2 days, 14:03:31", "throughput": 2724.25, "total_tokens": 1040011168} {"current_steps": 5763, "total_steps": 9134, "loss": 0.5296, "learning_rate": 1.5003637635229361e-05, "epoch": 0.630887544815129, "percentage": 63.09, "elapsed_time": "4 days, 10:03:50", "remaining_time": "2 days, 14:02:27", "throughput": 2724.3, "total_tokens": 1040223072} {"current_steps": 5764, "total_steps": 9134, "loss": 0.9224, "learning_rate": 1.4995756913195688e-05, "epoch": 0.6309970168860669, "percentage": 63.1, "elapsed_time": "4 days, 10:04:56", "remaining_time": "2 days, 14:01:21", "throughput": 2724.27, "total_tokens": 1040389952} {"current_steps": 5765, "total_steps": 9134, "loss": 0.5188, "learning_rate": 1.4987877374644858e-05, "epoch": 0.6311064889570048, "percentage": 63.12, "elapsed_time": "4 days, 10:06:03", "remaining_time": "2 days, 14:00:15", "throughput": 2724.24, "total_tokens": 1040558400} {"current_steps": 5766, "total_steps": 9134, "loss": 0.7875, "learning_rate": 1.4979999020508983e-05, "epoch": 0.6312159610279428, "percentage": 63.13, "elapsed_time": "4 days, 10:07:07", "remaining_time": "2 days, 13:59:07", "throughput": 2724.25, "total_tokens": 1040736480} {"current_steps": 5767, "total_steps": 9134, "loss": 0.6848, "learning_rate": 1.4972121851720078e-05, "epoch": 0.6313254330988807, "percentage": 63.14, "elapsed_time": "4 days, 10:08:10", "remaining_time": "2 days, 13:57:59", "throughput": 2724.18, "total_tokens": 1040884544} {"current_steps": 5768, "total_steps": 9134, "loss": 0.8038, "learning_rate": 1.4964245869209979e-05, "epoch": 0.6314349051698186, "percentage": 63.15, "elapsed_time": "4 days, 10:09:14", "remaining_time": "2 days, 13:56:51", "throughput": 2724.17, "total_tokens": 1041052768} {"current_steps": 5769, "total_steps": 9134, "loss": 0.8989, "learning_rate": 1.4956371073910408e-05, "epoch": 0.6315443772407564, "percentage": 63.16, "elapsed_time": "4 days, 10:10:24", "remaining_time": "2 days, 13:55:47", "throughput": 2724.19, "total_tokens": 1041249888} {"current_steps": 5770, "total_steps": 9134, "loss": 0.7042, "learning_rate": 1.4948497466752943e-05, "epoch": 0.6316538493116943, "percentage": 63.17, "elapsed_time": "4 days, 10:11:28", "remaining_time": "2 days, 13:54:40", "throughput": 2724.19, "total_tokens": 1041427296} {"current_steps": 5771, "total_steps": 9134, "loss": 0.7241, "learning_rate": 1.494062504866901e-05, "epoch": 0.6317633213826322, "percentage": 63.18, "elapsed_time": "4 days, 10:12:32", "remaining_time": "2 days, 13:53:32", "throughput": 2724.15, "total_tokens": 1041585888} {"current_steps": 5772, "total_steps": 9134, "loss": 1.0199, "learning_rate": 1.4932753820589912e-05, "epoch": 0.6318727934535702, "percentage": 63.19, "elapsed_time": "4 days, 10:13:41", "remaining_time": "2 days, 13:52:27", "throughput": 2724.19, "total_tokens": 1041787936} {"current_steps": 5773, "total_steps": 9134, "loss": 0.6415, "learning_rate": 1.492488378344678e-05, "epoch": 0.6319822655245081, "percentage": 63.2, "elapsed_time": "4 days, 10:14:47", "remaining_time": "2 days, 13:51:21", "throughput": 2724.23, "total_tokens": 1041982816} {"current_steps": 5774, "total_steps": 9134, "loss": 0.7796, "learning_rate": 1.4917014938170648e-05, "epoch": 0.632091737595446, "percentage": 63.21, "elapsed_time": "4 days, 10:15:52", "remaining_time": "2 days, 13:50:14", "throughput": 2724.22, "total_tokens": 1042157984} {"current_steps": 5775, "total_steps": 9134, "loss": 0.5959, "learning_rate": 1.4909147285692366e-05, "epoch": 0.6322012096663838, "percentage": 63.23, "elapsed_time": "4 days, 10:16:59", "remaining_time": "2 days, 13:49:08", "throughput": 2724.26, "total_tokens": 1042354432} {"current_steps": 5776, "total_steps": 9134, "loss": 0.7966, "learning_rate": 1.4901280826942665e-05, "epoch": 0.6323106817373217, "percentage": 63.24, "elapsed_time": "4 days, 10:18:09", "remaining_time": "2 days, 13:48:04", "throughput": 2724.31, "total_tokens": 1042562752} {"current_steps": 5777, "total_steps": 9134, "loss": 0.6455, "learning_rate": 1.4893415562852148e-05, "epoch": 0.6324201538082597, "percentage": 63.25, "elapsed_time": "4 days, 10:19:13", "remaining_time": "2 days, 13:46:56", "throughput": 2724.33, "total_tokens": 1042744416} {"current_steps": 5778, "total_steps": 9134, "loss": 0.6854, "learning_rate": 1.4885551494351242e-05, "epoch": 0.6325296258791976, "percentage": 63.26, "elapsed_time": "4 days, 10:20:22", "remaining_time": "2 days, 13:45:52", "throughput": 2724.33, "total_tokens": 1042935264} {"current_steps": 5779, "total_steps": 9134, "loss": 0.8252, "learning_rate": 1.4877688622370262e-05, "epoch": 0.6326390979501355, "percentage": 63.27, "elapsed_time": "4 days, 10:21:30", "remaining_time": "2 days, 13:44:47", "throughput": 2724.35, "total_tokens": 1043127904} {"current_steps": 5780, "total_steps": 9134, "loss": 0.7803, "learning_rate": 1.4869826947839366e-05, "epoch": 0.6327485700210733, "percentage": 63.28, "elapsed_time": "4 days, 10:22:34", "remaining_time": "2 days, 13:43:39", "throughput": 2724.35, "total_tokens": 1043299936} {"current_steps": 5781, "total_steps": 9134, "loss": 0.7851, "learning_rate": 1.4861966471688577e-05, "epoch": 0.6328580420920112, "percentage": 63.29, "elapsed_time": "4 days, 10:23:43", "remaining_time": "2 days, 13:42:35", "throughput": 2724.41, "total_tokens": 1043512288} {"current_steps": 5782, "total_steps": 9134, "loss": 0.863, "learning_rate": 1.4854107194847771e-05, "epoch": 0.6329675141629492, "percentage": 63.3, "elapsed_time": "4 days, 10:24:53", "remaining_time": "2 days, 13:41:30", "throughput": 2724.44, "total_tokens": 1043714560} {"current_steps": 5783, "total_steps": 9134, "loss": 0.6618, "learning_rate": 1.4846249118246686e-05, "epoch": 0.6330769862338871, "percentage": 63.31, "elapsed_time": "4 days, 10:25:58", "remaining_time": "2 days, 13:40:24", "throughput": 2724.39, "total_tokens": 1043872256} {"current_steps": 5784, "total_steps": 9134, "loss": 0.6614, "learning_rate": 1.483839224281493e-05, "epoch": 0.633186458304825, "percentage": 63.32, "elapsed_time": "4 days, 10:27:06", "remaining_time": "2 days, 13:39:18", "throughput": 2724.38, "total_tokens": 1044055936} {"current_steps": 5785, "total_steps": 9134, "loss": 0.5432, "learning_rate": 1.4830536569481934e-05, "epoch": 0.6332959303757629, "percentage": 63.33, "elapsed_time": "4 days, 10:28:15", "remaining_time": "2 days, 13:38:13", "throughput": 2724.37, "total_tokens": 1044238944} {"current_steps": 5786, "total_steps": 9134, "loss": 0.7651, "learning_rate": 1.4822682099177035e-05, "epoch": 0.6334054024467007, "percentage": 63.35, "elapsed_time": "4 days, 10:29:21", "remaining_time": "2 days, 13:37:07", "throughput": 2724.36, "total_tokens": 1044412320} {"current_steps": 5787, "total_steps": 9134, "loss": 0.6066, "learning_rate": 1.4814828832829374e-05, "epoch": 0.6335148745176387, "percentage": 63.36, "elapsed_time": "4 days, 10:30:23", "remaining_time": "2 days, 13:35:58", "throughput": 2724.31, "total_tokens": 1044565536} {"current_steps": 5788, "total_steps": 9134, "loss": 0.6904, "learning_rate": 1.4806976771368006e-05, "epoch": 0.6336243465885766, "percentage": 63.37, "elapsed_time": "4 days, 10:31:32", "remaining_time": "2 days, 13:34:54", "throughput": 2724.34, "total_tokens": 1044763328} {"current_steps": 5789, "total_steps": 9134, "loss": 0.6534, "learning_rate": 1.4799125915721787e-05, "epoch": 0.6337338186595145, "percentage": 63.38, "elapsed_time": "4 days, 10:32:35", "remaining_time": "2 days, 13:33:46", "throughput": 2724.3, "total_tokens": 1044920576} {"current_steps": 5790, "total_steps": 9134, "loss": 0.692, "learning_rate": 1.479127626681947e-05, "epoch": 0.6338432907304524, "percentage": 63.39, "elapsed_time": "4 days, 10:33:42", "remaining_time": "2 days, 13:32:40", "throughput": 2724.34, "total_tokens": 1045115904} {"current_steps": 5791, "total_steps": 9134, "loss": 0.8748, "learning_rate": 1.4783427825589663e-05, "epoch": 0.6339527628013903, "percentage": 63.4, "elapsed_time": "4 days, 10:34:48", "remaining_time": "2 days, 13:31:33", "throughput": 2724.36, "total_tokens": 1045308320} {"current_steps": 5792, "total_steps": 9134, "loss": 0.7778, "learning_rate": 1.4775580592960808e-05, "epoch": 0.6340622348723282, "percentage": 63.41, "elapsed_time": "4 days, 10:35:58", "remaining_time": "2 days, 13:30:29", "throughput": 2724.4, "total_tokens": 1045513280} {"current_steps": 5793, "total_steps": 9134, "loss": 0.8257, "learning_rate": 1.4767734569861233e-05, "epoch": 0.6341717069432661, "percentage": 63.42, "elapsed_time": "4 days, 10:37:05", "remaining_time": "2 days, 13:29:23", "throughput": 2724.43, "total_tokens": 1045706816} {"current_steps": 5794, "total_steps": 9134, "loss": 0.6331, "learning_rate": 1.4759889757219087e-05, "epoch": 0.634281179014204, "percentage": 63.43, "elapsed_time": "4 days, 10:38:14", "remaining_time": "2 days, 13:28:19", "throughput": 2724.52, "total_tokens": 1045925664} {"current_steps": 5795, "total_steps": 9134, "loss": 0.6771, "learning_rate": 1.4752046155962418e-05, "epoch": 0.6343906510851419, "percentage": 63.44, "elapsed_time": "4 days, 10:39:19", "remaining_time": "2 days, 13:27:12", "throughput": 2724.52, "total_tokens": 1046105312} {"current_steps": 5796, "total_steps": 9134, "loss": 0.8011, "learning_rate": 1.4744203767019088e-05, "epoch": 0.6345001231560798, "percentage": 63.46, "elapsed_time": "4 days, 10:40:25", "remaining_time": "2 days, 13:26:05", "throughput": 2724.48, "total_tokens": 1046269280} {"current_steps": 5797, "total_steps": 9134, "loss": 0.8938, "learning_rate": 1.4736362591316844e-05, "epoch": 0.6346095952270177, "percentage": 63.47, "elapsed_time": "4 days, 10:41:34", "remaining_time": "2 days, 13:25:01", "throughput": 2724.54, "total_tokens": 1046483424} {"current_steps": 5798, "total_steps": 9134, "loss": 0.7271, "learning_rate": 1.4728522629783297e-05, "epoch": 0.6347190672979556, "percentage": 63.48, "elapsed_time": "4 days, 10:42:36", "remaining_time": "2 days, 13:23:52", "throughput": 2724.5, "total_tokens": 1046633280} {"current_steps": 5799, "total_steps": 9134, "loss": 0.6378, "learning_rate": 1.4720683883345876e-05, "epoch": 0.6348285393688935, "percentage": 63.49, "elapsed_time": "4 days, 10:43:45", "remaining_time": "2 days, 13:22:47", "throughput": 2724.52, "total_tokens": 1046832416} {"current_steps": 5800, "total_steps": 9134, "loss": 0.8368, "learning_rate": 1.4712846352931909e-05, "epoch": 0.6349380114398314, "percentage": 63.5, "elapsed_time": "4 days, 10:44:51", "remaining_time": "2 days, 13:21:41", "throughput": 2724.5, "total_tokens": 1047003552} {"current_steps": 5801, "total_steps": 9134, "loss": 0.7684, "learning_rate": 1.4705010039468547e-05, "epoch": 0.6350474835107693, "percentage": 63.51, "elapsed_time": "4 days, 10:45:57", "remaining_time": "2 days, 13:20:35", "throughput": 2724.47, "total_tokens": 1047169984} {"current_steps": 5802, "total_steps": 9134, "loss": 0.6879, "learning_rate": 1.4697174943882821e-05, "epoch": 0.6351569555817073, "percentage": 63.52, "elapsed_time": "4 days, 10:47:05", "remaining_time": "2 days, 13:19:29", "throughput": 2724.5, "total_tokens": 1047364864} {"current_steps": 5803, "total_steps": 9134, "loss": 0.9187, "learning_rate": 1.4689341067101597e-05, "epoch": 0.6352664276526451, "percentage": 63.53, "elapsed_time": "4 days, 10:48:11", "remaining_time": "2 days, 13:18:23", "throughput": 2724.49, "total_tokens": 1047541600} {"current_steps": 5804, "total_steps": 9134, "loss": 0.6108, "learning_rate": 1.4681508410051615e-05, "epoch": 0.635375899723583, "percentage": 63.54, "elapsed_time": "4 days, 10:49:17", "remaining_time": "2 days, 13:17:16", "throughput": 2724.51, "total_tokens": 1047731776} {"current_steps": 5805, "total_steps": 9134, "loss": 0.7885, "learning_rate": 1.4673676973659473e-05, "epoch": 0.6354853717945209, "percentage": 63.55, "elapsed_time": "4 days, 10:50:22", "remaining_time": "2 days, 13:16:09", "throughput": 2724.54, "total_tokens": 1047918368} {"current_steps": 5806, "total_steps": 9134, "loss": 0.6892, "learning_rate": 1.4665846758851593e-05, "epoch": 0.6355948438654588, "percentage": 63.56, "elapsed_time": "4 days, 10:51:27", "remaining_time": "2 days, 13:15:03", "throughput": 2724.48, "total_tokens": 1048073600} {"current_steps": 5807, "total_steps": 9134, "loss": 0.7689, "learning_rate": 1.4658017766554295e-05, "epoch": 0.6357043159363968, "percentage": 63.58, "elapsed_time": "4 days, 10:52:35", "remaining_time": "2 days, 13:13:57", "throughput": 2724.44, "total_tokens": 1048244288} {"current_steps": 5808, "total_steps": 9134, "loss": 0.6985, "learning_rate": 1.4650189997693717e-05, "epoch": 0.6358137880073347, "percentage": 63.59, "elapsed_time": "4 days, 10:53:41", "remaining_time": "2 days, 13:12:51", "throughput": 2724.44, "total_tokens": 1048424832} {"current_steps": 5809, "total_steps": 9134, "loss": 0.6583, "learning_rate": 1.4642363453195874e-05, "epoch": 0.6359232600782725, "percentage": 63.6, "elapsed_time": "4 days, 10:54:46", "remaining_time": "2 days, 13:11:44", "throughput": 2724.46, "total_tokens": 1048605600} {"current_steps": 5810, "total_steps": 9134, "loss": 0.6551, "learning_rate": 1.4634538133986647e-05, "epoch": 0.6360327321492104, "percentage": 63.61, "elapsed_time": "4 days, 10:55:49", "remaining_time": "2 days, 13:10:36", "throughput": 2724.43, "total_tokens": 1048767776} {"current_steps": 5811, "total_steps": 9134, "loss": 0.7421, "learning_rate": 1.4626714040991733e-05, "epoch": 0.6361422042201483, "percentage": 63.62, "elapsed_time": "4 days, 10:56:56", "remaining_time": "2 days, 13:09:30", "throughput": 2724.44, "total_tokens": 1048955264} {"current_steps": 5812, "total_steps": 9134, "loss": 1.0403, "learning_rate": 1.4618891175136724e-05, "epoch": 0.6362516762910863, "percentage": 63.63, "elapsed_time": "4 days, 10:58:02", "remaining_time": "2 days, 13:08:23", "throughput": 2724.46, "total_tokens": 1049141632} {"current_steps": 5813, "total_steps": 9134, "loss": 0.7462, "learning_rate": 1.4611069537347032e-05, "epoch": 0.6363611483620242, "percentage": 63.64, "elapsed_time": "4 days, 10:59:07", "remaining_time": "2 days, 13:07:16", "throughput": 2724.46, "total_tokens": 1049318592} {"current_steps": 5814, "total_steps": 9134, "loss": 0.7804, "learning_rate": 1.4603249128547968e-05, "epoch": 0.636470620432962, "percentage": 63.65, "elapsed_time": "4 days, 11:00:13", "remaining_time": "2 days, 13:06:10", "throughput": 2724.44, "total_tokens": 1049490848} {"current_steps": 5815, "total_steps": 9134, "loss": 0.5823, "learning_rate": 1.4595429949664647e-05, "epoch": 0.6365800925038999, "percentage": 63.66, "elapsed_time": "4 days, 11:01:19", "remaining_time": "2 days, 13:05:04", "throughput": 2724.43, "total_tokens": 1049665344} {"current_steps": 5816, "total_steps": 9134, "loss": 0.8098, "learning_rate": 1.4587612001622078e-05, "epoch": 0.6366895645748378, "percentage": 63.67, "elapsed_time": "4 days, 11:02:23", "remaining_time": "2 days, 13:03:56", "throughput": 2724.44, "total_tokens": 1049844544} {"current_steps": 5817, "total_steps": 9134, "loss": 0.8392, "learning_rate": 1.4579795285345105e-05, "epoch": 0.6367990366457758, "percentage": 63.69, "elapsed_time": "4 days, 11:03:27", "remaining_time": "2 days, 13:02:48", "throughput": 2724.45, "total_tokens": 1050024416} {"current_steps": 5818, "total_steps": 9134, "loss": 0.6096, "learning_rate": 1.457197980175843e-05, "epoch": 0.6369085087167137, "percentage": 63.7, "elapsed_time": "4 days, 11:04:36", "remaining_time": "2 days, 13:01:44", "throughput": 2724.43, "total_tokens": 1050204064} {"current_steps": 5819, "total_steps": 9134, "loss": 1.0148, "learning_rate": 1.4564165551786608e-05, "epoch": 0.6370179807876516, "percentage": 63.71, "elapsed_time": "4 days, 11:05:41", "remaining_time": "2 days, 13:00:37", "throughput": 2724.39, "total_tokens": 1050365120} {"current_steps": 5820, "total_steps": 9134, "loss": 0.9983, "learning_rate": 1.455635253635404e-05, "epoch": 0.6371274528585894, "percentage": 63.72, "elapsed_time": "4 days, 11:06:50", "remaining_time": "2 days, 12:59:32", "throughput": 2724.44, "total_tokens": 1050573440} {"current_steps": 5821, "total_steps": 9134, "loss": 0.6563, "learning_rate": 1.454854075638502e-05, "epoch": 0.6372369249295273, "percentage": 63.73, "elapsed_time": "4 days, 11:07:49", "remaining_time": "2 days, 12:58:22", "throughput": 2724.39, "total_tokens": 1050714560} {"current_steps": 5822, "total_steps": 9134, "loss": 0.7213, "learning_rate": 1.4540730212803633e-05, "epoch": 0.6373463970004652, "percentage": 63.74, "elapsed_time": "4 days, 11:08:52", "remaining_time": "2 days, 12:57:14", "throughput": 2724.35, "total_tokens": 1050869568} {"current_steps": 5823, "total_steps": 9134, "loss": 0.5928, "learning_rate": 1.4532920906533875e-05, "epoch": 0.6374558690714032, "percentage": 63.75, "elapsed_time": "4 days, 11:10:00", "remaining_time": "2 days, 12:56:09", "throughput": 2724.34, "total_tokens": 1051051456} {"current_steps": 5824, "total_steps": 9134, "loss": 0.6504, "learning_rate": 1.4525112838499567e-05, "epoch": 0.6375653411423411, "percentage": 63.76, "elapsed_time": "4 days, 11:11:10", "remaining_time": "2 days, 12:55:04", "throughput": 2724.36, "total_tokens": 1051251488} {"current_steps": 5825, "total_steps": 9134, "loss": 0.7007, "learning_rate": 1.4517306009624382e-05, "epoch": 0.637674813213279, "percentage": 63.77, "elapsed_time": "4 days, 11:12:15", "remaining_time": "2 days, 12:53:57", "throughput": 2724.38, "total_tokens": 1051432928} {"current_steps": 5826, "total_steps": 9134, "loss": 0.7974, "learning_rate": 1.450950042083186e-05, "epoch": 0.6377842852842168, "percentage": 63.78, "elapsed_time": "4 days, 11:13:18", "remaining_time": "2 days, 12:52:49", "throughput": 2724.34, "total_tokens": 1051589280} {"current_steps": 5827, "total_steps": 9134, "loss": 0.9087, "learning_rate": 1.4501696073045382e-05, "epoch": 0.6378937573551547, "percentage": 63.79, "elapsed_time": "4 days, 11:14:25", "remaining_time": "2 days, 12:51:44", "throughput": 2724.38, "total_tokens": 1051791776} {"current_steps": 5828, "total_steps": 9134, "loss": 0.67, "learning_rate": 1.4493892967188188e-05, "epoch": 0.6380032294260927, "percentage": 63.81, "elapsed_time": "4 days, 11:15:34", "remaining_time": "2 days, 12:50:39", "throughput": 2724.44, "total_tokens": 1052000096} {"current_steps": 5829, "total_steps": 9134, "loss": 0.7275, "learning_rate": 1.4486091104183364e-05, "epoch": 0.6381127014970306, "percentage": 63.82, "elapsed_time": "4 days, 11:16:40", "remaining_time": "2 days, 12:49:32", "throughput": 2724.38, "total_tokens": 1052157344} {"current_steps": 5830, "total_steps": 9134, "loss": 0.6996, "learning_rate": 1.4478290484953871e-05, "epoch": 0.6382221735679685, "percentage": 63.83, "elapsed_time": "4 days, 11:17:46", "remaining_time": "2 days, 12:48:26", "throughput": 2724.34, "total_tokens": 1052323776} {"current_steps": 5831, "total_steps": 9134, "loss": 0.6478, "learning_rate": 1.4470491110422502e-05, "epoch": 0.6383316456389063, "percentage": 63.84, "elapsed_time": "4 days, 11:18:47", "remaining_time": "2 days, 12:47:17", "throughput": 2724.3, "total_tokens": 1052471392} {"current_steps": 5832, "total_steps": 9134, "loss": 0.6081, "learning_rate": 1.4462692981511906e-05, "epoch": 0.6384411177098442, "percentage": 63.85, "elapsed_time": "4 days, 11:19:49", "remaining_time": "2 days, 12:46:08", "throughput": 2724.26, "total_tokens": 1052624608} {"current_steps": 5833, "total_steps": 9134, "loss": 0.8397, "learning_rate": 1.4454896099144583e-05, "epoch": 0.6385505897807822, "percentage": 63.86, "elapsed_time": "4 days, 11:20:57", "remaining_time": "2 days, 12:45:03", "throughput": 2724.29, "total_tokens": 1052821952} {"current_steps": 5834, "total_steps": 9134, "loss": 0.8159, "learning_rate": 1.4447100464242894e-05, "epoch": 0.6386600618517201, "percentage": 63.87, "elapsed_time": "4 days, 11:22:07", "remaining_time": "2 days, 12:43:59", "throughput": 2724.35, "total_tokens": 1053036544} {"current_steps": 5835, "total_steps": 9134, "loss": 0.8028, "learning_rate": 1.4439306077729048e-05, "epoch": 0.638769533922658, "percentage": 63.88, "elapsed_time": "4 days, 11:23:14", "remaining_time": "2 days, 12:42:53", "throughput": 2724.37, "total_tokens": 1053226720} {"current_steps": 5836, "total_steps": 9134, "loss": 0.8351, "learning_rate": 1.4431512940525102e-05, "epoch": 0.6388790059935959, "percentage": 63.89, "elapsed_time": "4 days, 11:24:21", "remaining_time": "2 days, 12:41:47", "throughput": 2724.42, "total_tokens": 1053427424} {"current_steps": 5837, "total_steps": 9134, "loss": 0.8371, "learning_rate": 1.4423721053552963e-05, "epoch": 0.6389884780645337, "percentage": 63.9, "elapsed_time": "4 days, 11:25:24", "remaining_time": "2 days, 12:40:39", "throughput": 2724.37, "total_tokens": 1053582432} {"current_steps": 5838, "total_steps": 9134, "loss": 0.8339, "learning_rate": 1.4415930417734414e-05, "epoch": 0.6390979501354717, "percentage": 63.92, "elapsed_time": "4 days, 11:26:32", "remaining_time": "2 days, 12:39:34", "throughput": 2724.38, "total_tokens": 1053770592} {"current_steps": 5839, "total_steps": 9134, "loss": 0.808, "learning_rate": 1.4408141033991064e-05, "epoch": 0.6392074222064096, "percentage": 63.93, "elapsed_time": "4 days, 11:27:40", "remaining_time": "2 days, 12:38:29", "throughput": 2724.38, "total_tokens": 1053956288} {"current_steps": 5840, "total_steps": 9134, "loss": 0.8097, "learning_rate": 1.4400352903244382e-05, "epoch": 0.6393168942773475, "percentage": 63.94, "elapsed_time": "4 days, 11:28:49", "remaining_time": "2 days, 12:37:24", "throughput": 2724.44, "total_tokens": 1054167072} {"current_steps": 5841, "total_steps": 9134, "loss": 0.7692, "learning_rate": 1.4392566026415688e-05, "epoch": 0.6394263663482854, "percentage": 63.95, "elapsed_time": "4 days, 11:29:53", "remaining_time": "2 days, 12:36:16", "throughput": 2724.4, "total_tokens": 1054323200} {"current_steps": 5842, "total_steps": 9134, "loss": 0.7929, "learning_rate": 1.4384780404426157e-05, "epoch": 0.6395358384192233, "percentage": 63.96, "elapsed_time": "4 days, 11:31:02", "remaining_time": "2 days, 12:35:11", "throughput": 2724.41, "total_tokens": 1054516064} {"current_steps": 5843, "total_steps": 9134, "loss": 0.6091, "learning_rate": 1.4376996038196807e-05, "epoch": 0.6396453104901612, "percentage": 63.97, "elapsed_time": "4 days, 11:32:07", "remaining_time": "2 days, 12:34:05", "throughput": 2724.38, "total_tokens": 1054682272} {"current_steps": 5844, "total_steps": 9134, "loss": 0.8387, "learning_rate": 1.4369212928648513e-05, "epoch": 0.6397547825610991, "percentage": 63.98, "elapsed_time": "4 days, 11:33:11", "remaining_time": "2 days, 12:32:57", "throughput": 2724.39, "total_tokens": 1054862816} {"current_steps": 5845, "total_steps": 9134, "loss": 0.8011, "learning_rate": 1.4361431076702019e-05, "epoch": 0.639864254632037, "percentage": 63.99, "elapsed_time": "4 days, 11:34:18", "remaining_time": "2 days, 12:31:51", "throughput": 2724.4, "total_tokens": 1055047616} {"current_steps": 5846, "total_steps": 9134, "loss": 0.7982, "learning_rate": 1.4353650483277881e-05, "epoch": 0.6399737267029749, "percentage": 64.0, "elapsed_time": "4 days, 11:35:26", "remaining_time": "2 days, 12:30:46", "throughput": 2724.43, "total_tokens": 1055242272} {"current_steps": 5847, "total_steps": 9134, "loss": 0.5904, "learning_rate": 1.4345871149296552e-05, "epoch": 0.6400831987739128, "percentage": 64.01, "elapsed_time": "4 days, 11:36:32", "remaining_time": "2 days, 12:29:39", "throughput": 2724.43, "total_tokens": 1055424384} {"current_steps": 5848, "total_steps": 9134, "loss": 0.8858, "learning_rate": 1.433809307567828e-05, "epoch": 0.6401926708448507, "percentage": 64.02, "elapsed_time": "4 days, 11:37:39", "remaining_time": "2 days, 12:28:34", "throughput": 2724.47, "total_tokens": 1055622400} {"current_steps": 5849, "total_steps": 9134, "loss": 0.6447, "learning_rate": 1.4330316263343224e-05, "epoch": 0.6403021429157886, "percentage": 64.04, "elapsed_time": "4 days, 11:38:43", "remaining_time": "2 days, 12:27:26", "throughput": 2724.44, "total_tokens": 1055786144} {"current_steps": 5850, "total_steps": 9134, "loss": 0.6204, "learning_rate": 1.432254071321136e-05, "epoch": 0.6404116149867265, "percentage": 64.05, "elapsed_time": "4 days, 11:39:50", "remaining_time": "2 days, 12:26:20", "throughput": 2724.46, "total_tokens": 1055974976} {"current_steps": 5851, "total_steps": 9134, "loss": 0.7833, "learning_rate": 1.4314766426202507e-05, "epoch": 0.6405210870576644, "percentage": 64.06, "elapsed_time": "4 days, 11:40:54", "remaining_time": "2 days, 12:25:13", "throughput": 2724.41, "total_tokens": 1056128416} {"current_steps": 5852, "total_steps": 9134, "loss": 0.753, "learning_rate": 1.430699340323638e-05, "epoch": 0.6406305591286023, "percentage": 64.07, "elapsed_time": "4 days, 11:42:02", "remaining_time": "2 days, 12:24:08", "throughput": 2724.4, "total_tokens": 1056310976} {"current_steps": 5853, "total_steps": 9134, "loss": 0.6965, "learning_rate": 1.429922164523247e-05, "epoch": 0.6407400311995403, "percentage": 64.08, "elapsed_time": "4 days, 11:43:06", "remaining_time": "2 days, 12:23:00", "throughput": 2724.34, "total_tokens": 1056462176} {"current_steps": 5854, "total_steps": 9134, "loss": 0.6152, "learning_rate": 1.4291451153110202e-05, "epoch": 0.6408495032704781, "percentage": 64.09, "elapsed_time": "4 days, 11:44:12", "remaining_time": "2 days, 12:21:54", "throughput": 2724.33, "total_tokens": 1056637344} {"current_steps": 5855, "total_steps": 9134, "loss": 0.7361, "learning_rate": 1.4283681927788772e-05, "epoch": 0.640958975341416, "percentage": 64.1, "elapsed_time": "4 days, 11:45:15", "remaining_time": "2 days, 12:20:46", "throughput": 2724.31, "total_tokens": 1056802432} {"current_steps": 5856, "total_steps": 9134, "loss": 0.9905, "learning_rate": 1.4275913970187305e-05, "epoch": 0.6410684474123539, "percentage": 64.11, "elapsed_time": "4 days, 11:46:24", "remaining_time": "2 days, 12:19:41", "throughput": 2724.39, "total_tokens": 1057023072} {"current_steps": 5857, "total_steps": 9134, "loss": 0.7575, "learning_rate": 1.4268147281224695e-05, "epoch": 0.6411779194832918, "percentage": 64.12, "elapsed_time": "4 days, 11:47:34", "remaining_time": "2 days, 12:18:36", "throughput": 2724.41, "total_tokens": 1057219296} {"current_steps": 5858, "total_steps": 9134, "loss": 0.7153, "learning_rate": 1.4260381861819755e-05, "epoch": 0.6412873915542298, "percentage": 64.13, "elapsed_time": "4 days, 11:48:42", "remaining_time": "2 days, 12:17:31", "throughput": 2724.41, "total_tokens": 1057403872} {"current_steps": 5859, "total_steps": 9134, "loss": 0.6355, "learning_rate": 1.4252617712891109e-05, "epoch": 0.6413968636251677, "percentage": 64.14, "elapsed_time": "4 days, 11:49:47", "remaining_time": "2 days, 12:16:24", "throughput": 2724.39, "total_tokens": 1057575232} {"current_steps": 5860, "total_steps": 9134, "loss": 0.8774, "learning_rate": 1.424485483535724e-05, "epoch": 0.6415063356961055, "percentage": 64.16, "elapsed_time": "4 days, 11:50:55", "remaining_time": "2 days, 12:15:19", "throughput": 2724.37, "total_tokens": 1057750176} {"current_steps": 5861, "total_steps": 9134, "loss": 0.7405, "learning_rate": 1.4237093230136489e-05, "epoch": 0.6416158077670434, "percentage": 64.17, "elapsed_time": "4 days, 11:52:01", "remaining_time": "2 days, 12:14:12", "throughput": 2724.3, "total_tokens": 1057904736} {"current_steps": 5862, "total_steps": 9134, "loss": 0.7912, "learning_rate": 1.4229332898147022e-05, "epoch": 0.6417252798379813, "percentage": 64.18, "elapsed_time": "4 days, 11:53:10", "remaining_time": "2 days, 12:13:08", "throughput": 2724.31, "total_tokens": 1058098272} {"current_steps": 5863, "total_steps": 9134, "loss": 1.1416, "learning_rate": 1.4221573840306902e-05, "epoch": 0.6418347519089193, "percentage": 64.19, "elapsed_time": "4 days, 11:54:19", "remaining_time": "2 days, 12:12:03", "throughput": 2724.37, "total_tokens": 1058305248} {"current_steps": 5864, "total_steps": 9134, "loss": 0.8632, "learning_rate": 1.421381605753397e-05, "epoch": 0.6419442239798572, "percentage": 64.2, "elapsed_time": "4 days, 11:55:20", "remaining_time": "2 days, 12:10:54", "throughput": 2724.31, "total_tokens": 1058452416} {"current_steps": 5865, "total_steps": 9134, "loss": 0.6574, "learning_rate": 1.4206059550745993e-05, "epoch": 0.642053696050795, "percentage": 64.21, "elapsed_time": "4 days, 11:56:21", "remaining_time": "2 days, 12:09:45", "throughput": 2724.28, "total_tokens": 1058604736} {"current_steps": 5866, "total_steps": 9134, "loss": 0.6998, "learning_rate": 1.4198304320860534e-05, "epoch": 0.6421631681217329, "percentage": 64.22, "elapsed_time": "4 days, 11:57:28", "remaining_time": "2 days, 12:08:39", "throughput": 2724.23, "total_tokens": 1058768256} {"current_steps": 5867, "total_steps": 9134, "loss": 0.6786, "learning_rate": 1.4190550368795024e-05, "epoch": 0.6422726401926708, "percentage": 64.23, "elapsed_time": "4 days, 11:58:37", "remaining_time": "2 days, 12:07:35", "throughput": 2724.23, "total_tokens": 1058956864} {"current_steps": 5868, "total_steps": 9134, "loss": 0.9602, "learning_rate": 1.4182797695466743e-05, "epoch": 0.6423821122636088, "percentage": 64.24, "elapsed_time": "4 days, 11:59:45", "remaining_time": "2 days, 12:06:29", "throughput": 2724.23, "total_tokens": 1059140768} {"current_steps": 5869, "total_steps": 9134, "loss": 0.7441, "learning_rate": 1.4175046301792816e-05, "epoch": 0.6424915843345467, "percentage": 64.25, "elapsed_time": "4 days, 12:00:53", "remaining_time": "2 days, 12:05:24", "throughput": 2724.23, "total_tokens": 1059326240} {"current_steps": 5870, "total_steps": 9134, "loss": 0.8584, "learning_rate": 1.4167296188690204e-05, "epoch": 0.6426010564054846, "percentage": 64.27, "elapsed_time": "4 days, 12:01:59", "remaining_time": "2 days, 12:04:17", "throughput": 2724.18, "total_tokens": 1059486624} {"current_steps": 5871, "total_steps": 9134, "loss": 0.8884, "learning_rate": 1.4159547357075759e-05, "epoch": 0.6427105284764224, "percentage": 64.28, "elapsed_time": "4 days, 12:03:03", "remaining_time": "2 days, 12:03:10", "throughput": 2724.15, "total_tokens": 1059651040} {"current_steps": 5872, "total_steps": 9134, "loss": 0.8569, "learning_rate": 1.4151799807866135e-05, "epoch": 0.6428200005473603, "percentage": 64.29, "elapsed_time": "4 days, 12:04:06", "remaining_time": "2 days, 12:02:02", "throughput": 2724.14, "total_tokens": 1059816352} {"current_steps": 5873, "total_steps": 9134, "loss": 0.5537, "learning_rate": 1.4144053541977855e-05, "epoch": 0.6429294726182982, "percentage": 64.3, "elapsed_time": "4 days, 12:05:10", "remaining_time": "2 days, 12:00:54", "throughput": 2724.11, "total_tokens": 1059978752} {"current_steps": 5874, "total_steps": 9134, "loss": 0.6876, "learning_rate": 1.4136308560327288e-05, "epoch": 0.6430389446892362, "percentage": 64.31, "elapsed_time": "4 days, 12:06:17", "remaining_time": "2 days, 11:59:48", "throughput": 2724.07, "total_tokens": 1060146304} {"current_steps": 5875, "total_steps": 9134, "loss": 0.8544, "learning_rate": 1.4128564863830655e-05, "epoch": 0.6431484167601741, "percentage": 64.32, "elapsed_time": "4 days, 12:07:23", "remaining_time": "2 days, 11:58:42", "throughput": 2724.0, "total_tokens": 1060300416} {"current_steps": 5876, "total_steps": 9134, "loss": 0.8103, "learning_rate": 1.4120822453404011e-05, "epoch": 0.643257888831112, "percentage": 64.33, "elapsed_time": "4 days, 12:08:30", "remaining_time": "2 days, 11:57:36", "throughput": 2724.01, "total_tokens": 1060483648} {"current_steps": 5877, "total_steps": 9134, "loss": 0.6578, "learning_rate": 1.4113081329963265e-05, "epoch": 0.6433673609020498, "percentage": 64.34, "elapsed_time": "4 days, 12:09:31", "remaining_time": "2 days, 11:56:27", "throughput": 2723.96, "total_tokens": 1060632160} {"current_steps": 5878, "total_steps": 9134, "loss": 0.9817, "learning_rate": 1.4105341494424206e-05, "epoch": 0.6434768329729877, "percentage": 64.35, "elapsed_time": "4 days, 12:10:36", "remaining_time": "2 days, 11:55:20", "throughput": 2723.96, "total_tokens": 1060810464} {"current_steps": 5879, "total_steps": 9134, "loss": 0.8496, "learning_rate": 1.40976029477024e-05, "epoch": 0.6435863050439257, "percentage": 64.36, "elapsed_time": "4 days, 12:11:45", "remaining_time": "2 days, 11:54:15", "throughput": 2723.99, "total_tokens": 1061007136} {"current_steps": 5880, "total_steps": 9134, "loss": 0.7507, "learning_rate": 1.4089865690713337e-05, "epoch": 0.6436957771148636, "percentage": 64.37, "elapsed_time": "4 days, 12:12:52", "remaining_time": "2 days, 11:53:10", "throughput": 2723.99, "total_tokens": 1061191488} {"current_steps": 5881, "total_steps": 9134, "loss": 0.8594, "learning_rate": 1.40821297243723e-05, "epoch": 0.6438052491858015, "percentage": 64.39, "elapsed_time": "4 days, 12:14:01", "remaining_time": "2 days, 11:52:05", "throughput": 2724.02, "total_tokens": 1061390176} {"current_steps": 5882, "total_steps": 9134, "loss": 0.8612, "learning_rate": 1.407439504959445e-05, "epoch": 0.6439147212567393, "percentage": 64.4, "elapsed_time": "4 days, 12:15:09", "remaining_time": "2 days, 11:50:59", "throughput": 2724.07, "total_tokens": 1061596704} {"current_steps": 5883, "total_steps": 9134, "loss": 0.7493, "learning_rate": 1.4066661667294779e-05, "epoch": 0.6440241933276772, "percentage": 64.41, "elapsed_time": "4 days, 12:16:14", "remaining_time": "2 days, 11:49:53", "throughput": 2724.11, "total_tokens": 1061791136} {"current_steps": 5884, "total_steps": 9134, "loss": 0.9063, "learning_rate": 1.405892957838812e-05, "epoch": 0.6441336653986152, "percentage": 64.42, "elapsed_time": "4 days, 12:17:15", "remaining_time": "2 days, 11:48:44", "throughput": 2724.04, "total_tokens": 1061930688} {"current_steps": 5885, "total_steps": 9134, "loss": 0.6925, "learning_rate": 1.4051198783789196e-05, "epoch": 0.6442431374695531, "percentage": 64.43, "elapsed_time": "4 days, 12:18:24", "remaining_time": "2 days, 11:47:39", "throughput": 2724.06, "total_tokens": 1062122432} {"current_steps": 5886, "total_steps": 9134, "loss": 1.0481, "learning_rate": 1.4043469284412509e-05, "epoch": 0.644352609540491, "percentage": 64.44, "elapsed_time": "4 days, 12:19:31", "remaining_time": "2 days, 11:46:33", "throughput": 2724.11, "total_tokens": 1062326496} {"current_steps": 5887, "total_steps": 9134, "loss": 0.6791, "learning_rate": 1.4035741081172476e-05, "epoch": 0.6444620816114289, "percentage": 64.45, "elapsed_time": "4 days, 12:20:41", "remaining_time": "2 days, 11:45:29", "throughput": 2724.14, "total_tokens": 1062526976} {"current_steps": 5888, "total_steps": 9134, "loss": 0.7345, "learning_rate": 1.4028014174983295e-05, "epoch": 0.6445715536823667, "percentage": 64.46, "elapsed_time": "4 days, 12:21:46", "remaining_time": "2 days, 11:44:22", "throughput": 2724.11, "total_tokens": 1062695424} {"current_steps": 5889, "total_steps": 9134, "loss": 0.8422, "learning_rate": 1.402028856675908e-05, "epoch": 0.6446810257533047, "percentage": 64.47, "elapsed_time": "4 days, 12:22:54", "remaining_time": "2 days, 11:43:16", "throughput": 2724.16, "total_tokens": 1062898592} {"current_steps": 5890, "total_steps": 9134, "loss": 0.693, "learning_rate": 1.4012564257413718e-05, "epoch": 0.6447904978242426, "percentage": 64.48, "elapsed_time": "4 days, 12:24:00", "remaining_time": "2 days, 11:42:10", "throughput": 2724.22, "total_tokens": 1063102656} {"current_steps": 5891, "total_steps": 9134, "loss": 0.6337, "learning_rate": 1.4004841247861011e-05, "epoch": 0.6448999698951805, "percentage": 64.5, "elapsed_time": "4 days, 12:25:08", "remaining_time": "2 days, 11:41:05", "throughput": 2724.23, "total_tokens": 1063289248} {"current_steps": 5892, "total_steps": 9134, "loss": 0.6774, "learning_rate": 1.3997119539014566e-05, "epoch": 0.6450094419661184, "percentage": 64.51, "elapsed_time": "4 days, 12:26:13", "remaining_time": "2 days, 11:39:58", "throughput": 2724.2, "total_tokens": 1063457248} {"current_steps": 5893, "total_steps": 9134, "loss": 0.8856, "learning_rate": 1.3989399131787836e-05, "epoch": 0.6451189140370563, "percentage": 64.52, "elapsed_time": "4 days, 12:27:19", "remaining_time": "2 days, 11:38:51", "throughput": 2724.19, "total_tokens": 1063633536} {"current_steps": 5894, "total_steps": 9134, "loss": 0.7736, "learning_rate": 1.398168002709416e-05, "epoch": 0.6452283861079942, "percentage": 64.53, "elapsed_time": "4 days, 12:28:28", "remaining_time": "2 days, 11:37:46", "throughput": 2724.19, "total_tokens": 1063819904} {"current_steps": 5895, "total_steps": 9134, "loss": 0.8029, "learning_rate": 1.3973962225846654e-05, "epoch": 0.6453378581789321, "percentage": 64.54, "elapsed_time": "4 days, 12:29:34", "remaining_time": "2 days, 11:36:40", "throughput": 2724.13, "total_tokens": 1063976032} {"current_steps": 5896, "total_steps": 9134, "loss": 0.805, "learning_rate": 1.3966245728958355e-05, "epoch": 0.64544733024987, "percentage": 64.55, "elapsed_time": "4 days, 12:30:44", "remaining_time": "2 days, 11:35:36", "throughput": 2724.22, "total_tokens": 1064201376} {"current_steps": 5897, "total_steps": 9134, "loss": 1.0171, "learning_rate": 1.3958530537342075e-05, "epoch": 0.6455568023208079, "percentage": 64.56, "elapsed_time": "4 days, 12:31:52", "remaining_time": "2 days, 11:34:31", "throughput": 2724.29, "total_tokens": 1064413056} {"current_steps": 5898, "total_steps": 9134, "loss": 0.6528, "learning_rate": 1.3950816651910537e-05, "epoch": 0.6456662743917458, "percentage": 64.57, "elapsed_time": "4 days, 12:32:58", "remaining_time": "2 days, 11:33:24", "throughput": 2724.3, "total_tokens": 1064597184} {"current_steps": 5899, "total_steps": 9134, "loss": 0.7325, "learning_rate": 1.3943104073576263e-05, "epoch": 0.6457757464626837, "percentage": 64.58, "elapsed_time": "4 days, 12:34:05", "remaining_time": "2 days, 11:32:18", "throughput": 2724.32, "total_tokens": 1064786688} {"current_steps": 5900, "total_steps": 9134, "loss": 0.5231, "learning_rate": 1.393539280325164e-05, "epoch": 0.6458852185336216, "percentage": 64.59, "elapsed_time": "4 days, 12:35:12", "remaining_time": "2 days, 11:31:13", "throughput": 2724.29, "total_tokens": 1064958944} {"current_steps": 5901, "total_steps": 9134, "loss": 0.7512, "learning_rate": 1.3927682841848899e-05, "epoch": 0.6459946906045595, "percentage": 64.6, "elapsed_time": "4 days, 12:36:19", "remaining_time": "2 days, 11:30:07", "throughput": 2724.26, "total_tokens": 1065131872} {"current_steps": 5902, "total_steps": 9134, "loss": 0.7698, "learning_rate": 1.391997419028011e-05, "epoch": 0.6461041626754974, "percentage": 64.62, "elapsed_time": "4 days, 12:37:24", "remaining_time": "2 days, 11:29:00", "throughput": 2724.2, "total_tokens": 1065284192} {"current_steps": 5903, "total_steps": 9134, "loss": 0.7973, "learning_rate": 1.3912266849457195e-05, "epoch": 0.6462136347464353, "percentage": 64.63, "elapsed_time": "4 days, 12:38:25", "remaining_time": "2 days, 11:27:51", "throughput": 2724.13, "total_tokens": 1065424640} {"current_steps": 5904, "total_steps": 9134, "loss": 0.7326, "learning_rate": 1.3904560820291902e-05, "epoch": 0.6463231068173733, "percentage": 64.64, "elapsed_time": "4 days, 12:39:32", "remaining_time": "2 days, 11:26:45", "throughput": 2724.18, "total_tokens": 1065624224} {"current_steps": 5905, "total_steps": 9134, "loss": 0.5482, "learning_rate": 1.3896856103695866e-05, "epoch": 0.6464325788883111, "percentage": 64.65, "elapsed_time": "4 days, 12:40:38", "remaining_time": "2 days, 11:25:38", "throughput": 2724.19, "total_tokens": 1065808576} {"current_steps": 5906, "total_steps": 9134, "loss": 0.6962, "learning_rate": 1.3889152700580527e-05, "epoch": 0.646542050959249, "percentage": 64.66, "elapsed_time": "4 days, 12:41:46", "remaining_time": "2 days, 11:24:33", "throughput": 2724.2, "total_tokens": 1065998304} {"current_steps": 5907, "total_steps": 9134, "loss": 0.9826, "learning_rate": 1.3881450611857181e-05, "epoch": 0.6466515230301869, "percentage": 64.67, "elapsed_time": "4 days, 12:42:53", "remaining_time": "2 days, 11:23:27", "throughput": 2724.25, "total_tokens": 1066199232} {"current_steps": 5908, "total_steps": 9134, "loss": 0.7421, "learning_rate": 1.3873749838436972e-05, "epoch": 0.6467609951011248, "percentage": 64.68, "elapsed_time": "4 days, 12:44:02", "remaining_time": "2 days, 11:22:22", "throughput": 2724.29, "total_tokens": 1066403296} {"current_steps": 5909, "total_steps": 9134, "loss": 0.8185, "learning_rate": 1.386605038123089e-05, "epoch": 0.6468704671720628, "percentage": 64.69, "elapsed_time": "4 days, 12:45:05", "remaining_time": "2 days, 11:21:15", "throughput": 2724.28, "total_tokens": 1066569728} {"current_steps": 5910, "total_steps": 9134, "loss": 0.6906, "learning_rate": 1.3858352241149763e-05, "epoch": 0.6469799392430007, "percentage": 64.7, "elapsed_time": "4 days, 12:46:14", "remaining_time": "2 days, 11:20:10", "throughput": 2724.28, "total_tokens": 1066757216} {"current_steps": 5911, "total_steps": 9134, "loss": 1.0453, "learning_rate": 1.3850655419104267e-05, "epoch": 0.6470894113139385, "percentage": 64.71, "elapsed_time": "4 days, 12:47:22", "remaining_time": "2 days, 11:19:04", "throughput": 2724.29, "total_tokens": 1066946944} {"current_steps": 5912, "total_steps": 9134, "loss": 0.7292, "learning_rate": 1.3842959916004911e-05, "epoch": 0.6471988833848764, "percentage": 64.73, "elapsed_time": "4 days, 12:48:26", "remaining_time": "2 days, 11:17:57", "throughput": 2724.27, "total_tokens": 1067116512} {"current_steps": 5913, "total_steps": 9134, "loss": 0.7697, "learning_rate": 1.3835265732762076e-05, "epoch": 0.6473083554558143, "percentage": 64.74, "elapsed_time": "4 days, 12:49:32", "remaining_time": "2 days, 11:16:50", "throughput": 2724.24, "total_tokens": 1067283392} {"current_steps": 5914, "total_steps": 9134, "loss": 0.8917, "learning_rate": 1.3827572870285963e-05, "epoch": 0.6474178275267523, "percentage": 64.75, "elapsed_time": "4 days, 12:50:39", "remaining_time": "2 days, 11:15:45", "throughput": 2724.2, "total_tokens": 1067448928} {"current_steps": 5915, "total_steps": 9134, "loss": 0.6908, "learning_rate": 1.3819881329486622e-05, "epoch": 0.6475272995976902, "percentage": 64.76, "elapsed_time": "4 days, 12:51:45", "remaining_time": "2 days, 11:14:38", "throughput": 2724.23, "total_tokens": 1067642912} {"current_steps": 5916, "total_steps": 9134, "loss": 0.5815, "learning_rate": 1.3812191111273944e-05, "epoch": 0.647636771668628, "percentage": 64.77, "elapsed_time": "4 days, 12:52:51", "remaining_time": "2 days, 11:13:32", "throughput": 2724.21, "total_tokens": 1067812704} {"current_steps": 5917, "total_steps": 9134, "loss": 0.8752, "learning_rate": 1.3804502216557675e-05, "epoch": 0.6477462437395659, "percentage": 64.78, "elapsed_time": "4 days, 12:54:00", "remaining_time": "2 days, 11:12:27", "throughput": 2724.24, "total_tokens": 1068014080} {"current_steps": 5918, "total_steps": 9134, "loss": 0.7348, "learning_rate": 1.3796814646247385e-05, "epoch": 0.6478557158105038, "percentage": 64.79, "elapsed_time": "4 days, 12:55:08", "remaining_time": "2 days, 11:11:22", "throughput": 2724.24, "total_tokens": 1068196192} {"current_steps": 5919, "total_steps": 9134, "loss": 0.772, "learning_rate": 1.3789128401252502e-05, "epoch": 0.6479651878814418, "percentage": 64.8, "elapsed_time": "4 days, 12:56:13", "remaining_time": "2 days, 11:10:15", "throughput": 2724.22, "total_tokens": 1068367104} {"current_steps": 5920, "total_steps": 9134, "loss": 0.8221, "learning_rate": 1.3781443482482314e-05, "epoch": 0.6480746599523797, "percentage": 64.81, "elapsed_time": "4 days, 12:57:19", "remaining_time": "2 days, 11:09:08", "throughput": 2724.22, "total_tokens": 1068547424} {"current_steps": 5921, "total_steps": 9134, "loss": 0.8589, "learning_rate": 1.37737598908459e-05, "epoch": 0.6481841320233176, "percentage": 64.82, "elapsed_time": "4 days, 12:58:29", "remaining_time": "2 days, 11:08:04", "throughput": 2724.25, "total_tokens": 1068746560} {"current_steps": 5922, "total_steps": 9134, "loss": 0.7561, "learning_rate": 1.3766077627252233e-05, "epoch": 0.6482936040942554, "percentage": 64.83, "elapsed_time": "4 days, 12:59:35", "remaining_time": "2 days, 11:06:58", "throughput": 2724.25, "total_tokens": 1068929568} {"current_steps": 5923, "total_steps": 9134, "loss": 0.7756, "learning_rate": 1.3758396692610112e-05, "epoch": 0.6484030761651933, "percentage": 64.85, "elapsed_time": "4 days, 13:00:39", "remaining_time": "2 days, 11:05:50", "throughput": 2724.23, "total_tokens": 1069092864} {"current_steps": 5924, "total_steps": 9134, "loss": 0.633, "learning_rate": 1.3750717087828172e-05, "epoch": 0.6485125482361312, "percentage": 64.86, "elapsed_time": "4 days, 13:01:45", "remaining_time": "2 days, 11:04:44", "throughput": 2724.22, "total_tokens": 1069268928} {"current_steps": 5925, "total_steps": 9134, "loss": 0.6591, "learning_rate": 1.3743038813814896e-05, "epoch": 0.6486220203070692, "percentage": 64.87, "elapsed_time": "4 days, 13:02:54", "remaining_time": "2 days, 11:03:39", "throughput": 2724.3, "total_tokens": 1069491584} {"current_steps": 5926, "total_steps": 9134, "loss": 0.8802, "learning_rate": 1.3735361871478597e-05, "epoch": 0.6487314923780071, "percentage": 64.88, "elapsed_time": "4 days, 13:04:04", "remaining_time": "2 days, 11:02:35", "throughput": 2724.39, "total_tokens": 1069716256} {"current_steps": 5927, "total_steps": 9134, "loss": 0.9045, "learning_rate": 1.3727686261727474e-05, "epoch": 0.648840964448945, "percentage": 64.89, "elapsed_time": "4 days, 13:05:13", "remaining_time": "2 days, 11:01:30", "throughput": 2724.4, "total_tokens": 1069909120} {"current_steps": 5928, "total_steps": 9134, "loss": 0.8696, "learning_rate": 1.3720011985469494e-05, "epoch": 0.6489504365198828, "percentage": 64.9, "elapsed_time": "4 days, 13:06:21", "remaining_time": "2 days, 11:00:25", "throughput": 2724.36, "total_tokens": 1070080704} {"current_steps": 5929, "total_steps": 9134, "loss": 0.897, "learning_rate": 1.371233904361256e-05, "epoch": 0.6490599085908207, "percentage": 64.91, "elapsed_time": "4 days, 13:07:31", "remaining_time": "2 days, 10:59:20", "throughput": 2724.39, "total_tokens": 1070278496} {"current_steps": 5930, "total_steps": 9134, "loss": 0.8333, "learning_rate": 1.370466743706431e-05, "epoch": 0.6491693806617587, "percentage": 64.92, "elapsed_time": "4 days, 13:08:39", "remaining_time": "2 days, 10:58:16", "throughput": 2724.43, "total_tokens": 1070482560} {"current_steps": 5931, "total_steps": 9134, "loss": 0.6972, "learning_rate": 1.3696997166732328e-05, "epoch": 0.6492788527326966, "percentage": 64.93, "elapsed_time": "4 days, 13:09:44", "remaining_time": "2 days, 10:57:09", "throughput": 2724.43, "total_tokens": 1070661312} {"current_steps": 5932, "total_steps": 9134, "loss": 0.8837, "learning_rate": 1.3689328233523968e-05, "epoch": 0.6493883248036345, "percentage": 64.94, "elapsed_time": "4 days, 13:10:51", "remaining_time": "2 days, 10:56:03", "throughput": 2724.41, "total_tokens": 1070833120} {"current_steps": 5933, "total_steps": 9134, "loss": 0.724, "learning_rate": 1.3681660638346455e-05, "epoch": 0.6494977968745723, "percentage": 64.96, "elapsed_time": "4 days, 13:11:54", "remaining_time": "2 days, 10:54:55", "throughput": 2724.38, "total_tokens": 1070995296} {"current_steps": 5934, "total_steps": 9134, "loss": 0.8572, "learning_rate": 1.3673994382106856e-05, "epoch": 0.6496072689455102, "percentage": 64.97, "elapsed_time": "4 days, 13:13:01", "remaining_time": "2 days, 10:53:49", "throughput": 2724.39, "total_tokens": 1071181216} {"current_steps": 5935, "total_steps": 9134, "loss": 0.9961, "learning_rate": 1.3666329465712058e-05, "epoch": 0.6497167410164482, "percentage": 64.98, "elapsed_time": "4 days, 13:14:08", "remaining_time": "2 days, 10:52:43", "throughput": 2724.42, "total_tokens": 1071372960} {"current_steps": 5936, "total_steps": 9134, "loss": 0.9336, "learning_rate": 1.3658665890068836e-05, "epoch": 0.6498262130873861, "percentage": 64.99, "elapsed_time": "4 days, 13:15:18", "remaining_time": "2 days, 10:51:39", "throughput": 2724.43, "total_tokens": 1071568960} {"current_steps": 5937, "total_steps": 9134, "loss": 0.8987, "learning_rate": 1.3651003656083742e-05, "epoch": 0.649935685158324, "percentage": 65.0, "elapsed_time": "4 days, 13:16:27", "remaining_time": "2 days, 10:50:34", "throughput": 2724.51, "total_tokens": 1071787136} {"current_steps": 5938, "total_steps": 9134, "loss": 0.906, "learning_rate": 1.3643342764663225e-05, "epoch": 0.6500451572292619, "percentage": 65.01, "elapsed_time": "4 days, 13:17:34", "remaining_time": "2 days, 10:49:28", "throughput": 2724.55, "total_tokens": 1071986048} {"current_steps": 5939, "total_steps": 9134, "loss": 0.9414, "learning_rate": 1.3635683216713551e-05, "epoch": 0.6501546293001997, "percentage": 65.02, "elapsed_time": "4 days, 13:18:41", "remaining_time": "2 days, 10:48:22", "throughput": 2724.54, "total_tokens": 1072163456} {"current_steps": 5940, "total_steps": 9134, "loss": 0.6553, "learning_rate": 1.362802501314083e-05, "epoch": 0.6502641013711377, "percentage": 65.03, "elapsed_time": "4 days, 13:19:50", "remaining_time": "2 days, 10:47:17", "throughput": 2724.6, "total_tokens": 1072376928} {"current_steps": 5941, "total_steps": 9134, "loss": 0.6666, "learning_rate": 1.3620368154851008e-05, "epoch": 0.6503735734420756, "percentage": 65.04, "elapsed_time": "4 days, 13:20:56", "remaining_time": "2 days, 10:46:11", "throughput": 2724.54, "total_tokens": 1072534400} {"current_steps": 5942, "total_steps": 9134, "loss": 0.7073, "learning_rate": 1.361271264274988e-05, "epoch": 0.6504830455130135, "percentage": 65.05, "elapsed_time": "4 days, 13:22:02", "remaining_time": "2 days, 10:45:04", "throughput": 2724.53, "total_tokens": 1072709120} {"current_steps": 5943, "total_steps": 9134, "loss": 0.809, "learning_rate": 1.3605058477743077e-05, "epoch": 0.6505925175839514, "percentage": 65.06, "elapsed_time": "4 days, 13:23:11", "remaining_time": "2 days, 10:44:00", "throughput": 2724.63, "total_tokens": 1072937824} {"current_steps": 5944, "total_steps": 9134, "loss": 0.6617, "learning_rate": 1.3597405660736074e-05, "epoch": 0.6507019896548893, "percentage": 65.08, "elapsed_time": "4 days, 13:24:18", "remaining_time": "2 days, 10:42:54", "throughput": 2724.68, "total_tokens": 1073138304} {"current_steps": 5945, "total_steps": 9134, "loss": 0.6744, "learning_rate": 1.3589754192634168e-05, "epoch": 0.6508114617258272, "percentage": 65.09, "elapsed_time": "4 days, 13:25:25", "remaining_time": "2 days, 10:41:48", "throughput": 2724.69, "total_tokens": 1073324224} {"current_steps": 5946, "total_steps": 9134, "loss": 1.1437, "learning_rate": 1.3582104074342544e-05, "epoch": 0.6509209337967651, "percentage": 65.1, "elapsed_time": "4 days, 13:26:28", "remaining_time": "2 days, 10:40:40", "throughput": 2724.6, "total_tokens": 1073459744} {"current_steps": 5947, "total_steps": 9134, "loss": 0.8746, "learning_rate": 1.3574455306766179e-05, "epoch": 0.651030405867703, "percentage": 65.11, "elapsed_time": "4 days, 13:27:38", "remaining_time": "2 days, 10:39:36", "throughput": 2724.66, "total_tokens": 1073674112} {"current_steps": 5948, "total_steps": 9134, "loss": 0.7593, "learning_rate": 1.3566807890809907e-05, "epoch": 0.6511398779386409, "percentage": 65.12, "elapsed_time": "4 days, 13:28:39", "remaining_time": "2 days, 10:38:26", "throughput": 2724.61, "total_tokens": 1073821952} {"current_steps": 5949, "total_steps": 9134, "loss": 0.9731, "learning_rate": 1.3559161827378409e-05, "epoch": 0.6512493500095788, "percentage": 65.13, "elapsed_time": "4 days, 13:29:45", "remaining_time": "2 days, 10:37:20", "throughput": 2724.64, "total_tokens": 1074013248} {"current_steps": 5950, "total_steps": 9134, "loss": 0.736, "learning_rate": 1.3551517117376195e-05, "epoch": 0.6513588220805167, "percentage": 65.14, "elapsed_time": "4 days, 13:30:48", "remaining_time": "2 days, 10:36:12", "throughput": 2724.62, "total_tokens": 1074175648} {"current_steps": 5951, "total_steps": 9134, "loss": 0.7391, "learning_rate": 1.3543873761707617e-05, "epoch": 0.6514682941514546, "percentage": 65.15, "elapsed_time": "4 days, 13:31:55", "remaining_time": "2 days, 10:35:06", "throughput": 2724.62, "total_tokens": 1074358880} {"current_steps": 5952, "total_steps": 9134, "loss": 0.795, "learning_rate": 1.3536231761276866e-05, "epoch": 0.6515777662223925, "percentage": 65.16, "elapsed_time": "4 days, 13:33:02", "remaining_time": "2 days, 10:34:01", "throughput": 2724.62, "total_tokens": 1074542784} {"current_steps": 5953, "total_steps": 9134, "loss": 0.7072, "learning_rate": 1.3528591116988e-05, "epoch": 0.6516872382933304, "percentage": 65.17, "elapsed_time": "4 days, 13:34:07", "remaining_time": "2 days, 10:32:53", "throughput": 2724.62, "total_tokens": 1074717056} {"current_steps": 5954, "total_steps": 9134, "loss": 0.8962, "learning_rate": 1.3520951829744857e-05, "epoch": 0.6517967103642683, "percentage": 65.19, "elapsed_time": "4 days, 13:35:10", "remaining_time": "2 days, 10:31:46", "throughput": 2724.57, "total_tokens": 1074873856} {"current_steps": 5955, "total_steps": 9134, "loss": 0.592, "learning_rate": 1.351331390045118e-05, "epoch": 0.6519061824352063, "percentage": 65.2, "elapsed_time": "4 days, 13:36:16", "remaining_time": "2 days, 10:30:39", "throughput": 2724.54, "total_tokens": 1075040512} {"current_steps": 5956, "total_steps": 9134, "loss": 0.5933, "learning_rate": 1.3505677330010505e-05, "epoch": 0.6520156545061441, "percentage": 65.21, "elapsed_time": "4 days, 13:37:17", "remaining_time": "2 days, 10:29:30", "throughput": 2724.48, "total_tokens": 1075179616} {"current_steps": 5957, "total_steps": 9134, "loss": 0.726, "learning_rate": 1.3498042119326232e-05, "epoch": 0.652125126577082, "percentage": 65.22, "elapsed_time": "4 days, 13:38:20", "remaining_time": "2 days, 10:28:22", "throughput": 2724.41, "total_tokens": 1075324096} {"current_steps": 5958, "total_steps": 9134, "loss": 0.8596, "learning_rate": 1.3490408269301585e-05, "epoch": 0.6522345986480199, "percentage": 65.23, "elapsed_time": "4 days, 13:39:25", "remaining_time": "2 days, 10:27:15", "throughput": 2724.4, "total_tokens": 1075498368} {"current_steps": 5959, "total_steps": 9134, "loss": 0.8312, "learning_rate": 1.3482775780839632e-05, "epoch": 0.6523440707189578, "percentage": 65.24, "elapsed_time": "4 days, 13:40:31", "remaining_time": "2 days, 10:26:09", "throughput": 2724.4, "total_tokens": 1075679360} {"current_steps": 5960, "total_steps": 9134, "loss": 1.0448, "learning_rate": 1.3475144654843302e-05, "epoch": 0.6524535427898958, "percentage": 65.25, "elapsed_time": "4 days, 13:41:41", "remaining_time": "2 days, 10:25:04", "throughput": 2724.43, "total_tokens": 1075882304} {"current_steps": 5961, "total_steps": 9134, "loss": 1.1132, "learning_rate": 1.346751489221531e-05, "epoch": 0.6525630148608337, "percentage": 65.26, "elapsed_time": "4 days, 13:42:50", "remaining_time": "2 days, 10:23:59", "throughput": 2724.5, "total_tokens": 1076095552} {"current_steps": 5962, "total_steps": 9134, "loss": 0.8572, "learning_rate": 1.3459886493858282e-05, "epoch": 0.6526724869317715, "percentage": 65.27, "elapsed_time": "4 days, 13:43:56", "remaining_time": "2 days, 10:22:53", "throughput": 2724.49, "total_tokens": 1076272512} {"current_steps": 5963, "total_steps": 9134, "loss": 0.8037, "learning_rate": 1.3452259460674599e-05, "epoch": 0.6527819590027094, "percentage": 65.28, "elapsed_time": "4 days, 13:45:05", "remaining_time": "2 days, 10:21:49", "throughput": 2724.55, "total_tokens": 1076486656} {"current_steps": 5964, "total_steps": 9134, "loss": 0.6937, "learning_rate": 1.3444633793566556e-05, "epoch": 0.6528914310736473, "percentage": 65.29, "elapsed_time": "4 days, 13:46:13", "remaining_time": "2 days, 10:20:43", "throughput": 2724.62, "total_tokens": 1076696320} {"current_steps": 5965, "total_steps": 9134, "loss": 1.0418, "learning_rate": 1.3437009493436243e-05, "epoch": 0.6530009031445853, "percentage": 65.31, "elapsed_time": "4 days, 13:47:20", "remaining_time": "2 days, 10:19:37", "throughput": 2724.66, "total_tokens": 1076897920} {"current_steps": 5966, "total_steps": 9134, "loss": 0.8658, "learning_rate": 1.3429386561185606e-05, "epoch": 0.6531103752155232, "percentage": 65.32, "elapsed_time": "4 days, 13:48:27", "remaining_time": "2 days, 10:18:31", "throughput": 2724.64, "total_tokens": 1077070176} {"current_steps": 5967, "total_steps": 9134, "loss": 0.6483, "learning_rate": 1.3421764997716418e-05, "epoch": 0.653219847286461, "percentage": 65.33, "elapsed_time": "4 days, 13:49:29", "remaining_time": "2 days, 10:17:23", "throughput": 2724.6, "total_tokens": 1077226080} {"current_steps": 5968, "total_steps": 9134, "loss": 0.6413, "learning_rate": 1.3414144803930284e-05, "epoch": 0.6533293193573989, "percentage": 65.34, "elapsed_time": "4 days, 13:50:37", "remaining_time": "2 days, 10:16:18", "throughput": 2724.62, "total_tokens": 1077416256} {"current_steps": 5969, "total_steps": 9134, "loss": 0.6472, "learning_rate": 1.3406525980728697e-05, "epoch": 0.6534387914283368, "percentage": 65.35, "elapsed_time": "4 days, 13:51:44", "remaining_time": "2 days, 10:15:11", "throughput": 2724.62, "total_tokens": 1077597920} {"current_steps": 5970, "total_steps": 9134, "loss": 0.6306, "learning_rate": 1.3398908529012899e-05, "epoch": 0.6535482634992748, "percentage": 65.36, "elapsed_time": "4 days, 13:52:50", "remaining_time": "2 days, 10:14:05", "throughput": 2724.63, "total_tokens": 1077780928} {"current_steps": 5971, "total_steps": 9134, "loss": 0.9286, "learning_rate": 1.3391292449684067e-05, "epoch": 0.6536577355702127, "percentage": 65.37, "elapsed_time": "4 days, 13:53:59", "remaining_time": "2 days, 10:13:00", "throughput": 2724.66, "total_tokens": 1077981856} {"current_steps": 5972, "total_steps": 9134, "loss": 0.6376, "learning_rate": 1.3383677743643126e-05, "epoch": 0.6537672076411506, "percentage": 65.38, "elapsed_time": "4 days, 13:55:07", "remaining_time": "2 days, 10:11:55", "throughput": 2724.72, "total_tokens": 1078189728} {"current_steps": 5973, "total_steps": 9134, "loss": 0.8157, "learning_rate": 1.3376064411790909e-05, "epoch": 0.6538766797120884, "percentage": 65.39, "elapsed_time": "4 days, 13:56:12", "remaining_time": "2 days, 10:10:48", "throughput": 2724.75, "total_tokens": 1078378784} {"current_steps": 5974, "total_steps": 9134, "loss": 0.5301, "learning_rate": 1.3368452455028052e-05, "epoch": 0.6539861517830263, "percentage": 65.4, "elapsed_time": "4 days, 13:57:18", "remaining_time": "2 days, 10:09:42", "throughput": 2724.75, "total_tokens": 1078562016} {"current_steps": 5975, "total_steps": 9134, "loss": 0.7936, "learning_rate": 1.3360841874255034e-05, "epoch": 0.6540956238539642, "percentage": 65.41, "elapsed_time": "4 days, 13:58:25", "remaining_time": "2 days, 10:08:36", "throughput": 2724.75, "total_tokens": 1078744128} {"current_steps": 5976, "total_steps": 9134, "loss": 0.6272, "learning_rate": 1.3353232670372173e-05, "epoch": 0.6542050959249022, "percentage": 65.43, "elapsed_time": "4 days, 13:59:30", "remaining_time": "2 days, 10:07:29", "throughput": 2724.76, "total_tokens": 1078921984} {"current_steps": 5977, "total_steps": 9134, "loss": 0.9028, "learning_rate": 1.3345624844279611e-05, "epoch": 0.6543145679958401, "percentage": 65.44, "elapsed_time": "4 days, 14:00:36", "remaining_time": "2 days, 10:06:23", "throughput": 2724.75, "total_tokens": 1079100960} {"current_steps": 5978, "total_steps": 9134, "loss": 0.7619, "learning_rate": 1.3338018396877371e-05, "epoch": 0.654424040066778, "percentage": 65.45, "elapsed_time": "4 days, 14:01:38", "remaining_time": "2 days, 10:05:14", "throughput": 2724.68, "total_tokens": 1079241184} {"current_steps": 5979, "total_steps": 9134, "loss": 0.8663, "learning_rate": 1.3330413329065238e-05, "epoch": 0.6545335121377158, "percentage": 65.46, "elapsed_time": "4 days, 14:02:39", "remaining_time": "2 days, 10:04:05", "throughput": 2724.65, "total_tokens": 1079394400} {"current_steps": 5980, "total_steps": 9134, "loss": 0.6069, "learning_rate": 1.3322809641742917e-05, "epoch": 0.6546429842086537, "percentage": 65.47, "elapsed_time": "4 days, 14:03:43", "remaining_time": "2 days, 10:02:58", "throughput": 2724.57, "total_tokens": 1079540672} {"current_steps": 5981, "total_steps": 9134, "loss": 0.9535, "learning_rate": 1.3315207335809888e-05, "epoch": 0.6547524562795917, "percentage": 65.48, "elapsed_time": "4 days, 14:04:44", "remaining_time": "2 days, 10:01:49", "throughput": 2724.53, "total_tokens": 1079689856} {"current_steps": 5982, "total_steps": 9134, "loss": 0.8527, "learning_rate": 1.3307606412165491e-05, "epoch": 0.6548619283505296, "percentage": 65.49, "elapsed_time": "4 days, 14:05:51", "remaining_time": "2 days, 10:00:43", "throughput": 2724.56, "total_tokens": 1079883616} {"current_steps": 5983, "total_steps": 9134, "loss": 0.8021, "learning_rate": 1.3300006871708905e-05, "epoch": 0.6549714004214675, "percentage": 65.5, "elapsed_time": "4 days, 14:06:58", "remaining_time": "2 days, 9:59:37", "throughput": 2724.55, "total_tokens": 1080059904} {"current_steps": 5984, "total_steps": 9134, "loss": 0.7427, "learning_rate": 1.3292408715339141e-05, "epoch": 0.6550808724924054, "percentage": 65.51, "elapsed_time": "4 days, 14:08:06", "remaining_time": "2 days, 9:58:31", "throughput": 2724.56, "total_tokens": 1080251648} {"current_steps": 5985, "total_steps": 9134, "loss": 0.7652, "learning_rate": 1.3284811943955045e-05, "epoch": 0.6551903445633432, "percentage": 65.52, "elapsed_time": "4 days, 14:09:13", "remaining_time": "2 days, 9:57:26", "throughput": 2724.6, "total_tokens": 1080447424} {"current_steps": 5986, "total_steps": 9134, "loss": 0.8264, "learning_rate": 1.32772165584553e-05, "epoch": 0.6552998166342812, "percentage": 65.54, "elapsed_time": "4 days, 14:10:17", "remaining_time": "2 days, 9:56:18", "throughput": 2724.53, "total_tokens": 1080598176} {"current_steps": 5987, "total_steps": 9134, "loss": 0.9441, "learning_rate": 1.3269622559738416e-05, "epoch": 0.6554092887052191, "percentage": 65.55, "elapsed_time": "4 days, 14:11:23", "remaining_time": "2 days, 9:55:12", "throughput": 2724.52, "total_tokens": 1080771552} {"current_steps": 5988, "total_steps": 9134, "loss": 0.7342, "learning_rate": 1.3262029948702766e-05, "epoch": 0.655518760776157, "percentage": 65.56, "elapsed_time": "4 days, 14:12:32", "remaining_time": "2 days, 9:54:07", "throughput": 2724.54, "total_tokens": 1080969120} {"current_steps": 5989, "total_steps": 9134, "loss": 0.8244, "learning_rate": 1.3254438726246537e-05, "epoch": 0.6556282328470949, "percentage": 65.57, "elapsed_time": "4 days, 14:13:36", "remaining_time": "2 days, 9:52:59", "throughput": 2724.54, "total_tokens": 1081140704} {"current_steps": 5990, "total_steps": 9134, "loss": 0.6652, "learning_rate": 1.3246848893267749e-05, "epoch": 0.6557377049180327, "percentage": 65.58, "elapsed_time": "4 days, 14:14:41", "remaining_time": "2 days, 9:51:53", "throughput": 2724.5, "total_tokens": 1081303104} {"current_steps": 5991, "total_steps": 9134, "loss": 0.7169, "learning_rate": 1.3239260450664275e-05, "epoch": 0.6558471769889707, "percentage": 65.59, "elapsed_time": "4 days, 14:15:47", "remaining_time": "2 days, 9:50:46", "throughput": 2724.53, "total_tokens": 1081493280} {"current_steps": 5992, "total_steps": 9134, "loss": 0.6045, "learning_rate": 1.3231673399333802e-05, "epoch": 0.6559566490599086, "percentage": 65.6, "elapsed_time": "4 days, 14:16:55", "remaining_time": "2 days, 9:49:41", "throughput": 2724.56, "total_tokens": 1081690848} {"current_steps": 5993, "total_steps": 9134, "loss": 0.7478, "learning_rate": 1.3224087740173871e-05, "epoch": 0.6560661211308465, "percentage": 65.61, "elapsed_time": "4 days, 14:18:00", "remaining_time": "2 days, 9:48:34", "throughput": 2724.54, "total_tokens": 1081861088} {"current_steps": 5994, "total_steps": 9134, "loss": 0.6801, "learning_rate": 1.3216503474081838e-05, "epoch": 0.6561755932017844, "percentage": 65.62, "elapsed_time": "4 days, 14:19:00", "remaining_time": "2 days, 9:47:24", "throughput": 2724.45, "total_tokens": 1081991232} {"current_steps": 5995, "total_steps": 9134, "loss": 0.7745, "learning_rate": 1.3208920601954938e-05, "epoch": 0.6562850652727223, "percentage": 65.63, "elapsed_time": "4 days, 14:20:10", "remaining_time": "2 days, 9:46:20", "throughput": 2724.54, "total_tokens": 1082214112} {"current_steps": 5996, "total_steps": 9134, "loss": 0.88, "learning_rate": 1.320133912469017e-05, "epoch": 0.6563945373436602, "percentage": 65.64, "elapsed_time": "4 days, 14:21:16", "remaining_time": "2 days, 9:45:14", "throughput": 2724.52, "total_tokens": 1082385472} {"current_steps": 5997, "total_steps": 9134, "loss": 0.7173, "learning_rate": 1.3193759043184437e-05, "epoch": 0.6565040094145981, "percentage": 65.66, "elapsed_time": "4 days, 14:22:20", "remaining_time": "2 days, 9:44:06", "throughput": 2724.5, "total_tokens": 1082553472} {"current_steps": 5998, "total_steps": 9134, "loss": 0.8104, "learning_rate": 1.318618035833444e-05, "epoch": 0.656613481485536, "percentage": 65.67, "elapsed_time": "4 days, 14:23:27", "remaining_time": "2 days, 9:43:00", "throughput": 2724.49, "total_tokens": 1082733568} {"current_steps": 5999, "total_steps": 9134, "loss": 0.8061, "learning_rate": 1.317860307103672e-05, "epoch": 0.6567229535564739, "percentage": 65.68, "elapsed_time": "4 days, 14:24:35", "remaining_time": "2 days, 9:41:55", "throughput": 2724.48, "total_tokens": 1082915904} {"current_steps": 6000, "total_steps": 9134, "loss": 0.6742, "learning_rate": 1.3171027182187665e-05, "epoch": 0.6568324256274118, "percentage": 65.69, "elapsed_time": "4 days, 14:25:42", "remaining_time": "2 days, 9:40:49", "throughput": 2724.5, "total_tokens": 1083104288} {"current_steps": 6001, "total_steps": 9134, "loss": 0.6619, "learning_rate": 1.3163452692683465e-05, "epoch": 0.6569418976983498, "percentage": 65.7, "elapsed_time": "4 days, 14:29:17", "remaining_time": "2 days, 9:41:01", "throughput": 2723.53, "total_tokens": 1083305888} {"current_steps": 6002, "total_steps": 9134, "loss": 0.6062, "learning_rate": 1.3155879603420207e-05, "epoch": 0.6570513697692876, "percentage": 65.71, "elapsed_time": "4 days, 14:30:18", "remaining_time": "2 days, 9:39:52", "throughput": 2723.5, "total_tokens": 1083458208} {"current_steps": 6003, "total_steps": 9134, "loss": 0.6019, "learning_rate": 1.3148307915293728e-05, "epoch": 0.6571608418402255, "percentage": 65.72, "elapsed_time": "4 days, 14:31:27", "remaining_time": "2 days, 9:38:46", "throughput": 2723.51, "total_tokens": 1083650176} {"current_steps": 6004, "total_steps": 9134, "loss": 0.7772, "learning_rate": 1.3140737629199787e-05, "epoch": 0.6572703139111634, "percentage": 65.73, "elapsed_time": "4 days, 14:32:33", "remaining_time": "2 days, 9:37:40", "throughput": 2723.53, "total_tokens": 1083837216} {"current_steps": 6005, "total_steps": 9134, "loss": 0.8285, "learning_rate": 1.3133168746033895e-05, "epoch": 0.6573797859821013, "percentage": 65.74, "elapsed_time": "4 days, 14:33:36", "remaining_time": "2 days, 9:36:32", "throughput": 2723.5, "total_tokens": 1083997152} {"current_steps": 6006, "total_steps": 9134, "loss": 0.8265, "learning_rate": 1.3125601266691462e-05, "epoch": 0.6574892580530393, "percentage": 65.75, "elapsed_time": "4 days, 14:34:39", "remaining_time": "2 days, 9:35:24", "throughput": 2723.52, "total_tokens": 1084179264} {"current_steps": 6007, "total_steps": 9134, "loss": 0.8466, "learning_rate": 1.3118035192067702e-05, "epoch": 0.6575987301239771, "percentage": 65.77, "elapsed_time": "4 days, 14:35:46", "remaining_time": "2 days, 9:34:19", "throughput": 2723.5, "total_tokens": 1084351968} {"current_steps": 6008, "total_steps": 9134, "loss": 0.7496, "learning_rate": 1.311047052305766e-05, "epoch": 0.657708202194915, "percentage": 65.78, "elapsed_time": "4 days, 14:36:55", "remaining_time": "2 days, 9:33:13", "throughput": 2723.54, "total_tokens": 1084554464} {"current_steps": 6009, "total_steps": 9134, "loss": 0.5124, "learning_rate": 1.310290726055623e-05, "epoch": 0.6578176742658529, "percentage": 65.79, "elapsed_time": "4 days, 14:38:00", "remaining_time": "2 days, 9:32:07", "throughput": 2723.52, "total_tokens": 1084725152} {"current_steps": 6010, "total_steps": 9134, "loss": 0.6117, "learning_rate": 1.3095345405458115e-05, "epoch": 0.6579271463367908, "percentage": 65.8, "elapsed_time": "4 days, 14:39:02", "remaining_time": "2 days, 9:30:58", "throughput": 2723.48, "total_tokens": 1084877248} {"current_steps": 6011, "total_steps": 9134, "loss": 0.7874, "learning_rate": 1.30877849586579e-05, "epoch": 0.6580366184077288, "percentage": 65.81, "elapsed_time": "4 days, 14:40:07", "remaining_time": "2 days, 9:29:51", "throughput": 2723.44, "total_tokens": 1085038752} {"current_steps": 6012, "total_steps": 9134, "loss": 0.6582, "learning_rate": 1.3080225921049938e-05, "epoch": 0.6581460904786667, "percentage": 65.82, "elapsed_time": "4 days, 14:41:09", "remaining_time": "2 days, 9:28:42", "throughput": 2723.38, "total_tokens": 1085184800} {"current_steps": 6013, "total_steps": 9134, "loss": 1.0005, "learning_rate": 1.3072668293528467e-05, "epoch": 0.6582555625496045, "percentage": 65.83, "elapsed_time": "4 days, 14:42:15", "remaining_time": "2 days, 9:27:36", "throughput": 2723.44, "total_tokens": 1085387968} {"current_steps": 6014, "total_steps": 9134, "loss": 0.7605, "learning_rate": 1.306511207698754e-05, "epoch": 0.6583650346205424, "percentage": 65.84, "elapsed_time": "4 days, 14:43:20", "remaining_time": "2 days, 9:26:29", "throughput": 2723.46, "total_tokens": 1085574112} {"current_steps": 6015, "total_steps": 9134, "loss": 0.7655, "learning_rate": 1.3057557272321036e-05, "epoch": 0.6584745066914803, "percentage": 65.85, "elapsed_time": "4 days, 14:44:25", "remaining_time": "2 days, 9:25:22", "throughput": 2723.44, "total_tokens": 1085742112} {"current_steps": 6016, "total_steps": 9134, "loss": 0.7383, "learning_rate": 1.3050003880422676e-05, "epoch": 0.6585839787624183, "percentage": 65.86, "elapsed_time": "4 days, 14:45:31", "remaining_time": "2 days, 9:24:16", "throughput": 2723.47, "total_tokens": 1085933408} {"current_steps": 6017, "total_steps": 9134, "loss": 0.9374, "learning_rate": 1.3042451902186012e-05, "epoch": 0.6586934508333562, "percentage": 65.87, "elapsed_time": "4 days, 14:46:33", "remaining_time": "2 days, 9:23:07", "throughput": 2723.44, "total_tokens": 1086089312} {"current_steps": 6018, "total_steps": 9134, "loss": 0.7916, "learning_rate": 1.303490133850443e-05, "epoch": 0.6588029229042941, "percentage": 65.89, "elapsed_time": "4 days, 14:47:34", "remaining_time": "2 days, 9:21:58", "throughput": 2723.36, "total_tokens": 1086225952} {"current_steps": 6019, "total_steps": 9134, "loss": 0.8897, "learning_rate": 1.3027352190271136e-05, "epoch": 0.6589123949752319, "percentage": 65.9, "elapsed_time": "4 days, 14:48:39", "remaining_time": "2 days, 9:20:52", "throughput": 2723.39, "total_tokens": 1086415008} {"current_steps": 6020, "total_steps": 9134, "loss": 0.6153, "learning_rate": 1.3019804458379204e-05, "epoch": 0.6590218670461698, "percentage": 65.91, "elapsed_time": "4 days, 14:49:38", "remaining_time": "2 days, 9:19:42", "throughput": 2723.34, "total_tokens": 1086553888} {"current_steps": 6021, "total_steps": 9134, "loss": 0.7156, "learning_rate": 1.3012258143721499e-05, "epoch": 0.6591313391171078, "percentage": 65.92, "elapsed_time": "4 days, 14:50:43", "remaining_time": "2 days, 9:18:34", "throughput": 2723.33, "total_tokens": 1086725248} {"current_steps": 6022, "total_steps": 9134, "loss": 0.8381, "learning_rate": 1.3004713247190736e-05, "epoch": 0.6592408111880457, "percentage": 65.93, "elapsed_time": "4 days, 14:51:47", "remaining_time": "2 days, 9:17:27", "throughput": 2723.38, "total_tokens": 1086923936} {"current_steps": 6023, "total_steps": 9134, "loss": 0.6207, "learning_rate": 1.2997169769679468e-05, "epoch": 0.6593502832589836, "percentage": 65.94, "elapsed_time": "4 days, 14:52:50", "remaining_time": "2 days, 9:16:19", "throughput": 2723.35, "total_tokens": 1087081408} {"current_steps": 6024, "total_steps": 9134, "loss": 0.8838, "learning_rate": 1.298962771208007e-05, "epoch": 0.6594597553299214, "percentage": 65.95, "elapsed_time": "4 days, 14:53:57", "remaining_time": "2 days, 9:15:13", "throughput": 2723.36, "total_tokens": 1087266208} {"current_steps": 6025, "total_steps": 9134, "loss": 0.8405, "learning_rate": 1.2982087075284754e-05, "epoch": 0.6595692274008593, "percentage": 65.96, "elapsed_time": "4 days, 14:54:59", "remaining_time": "2 days, 9:14:05", "throughput": 2723.32, "total_tokens": 1087421440} {"current_steps": 6026, "total_steps": 9134, "loss": 0.6128, "learning_rate": 1.2974547860185566e-05, "epoch": 0.6596786994717972, "percentage": 65.97, "elapsed_time": "4 days, 14:56:05", "remaining_time": "2 days, 9:12:58", "throughput": 2723.35, "total_tokens": 1087608928} {"current_steps": 6027, "total_steps": 9134, "loss": 0.888, "learning_rate": 1.2967010067674362e-05, "epoch": 0.6597881715427352, "percentage": 65.98, "elapsed_time": "4 days, 14:57:10", "remaining_time": "2 days, 9:11:51", "throughput": 2723.32, "total_tokens": 1087778048} {"current_steps": 6028, "total_steps": 9134, "loss": 0.7787, "learning_rate": 1.2959473698642888e-05, "epoch": 0.6598976436136731, "percentage": 66.0, "elapsed_time": "4 days, 14:58:18", "remaining_time": "2 days, 9:10:46", "throughput": 2723.42, "total_tokens": 1088002944} {"current_steps": 6029, "total_steps": 9134, "loss": 0.8233, "learning_rate": 1.2951938753982634e-05, "epoch": 0.660007115684611, "percentage": 66.01, "elapsed_time": "4 days, 14:59:24", "remaining_time": "2 days, 9:09:40", "throughput": 2723.45, "total_tokens": 1088193344} {"current_steps": 6030, "total_steps": 9134, "loss": 0.7897, "learning_rate": 1.2944405234585005e-05, "epoch": 0.6601165877555488, "percentage": 66.02, "elapsed_time": "4 days, 15:00:32", "remaining_time": "2 days, 9:08:34", "throughput": 2723.44, "total_tokens": 1088376352} {"current_steps": 6031, "total_steps": 9134, "loss": 0.9002, "learning_rate": 1.293687314134119e-05, "epoch": 0.6602260598264867, "percentage": 66.03, "elapsed_time": "4 days, 15:01:39", "remaining_time": "2 days, 9:07:28", "throughput": 2723.42, "total_tokens": 1088548832} {"current_steps": 6032, "total_steps": 9134, "loss": 0.7395, "learning_rate": 1.2929342475142225e-05, "epoch": 0.6603355318974247, "percentage": 66.04, "elapsed_time": "4 days, 15:02:44", "remaining_time": "2 days, 9:06:21", "throughput": 2723.43, "total_tokens": 1088729824} {"current_steps": 6033, "total_steps": 9134, "loss": 0.5672, "learning_rate": 1.2921813236878965e-05, "epoch": 0.6604450039683626, "percentage": 66.05, "elapsed_time": "4 days, 15:03:51", "remaining_time": "2 days, 9:05:15", "throughput": 2723.45, "total_tokens": 1088920896} {"current_steps": 6034, "total_steps": 9134, "loss": 0.6098, "learning_rate": 1.2914285427442102e-05, "epoch": 0.6605544760393005, "percentage": 66.06, "elapsed_time": "4 days, 15:04:56", "remaining_time": "2 days, 9:04:08", "throughput": 2723.46, "total_tokens": 1089099424} {"current_steps": 6035, "total_steps": 9134, "loss": 0.6151, "learning_rate": 1.290675904772219e-05, "epoch": 0.6606639481102384, "percentage": 66.07, "elapsed_time": "4 days, 15:05:57", "remaining_time": "2 days, 9:02:59", "throughput": 2723.41, "total_tokens": 1089247712} {"current_steps": 6036, "total_steps": 9134, "loss": 0.8356, "learning_rate": 1.2899234098609541e-05, "epoch": 0.6607734201811762, "percentage": 66.08, "elapsed_time": "4 days, 15:07:03", "remaining_time": "2 days, 9:01:53", "throughput": 2723.46, "total_tokens": 1089447072} {"current_steps": 6037, "total_steps": 9134, "loss": 0.8525, "learning_rate": 1.2891710580994387e-05, "epoch": 0.6608828922521142, "percentage": 66.09, "elapsed_time": "4 days, 15:08:10", "remaining_time": "2 days, 9:00:47", "throughput": 2723.48, "total_tokens": 1089637472} {"current_steps": 6038, "total_steps": 9134, "loss": 0.7664, "learning_rate": 1.2884188495766709e-05, "epoch": 0.6609923643230521, "percentage": 66.1, "elapsed_time": "4 days, 15:09:16", "remaining_time": "2 days, 8:59:41", "throughput": 2723.53, "total_tokens": 1089835488} {"current_steps": 6039, "total_steps": 9134, "loss": 1.2275, "learning_rate": 1.2876667843816373e-05, "epoch": 0.66110183639399, "percentage": 66.12, "elapsed_time": "4 days, 15:10:25", "remaining_time": "2 days, 8:58:36", "throughput": 2723.61, "total_tokens": 1090055680} {"current_steps": 6040, "total_steps": 9134, "loss": 0.8112, "learning_rate": 1.2869148626033059e-05, "epoch": 0.6612113084649279, "percentage": 66.13, "elapsed_time": "4 days, 15:11:33", "remaining_time": "2 days, 8:57:30", "throughput": 2723.62, "total_tokens": 1090246752} {"current_steps": 6041, "total_steps": 9134, "loss": 0.7249, "learning_rate": 1.2861630843306271e-05, "epoch": 0.6613207805358657, "percentage": 66.14, "elapsed_time": "4 days, 15:12:36", "remaining_time": "2 days, 8:56:22", "throughput": 2723.61, "total_tokens": 1090412960} {"current_steps": 6042, "total_steps": 9134, "loss": 0.7935, "learning_rate": 1.285411449652535e-05, "epoch": 0.6614302526068037, "percentage": 66.15, "elapsed_time": "4 days, 15:13:39", "remaining_time": "2 days, 8:55:15", "throughput": 2723.54, "total_tokens": 1090557216} {"current_steps": 6043, "total_steps": 9134, "loss": 0.9119, "learning_rate": 1.2846599586579456e-05, "epoch": 0.6615397246777416, "percentage": 66.16, "elapsed_time": "4 days, 15:14:48", "remaining_time": "2 days, 8:54:09", "throughput": 2723.51, "total_tokens": 1090734176} {"current_steps": 6044, "total_steps": 9134, "loss": 0.7617, "learning_rate": 1.2839086114357617e-05, "epoch": 0.6616491967486795, "percentage": 66.17, "elapsed_time": "4 days, 15:15:52", "remaining_time": "2 days, 8:53:02", "throughput": 2723.5, "total_tokens": 1090902848} {"current_steps": 6045, "total_steps": 9134, "loss": 0.9162, "learning_rate": 1.2831574080748621e-05, "epoch": 0.6617586688196174, "percentage": 66.18, "elapsed_time": "4 days, 15:16:56", "remaining_time": "2 days, 8:51:55", "throughput": 2723.51, "total_tokens": 1091081824} {"current_steps": 6046, "total_steps": 9134, "loss": 0.7773, "learning_rate": 1.2824063486641172e-05, "epoch": 0.6618681408905553, "percentage": 66.19, "elapsed_time": "4 days, 15:17:59", "remaining_time": "2 days, 8:50:47", "throughput": 2723.51, "total_tokens": 1091254528} {"current_steps": 6047, "total_steps": 9134, "loss": 0.6688, "learning_rate": 1.2816554332923714e-05, "epoch": 0.6619776129614932, "percentage": 66.2, "elapsed_time": "4 days, 15:19:04", "remaining_time": "2 days, 8:49:40", "throughput": 2723.54, "total_tokens": 1091445152} {"current_steps": 6048, "total_steps": 9134, "loss": 0.7595, "learning_rate": 1.28090466204846e-05, "epoch": 0.6620870850324311, "percentage": 66.21, "elapsed_time": "4 days, 15:20:12", "remaining_time": "2 days, 8:48:35", "throughput": 2723.53, "total_tokens": 1091625024} {"current_steps": 6049, "total_steps": 9134, "loss": 0.8138, "learning_rate": 1.2801540350211963e-05, "epoch": 0.662196557103369, "percentage": 66.23, "elapsed_time": "4 days, 15:21:19", "remaining_time": "2 days, 8:47:29", "throughput": 2723.5, "total_tokens": 1091793248} {"current_steps": 6050, "total_steps": 9134, "loss": 0.7339, "learning_rate": 1.2794035522993785e-05, "epoch": 0.6623060291743069, "percentage": 66.24, "elapsed_time": "4 days, 15:22:26", "remaining_time": "2 days, 8:46:23", "throughput": 2723.51, "total_tokens": 1091982752} {"current_steps": 6051, "total_steps": 9134, "loss": 0.7657, "learning_rate": 1.2786532139717872e-05, "epoch": 0.6624155012452448, "percentage": 66.25, "elapsed_time": "4 days, 15:23:32", "remaining_time": "2 days, 8:45:16", "throughput": 2723.52, "total_tokens": 1092163072} {"current_steps": 6052, "total_steps": 9134, "loss": 0.6465, "learning_rate": 1.2779030201271846e-05, "epoch": 0.6625249733161828, "percentage": 66.26, "elapsed_time": "4 days, 15:24:36", "remaining_time": "2 days, 8:44:09", "throughput": 2723.5, "total_tokens": 1092331744} {"current_steps": 6053, "total_steps": 9134, "loss": 0.7728, "learning_rate": 1.2771529708543203e-05, "epoch": 0.6626344453871206, "percentage": 66.27, "elapsed_time": "4 days, 15:25:43", "remaining_time": "2 days, 8:43:03", "throughput": 2723.49, "total_tokens": 1092510496} {"current_steps": 6054, "total_steps": 9134, "loss": 0.8976, "learning_rate": 1.2764030662419201e-05, "epoch": 0.6627439174580585, "percentage": 66.28, "elapsed_time": "4 days, 15:26:47", "remaining_time": "2 days, 8:41:56", "throughput": 2723.51, "total_tokens": 1092694400} {"current_steps": 6055, "total_steps": 9134, "loss": 0.6845, "learning_rate": 1.2756533063786991e-05, "epoch": 0.6628533895289964, "percentage": 66.29, "elapsed_time": "4 days, 15:27:48", "remaining_time": "2 days, 8:40:47", "throughput": 2723.45, "total_tokens": 1092833280} {"current_steps": 6056, "total_steps": 9134, "loss": 0.8025, "learning_rate": 1.2749036913533514e-05, "epoch": 0.6629628615999343, "percentage": 66.3, "elapsed_time": "4 days, 15:28:47", "remaining_time": "2 days, 8:39:37", "throughput": 2723.4, "total_tokens": 1092973728} {"current_steps": 6057, "total_steps": 9134, "loss": 0.6519, "learning_rate": 1.2741542212545549e-05, "epoch": 0.6630723336708723, "percentage": 66.31, "elapsed_time": "4 days, 15:29:52", "remaining_time": "2 days, 8:38:30", "throughput": 2723.4, "total_tokens": 1093153152} {"current_steps": 6058, "total_steps": 9134, "loss": 1.0345, "learning_rate": 1.2734048961709707e-05, "epoch": 0.6631818057418101, "percentage": 66.32, "elapsed_time": "4 days, 15:30:59", "remaining_time": "2 days, 8:37:24", "throughput": 2723.46, "total_tokens": 1093359232} {"current_steps": 6059, "total_steps": 9134, "loss": 0.6562, "learning_rate": 1.2726557161912425e-05, "epoch": 0.663291277812748, "percentage": 66.33, "elapsed_time": "4 days, 15:32:04", "remaining_time": "2 days, 8:36:17", "throughput": 2723.44, "total_tokens": 1093529248} {"current_steps": 6060, "total_steps": 9134, "loss": 0.8941, "learning_rate": 1.2719066814039957e-05, "epoch": 0.6634007498836859, "percentage": 66.35, "elapsed_time": "4 days, 15:33:13", "remaining_time": "2 days, 8:35:12", "throughput": 2723.53, "total_tokens": 1093752352} {"current_steps": 6061, "total_steps": 9134, "loss": 0.7756, "learning_rate": 1.2711577918978417e-05, "epoch": 0.6635102219546238, "percentage": 66.36, "elapsed_time": "4 days, 15:34:21", "remaining_time": "2 days, 8:34:07", "throughput": 2723.52, "total_tokens": 1093933792} {"current_steps": 6062, "total_steps": 9134, "loss": 0.7306, "learning_rate": 1.270409047761372e-05, "epoch": 0.6636196940255618, "percentage": 66.37, "elapsed_time": "4 days, 15:35:24", "remaining_time": "2 days, 8:32:59", "throughput": 2723.49, "total_tokens": 1094094624} {"current_steps": 6063, "total_steps": 9134, "loss": 0.7176, "learning_rate": 1.2696604490831609e-05, "epoch": 0.6637291660964997, "percentage": 66.38, "elapsed_time": "4 days, 15:36:29", "remaining_time": "2 days, 8:31:52", "throughput": 2723.46, "total_tokens": 1094254336} {"current_steps": 6064, "total_steps": 9134, "loss": 0.6973, "learning_rate": 1.268911995951767e-05, "epoch": 0.6638386381674375, "percentage": 66.39, "elapsed_time": "4 days, 15:37:36", "remaining_time": "2 days, 8:30:46", "throughput": 2723.52, "total_tokens": 1094463552} {"current_steps": 6065, "total_steps": 9134, "loss": 0.9368, "learning_rate": 1.2681636884557307e-05, "epoch": 0.6639481102383754, "percentage": 66.4, "elapsed_time": "4 days, 15:38:45", "remaining_time": "2 days, 8:29:41", "throughput": 2723.58, "total_tokens": 1094674784} {"current_steps": 6066, "total_steps": 9134, "loss": 0.5613, "learning_rate": 1.2674155266835753e-05, "epoch": 0.6640575823093133, "percentage": 66.41, "elapsed_time": "4 days, 15:39:47", "remaining_time": "2 days, 8:28:33", "throughput": 2723.56, "total_tokens": 1094836960} {"current_steps": 6067, "total_steps": 9134, "loss": 0.9068, "learning_rate": 1.2666675107238052e-05, "epoch": 0.6641670543802513, "percentage": 66.42, "elapsed_time": "4 days, 15:40:52", "remaining_time": "2 days, 8:27:26", "throughput": 2723.52, "total_tokens": 1094999136} {"current_steps": 6068, "total_steps": 9134, "loss": 0.904, "learning_rate": 1.2659196406649132e-05, "epoch": 0.6642765264511892, "percentage": 66.43, "elapsed_time": "4 days, 15:41:55", "remaining_time": "2 days, 8:26:18", "throughput": 2723.51, "total_tokens": 1095162432} {"current_steps": 6069, "total_steps": 9134, "loss": 0.7755, "learning_rate": 1.2651719165953666e-05, "epoch": 0.6643859985221271, "percentage": 66.44, "elapsed_time": "4 days, 15:42:56", "remaining_time": "2 days, 8:25:09", "throughput": 2723.47, "total_tokens": 1095314528} {"current_steps": 6070, "total_steps": 9134, "loss": 0.9319, "learning_rate": 1.2644243386036234e-05, "epoch": 0.6644954705930649, "percentage": 66.46, "elapsed_time": "4 days, 15:44:04", "remaining_time": "2 days, 8:24:03", "throughput": 2723.5, "total_tokens": 1095510080} {"current_steps": 6071, "total_steps": 9134, "loss": 0.6669, "learning_rate": 1.2636769067781173e-05, "epoch": 0.6646049426640028, "percentage": 66.47, "elapsed_time": "4 days, 15:45:12", "remaining_time": "2 days, 8:22:58", "throughput": 2723.56, "total_tokens": 1095724896} {"current_steps": 6072, "total_steps": 9134, "loss": 0.7786, "learning_rate": 1.2629296212072703e-05, "epoch": 0.6647144147349408, "percentage": 66.48, "elapsed_time": "4 days, 15:46:17", "remaining_time": "2 days, 8:21:51", "throughput": 2723.58, "total_tokens": 1095908128} {"current_steps": 6073, "total_steps": 9134, "loss": 0.9956, "learning_rate": 1.2621824819794845e-05, "epoch": 0.6648238868058787, "percentage": 66.49, "elapsed_time": "4 days, 15:47:24", "remaining_time": "2 days, 8:20:45", "throughput": 2723.58, "total_tokens": 1096087328} {"current_steps": 6074, "total_steps": 9134, "loss": 0.6956, "learning_rate": 1.2614354891831437e-05, "epoch": 0.6649333588768166, "percentage": 66.5, "elapsed_time": "4 days, 15:48:31", "remaining_time": "2 days, 8:19:40", "throughput": 2723.62, "total_tokens": 1096290272} {"current_steps": 6075, "total_steps": 9134, "loss": 0.7308, "learning_rate": 1.2606886429066186e-05, "epoch": 0.6650428309477544, "percentage": 66.51, "elapsed_time": "4 days, 15:49:36", "remaining_time": "2 days, 8:18:33", "throughput": 2723.6, "total_tokens": 1096457152} {"current_steps": 6076, "total_steps": 9134, "loss": 1.0721, "learning_rate": 1.2599419432382561e-05, "epoch": 0.6651523030186923, "percentage": 66.52, "elapsed_time": "4 days, 15:50:45", "remaining_time": "2 days, 8:17:28", "throughput": 2723.66, "total_tokens": 1096669952} {"current_steps": 6077, "total_steps": 9134, "loss": 0.8268, "learning_rate": 1.259195390266393e-05, "epoch": 0.6652617750896302, "percentage": 66.53, "elapsed_time": "4 days, 15:51:53", "remaining_time": "2 days, 8:16:22", "throughput": 2723.7, "total_tokens": 1096871776} {"current_steps": 6078, "total_steps": 9134, "loss": 0.7313, "learning_rate": 1.2584489840793414e-05, "epoch": 0.6653712471605682, "percentage": 66.54, "elapsed_time": "4 days, 15:53:01", "remaining_time": "2 days, 8:15:17", "throughput": 2723.77, "total_tokens": 1097084128} {"current_steps": 6079, "total_steps": 9134, "loss": 0.8143, "learning_rate": 1.2577027247654033e-05, "epoch": 0.6654807192315061, "percentage": 66.55, "elapsed_time": "4 days, 15:54:10", "remaining_time": "2 days, 8:14:12", "throughput": 2723.75, "total_tokens": 1097262880} {"current_steps": 6080, "total_steps": 9134, "loss": 0.8541, "learning_rate": 1.2569566124128563e-05, "epoch": 0.665590191302444, "percentage": 66.56, "elapsed_time": "4 days, 15:55:12", "remaining_time": "2 days, 8:13:04", "throughput": 2723.73, "total_tokens": 1097426400} {"current_steps": 6081, "total_steps": 9134, "loss": 0.7082, "learning_rate": 1.2562106471099667e-05, "epoch": 0.6656996633733818, "percentage": 66.58, "elapsed_time": "4 days, 15:56:20", "remaining_time": "2 days, 8:11:58", "throughput": 2723.73, "total_tokens": 1097608064} {"current_steps": 6082, "total_steps": 9134, "loss": 0.6727, "learning_rate": 1.2554648289449798e-05, "epoch": 0.6658091354443197, "percentage": 66.59, "elapsed_time": "4 days, 15:57:28", "remaining_time": "2 days, 8:10:53", "throughput": 2723.78, "total_tokens": 1097815264} {"current_steps": 6083, "total_steps": 9134, "loss": 0.653, "learning_rate": 1.254719158006124e-05, "epoch": 0.6659186075152577, "percentage": 66.6, "elapsed_time": "4 days, 15:58:31", "remaining_time": "2 days, 8:09:45", "throughput": 2723.74, "total_tokens": 1097969824} {"current_steps": 6084, "total_steps": 9134, "loss": 0.8874, "learning_rate": 1.253973634381612e-05, "epoch": 0.6660280795861956, "percentage": 66.61, "elapsed_time": "4 days, 15:59:35", "remaining_time": "2 days, 8:08:37", "throughput": 2723.71, "total_tokens": 1098132224} {"current_steps": 6085, "total_steps": 9134, "loss": 0.5278, "learning_rate": 1.2532282581596355e-05, "epoch": 0.6661375516571335, "percentage": 66.62, "elapsed_time": "4 days, 16:00:42", "remaining_time": "2 days, 8:07:32", "throughput": 2723.72, "total_tokens": 1098320832} {"current_steps": 6086, "total_steps": 9134, "loss": 0.9085, "learning_rate": 1.2524830294283748e-05, "epoch": 0.6662470237280714, "percentage": 66.63, "elapsed_time": "4 days, 16:01:47", "remaining_time": "2 days, 8:06:25", "throughput": 2723.7, "total_tokens": 1098487040} {"current_steps": 6087, "total_steps": 9134, "loss": 0.8951, "learning_rate": 1.251737948275985e-05, "epoch": 0.6663564957990092, "percentage": 66.64, "elapsed_time": "4 days, 16:02:56", "remaining_time": "2 days, 8:05:19", "throughput": 2723.74, "total_tokens": 1098690208} {"current_steps": 6088, "total_steps": 9134, "loss": 0.9142, "learning_rate": 1.2509930147906107e-05, "epoch": 0.6664659678699472, "percentage": 66.65, "elapsed_time": "4 days, 16:04:01", "remaining_time": "2 days, 8:04:13", "throughput": 2723.77, "total_tokens": 1098881728} {"current_steps": 6089, "total_steps": 9134, "loss": 0.8937, "learning_rate": 1.2502482290603748e-05, "epoch": 0.6665754399408851, "percentage": 66.66, "elapsed_time": "4 days, 16:05:10", "remaining_time": "2 days, 8:03:08", "throughput": 2723.84, "total_tokens": 1099098336} {"current_steps": 6090, "total_steps": 9134, "loss": 0.9336, "learning_rate": 1.2495035911733844e-05, "epoch": 0.666684912011823, "percentage": 66.67, "elapsed_time": "4 days, 16:06:15", "remaining_time": "2 days, 8:02:01", "throughput": 2723.88, "total_tokens": 1099292544} {"current_steps": 6091, "total_steps": 9134, "loss": 0.911, "learning_rate": 1.2487591012177285e-05, "epoch": 0.6667943840827609, "percentage": 66.68, "elapsed_time": "4 days, 16:07:24", "remaining_time": "2 days, 8:00:56", "throughput": 2723.93, "total_tokens": 1099497952} {"current_steps": 6092, "total_steps": 9134, "loss": 0.8022, "learning_rate": 1.2480147592814791e-05, "epoch": 0.6669038561536987, "percentage": 66.7, "elapsed_time": "4 days, 16:08:27", "remaining_time": "2 days, 7:59:48", "throughput": 2723.87, "total_tokens": 1099647584} {"current_steps": 6093, "total_steps": 9134, "loss": 0.635, "learning_rate": 1.2472705654526904e-05, "epoch": 0.6670133282246367, "percentage": 66.71, "elapsed_time": "4 days, 16:09:30", "remaining_time": "2 days, 7:58:40", "throughput": 2723.83, "total_tokens": 1099802144} {"current_steps": 6094, "total_steps": 9134, "loss": 1.0026, "learning_rate": 1.2465265198193977e-05, "epoch": 0.6671228002955746, "percentage": 66.72, "elapsed_time": "4 days, 16:10:35", "remaining_time": "2 days, 7:57:33", "throughput": 2723.82, "total_tokens": 1099975744} {"current_steps": 6095, "total_steps": 9134, "loss": 0.7759, "learning_rate": 1.2457826224696225e-05, "epoch": 0.6672322723665125, "percentage": 66.73, "elapsed_time": "4 days, 16:11:42", "remaining_time": "2 days, 7:56:27", "throughput": 2723.84, "total_tokens": 1100165696} {"current_steps": 6096, "total_steps": 9134, "loss": 0.983, "learning_rate": 1.2450388734913657e-05, "epoch": 0.6673417444374504, "percentage": 66.74, "elapsed_time": "4 days, 16:12:50", "remaining_time": "2 days, 7:55:22", "throughput": 2723.87, "total_tokens": 1100363040} {"current_steps": 6097, "total_steps": 9134, "loss": 0.6779, "learning_rate": 1.2442952729726109e-05, "epoch": 0.6674512165083883, "percentage": 66.75, "elapsed_time": "4 days, 16:13:57", "remaining_time": "2 days, 7:54:16", "throughput": 2723.89, "total_tokens": 1100553888} {"current_steps": 6098, "total_steps": 9134, "loss": 0.7319, "learning_rate": 1.2435518210013248e-05, "epoch": 0.6675606885793262, "percentage": 66.76, "elapsed_time": "4 days, 16:14:59", "remaining_time": "2 days, 7:53:08", "throughput": 2723.86, "total_tokens": 1100712032} {"current_steps": 6099, "total_steps": 9134, "loss": 0.7459, "learning_rate": 1.2428085176654563e-05, "epoch": 0.6676701606502641, "percentage": 66.77, "elapsed_time": "4 days, 16:16:03", "remaining_time": "2 days, 7:52:01", "throughput": 2723.88, "total_tokens": 1100894144} {"current_steps": 6100, "total_steps": 9134, "loss": 0.9332, "learning_rate": 1.2420653630529369e-05, "epoch": 0.667779632721202, "percentage": 66.78, "elapsed_time": "4 days, 16:17:10", "remaining_time": "2 days, 7:50:55", "throughput": 2723.86, "total_tokens": 1101069088} {"current_steps": 6101, "total_steps": 9134, "loss": 0.6245, "learning_rate": 1.2413223572516802e-05, "epoch": 0.6678891047921399, "percentage": 66.79, "elapsed_time": "4 days, 16:18:17", "remaining_time": "2 days, 7:49:48", "throughput": 2723.88, "total_tokens": 1101256352} {"current_steps": 6102, "total_steps": 9134, "loss": 0.7321, "learning_rate": 1.2405795003495819e-05, "epoch": 0.6679985768630778, "percentage": 66.81, "elapsed_time": "4 days, 16:19:23", "remaining_time": "2 days, 7:48:42", "throughput": 2723.87, "total_tokens": 1101434208} {"current_steps": 6103, "total_steps": 9134, "loss": 0.8827, "learning_rate": 1.2398367924345213e-05, "epoch": 0.6681080489340158, "percentage": 66.82, "elapsed_time": "4 days, 16:20:29", "remaining_time": "2 days, 7:47:36", "throughput": 2723.82, "total_tokens": 1101591232} {"current_steps": 6104, "total_steps": 9134, "loss": 0.7978, "learning_rate": 1.2390942335943597e-05, "epoch": 0.6682175210049536, "percentage": 66.83, "elapsed_time": "4 days, 16:21:33", "remaining_time": "2 days, 7:46:28", "throughput": 2723.82, "total_tokens": 1101766624} {"current_steps": 6105, "total_steps": 9134, "loss": 0.7489, "learning_rate": 1.2383518239169397e-05, "epoch": 0.6683269930758915, "percentage": 66.84, "elapsed_time": "4 days, 16:22:40", "remaining_time": "2 days, 7:45:23", "throughput": 2723.88, "total_tokens": 1101974496} {"current_steps": 6106, "total_steps": 9134, "loss": 0.7039, "learning_rate": 1.2376095634900872e-05, "epoch": 0.6684364651468294, "percentage": 66.85, "elapsed_time": "4 days, 16:23:48", "remaining_time": "2 days, 7:44:17", "throughput": 2723.93, "total_tokens": 1102181696} {"current_steps": 6107, "total_steps": 9134, "loss": 0.6993, "learning_rate": 1.2368674524016099e-05, "epoch": 0.6685459372177673, "percentage": 66.86, "elapsed_time": "4 days, 16:24:54", "remaining_time": "2 days, 7:43:11", "throughput": 2723.94, "total_tokens": 1102364032} {"current_steps": 6108, "total_steps": 9134, "loss": 0.8255, "learning_rate": 1.2361254907392983e-05, "epoch": 0.6686554092887053, "percentage": 66.87, "elapsed_time": "4 days, 16:25:58", "remaining_time": "2 days, 7:42:03", "throughput": 2723.92, "total_tokens": 1102528000} {"current_steps": 6109, "total_steps": 9134, "loss": 0.7664, "learning_rate": 1.235383678590924e-05, "epoch": 0.6687648813596431, "percentage": 66.88, "elapsed_time": "4 days, 16:27:04", "remaining_time": "2 days, 7:40:57", "throughput": 2723.95, "total_tokens": 1102719296} {"current_steps": 6110, "total_steps": 9134, "loss": 0.8007, "learning_rate": 1.2346420160442449e-05, "epoch": 0.668874353430581, "percentage": 66.89, "elapsed_time": "4 days, 16:28:07", "remaining_time": "2 days, 7:39:49", "throughput": 2723.93, "total_tokens": 1102883040} {"current_steps": 6111, "total_steps": 9134, "loss": 0.7223, "learning_rate": 1.2339005031869947e-05, "epoch": 0.6689838255015189, "percentage": 66.9, "elapsed_time": "4 days, 16:29:08", "remaining_time": "2 days, 7:38:40", "throughput": 2723.86, "total_tokens": 1103021248} {"current_steps": 6112, "total_steps": 9134, "loss": 0.8199, "learning_rate": 1.2331591401068961e-05, "epoch": 0.6690932975724568, "percentage": 66.91, "elapsed_time": "4 days, 16:30:11", "remaining_time": "2 days, 7:37:32", "throughput": 2723.86, "total_tokens": 1103195296} {"current_steps": 6113, "total_steps": 9134, "loss": 0.7567, "learning_rate": 1.2324179268916478e-05, "epoch": 0.6692027696433948, "percentage": 66.93, "elapsed_time": "4 days, 16:31:16", "remaining_time": "2 days, 7:36:26", "throughput": 2723.89, "total_tokens": 1103384576} {"current_steps": 6114, "total_steps": 9134, "loss": 0.8462, "learning_rate": 1.2316768636289364e-05, "epoch": 0.6693122417143327, "percentage": 66.94, "elapsed_time": "4 days, 16:32:22", "remaining_time": "2 days, 7:35:19", "throughput": 2723.94, "total_tokens": 1103582368} {"current_steps": 6115, "total_steps": 9134, "loss": 0.7676, "learning_rate": 1.2309359504064274e-05, "epoch": 0.6694217137852705, "percentage": 66.95, "elapsed_time": "4 days, 16:33:31", "remaining_time": "2 days, 7:34:14", "throughput": 2723.98, "total_tokens": 1103787552} {"current_steps": 6116, "total_steps": 9134, "loss": 0.7054, "learning_rate": 1.2301951873117687e-05, "epoch": 0.6695311858562084, "percentage": 66.96, "elapsed_time": "4 days, 16:34:37", "remaining_time": "2 days, 7:33:08", "throughput": 2723.96, "total_tokens": 1103959360} {"current_steps": 6117, "total_steps": 9134, "loss": 0.8366, "learning_rate": 1.2294545744325935e-05, "epoch": 0.6696406579271463, "percentage": 66.97, "elapsed_time": "4 days, 16:35:44", "remaining_time": "2 days, 7:32:02", "throughput": 2724.01, "total_tokens": 1104164992} {"current_steps": 6118, "total_steps": 9134, "loss": 0.7889, "learning_rate": 1.2287141118565116e-05, "epoch": 0.6697501299980843, "percentage": 66.98, "elapsed_time": "4 days, 16:36:53", "remaining_time": "2 days, 7:30:57", "throughput": 2724.03, "total_tokens": 1104357408} {"current_steps": 6119, "total_steps": 9134, "loss": 0.7905, "learning_rate": 1.2279737996711216e-05, "epoch": 0.6698596020690222, "percentage": 66.99, "elapsed_time": "4 days, 16:38:02", "remaining_time": "2 days, 7:29:52", "throughput": 2724.02, "total_tokens": 1104539744} {"current_steps": 6120, "total_steps": 9134, "loss": 0.6631, "learning_rate": 1.2272336379639978e-05, "epoch": 0.6699690741399601, "percentage": 67.0, "elapsed_time": "4 days, 16:39:07", "remaining_time": "2 days, 7:28:45", "throughput": 2724.0, "total_tokens": 1104711776} {"current_steps": 6121, "total_steps": 9134, "loss": 0.9891, "learning_rate": 1.2264936268227032e-05, "epoch": 0.6700785462108979, "percentage": 67.01, "elapsed_time": "4 days, 16:40:16", "remaining_time": "2 days, 7:27:40", "throughput": 2724.1, "total_tokens": 1104939584} {"current_steps": 6122, "total_steps": 9134, "loss": 0.8852, "learning_rate": 1.2257537663347763e-05, "epoch": 0.6701880182818358, "percentage": 67.02, "elapsed_time": "4 days, 16:41:19", "remaining_time": "2 days, 7:26:32", "throughput": 2724.1, "total_tokens": 1105110720} {"current_steps": 6123, "total_steps": 9134, "loss": 0.6681, "learning_rate": 1.2250140565877438e-05, "epoch": 0.6702974903527738, "percentage": 67.04, "elapsed_time": "4 days, 16:42:23", "remaining_time": "2 days, 7:25:25", "throughput": 2724.1, "total_tokens": 1105286112} {"current_steps": 6124, "total_steps": 9134, "loss": 0.9507, "learning_rate": 1.2242744976691109e-05, "epoch": 0.6704069624237117, "percentage": 67.05, "elapsed_time": "4 days, 16:43:26", "remaining_time": "2 days, 7:24:17", "throughput": 2724.11, "total_tokens": 1105461728} {"current_steps": 6125, "total_steps": 9134, "loss": 0.5057, "learning_rate": 1.2235350896663662e-05, "epoch": 0.6705164344946496, "percentage": 67.06, "elapsed_time": "4 days, 16:44:31", "remaining_time": "2 days, 7:23:10", "throughput": 2724.13, "total_tokens": 1105647648} {"current_steps": 6126, "total_steps": 9134, "loss": 1.0572, "learning_rate": 1.2227958326669803e-05, "epoch": 0.6706259065655874, "percentage": 67.07, "elapsed_time": "4 days, 16:45:38", "remaining_time": "2 days, 7:22:04", "throughput": 2724.17, "total_tokens": 1105846784} {"current_steps": 6127, "total_steps": 9134, "loss": 0.7698, "learning_rate": 1.2220567267584048e-05, "epoch": 0.6707353786365253, "percentage": 67.08, "elapsed_time": "4 days, 16:46:43", "remaining_time": "2 days, 7:20:57", "throughput": 2724.15, "total_tokens": 1106015904} {"current_steps": 6128, "total_steps": 9134, "loss": 0.7536, "learning_rate": 1.2213177720280764e-05, "epoch": 0.6708448507074632, "percentage": 67.09, "elapsed_time": "4 days, 16:47:51", "remaining_time": "2 days, 7:19:52", "throughput": 2724.18, "total_tokens": 1106208992} {"current_steps": 6129, "total_steps": 9134, "loss": 0.7414, "learning_rate": 1.2205789685634112e-05, "epoch": 0.6709543227784012, "percentage": 67.1, "elapsed_time": "4 days, 16:48:59", "remaining_time": "2 days, 7:18:47", "throughput": 2724.25, "total_tokens": 1106425152} {"current_steps": 6130, "total_steps": 9134, "loss": 0.8358, "learning_rate": 1.2198403164518083e-05, "epoch": 0.6710637948493391, "percentage": 67.11, "elapsed_time": "4 days, 16:50:05", "remaining_time": "2 days, 7:17:40", "throughput": 2724.23, "total_tokens": 1106597408} {"current_steps": 6131, "total_steps": 9134, "loss": 0.807, "learning_rate": 1.2191018157806485e-05, "epoch": 0.671173266920277, "percentage": 67.12, "elapsed_time": "4 days, 16:51:11", "remaining_time": "2 days, 7:16:33", "throughput": 2724.23, "total_tokens": 1106776832} {"current_steps": 6132, "total_steps": 9134, "loss": 0.9014, "learning_rate": 1.2183634666372954e-05, "epoch": 0.6712827389912148, "percentage": 67.13, "elapsed_time": "4 days, 16:52:15", "remaining_time": "2 days, 7:15:26", "throughput": 2724.2, "total_tokens": 1106939680} {"current_steps": 6133, "total_steps": 9134, "loss": 0.676, "learning_rate": 1.2176252691090939e-05, "epoch": 0.6713922110621527, "percentage": 67.14, "elapsed_time": "4 days, 16:53:21", "remaining_time": "2 days, 7:14:20", "throughput": 2724.17, "total_tokens": 1107104544} {"current_steps": 6134, "total_steps": 9134, "loss": 0.6751, "learning_rate": 1.2168872232833717e-05, "epoch": 0.6715016831330907, "percentage": 67.16, "elapsed_time": "4 days, 16:54:28", "remaining_time": "2 days, 7:13:14", "throughput": 2724.18, "total_tokens": 1107294720} {"current_steps": 6135, "total_steps": 9134, "loss": 0.7461, "learning_rate": 1.216149329247437e-05, "epoch": 0.6716111552040286, "percentage": 67.17, "elapsed_time": "4 days, 16:55:34", "remaining_time": "2 days, 7:12:07", "throughput": 2724.22, "total_tokens": 1107487584} {"current_steps": 6136, "total_steps": 9134, "loss": 0.7174, "learning_rate": 1.2154115870885838e-05, "epoch": 0.6717206272749665, "percentage": 67.18, "elapsed_time": "4 days, 16:56:35", "remaining_time": "2 days, 7:10:59", "throughput": 2724.2, "total_tokens": 1107647072} {"current_steps": 6137, "total_steps": 9134, "loss": 0.6933, "learning_rate": 1.2146739968940838e-05, "epoch": 0.6718300993459044, "percentage": 67.19, "elapsed_time": "4 days, 16:57:38", "remaining_time": "2 days, 7:09:51", "throughput": 2724.17, "total_tokens": 1107805664} {"current_steps": 6138, "total_steps": 9134, "loss": 0.7058, "learning_rate": 1.2139365587511927e-05, "epoch": 0.6719395714168422, "percentage": 67.2, "elapsed_time": "4 days, 16:58:41", "remaining_time": "2 days, 7:08:43", "throughput": 2724.16, "total_tokens": 1107973664} {"current_steps": 6139, "total_steps": 9134, "loss": 0.6256, "learning_rate": 1.2131992727471484e-05, "epoch": 0.6720490434877802, "percentage": 67.21, "elapsed_time": "4 days, 16:59:43", "remaining_time": "2 days, 7:07:35", "throughput": 2724.13, "total_tokens": 1108133376} {"current_steps": 6140, "total_steps": 9134, "loss": 0.9088, "learning_rate": 1.2124621389691702e-05, "epoch": 0.6721585155587181, "percentage": 67.22, "elapsed_time": "4 days, 17:00:49", "remaining_time": "2 days, 7:06:28", "throughput": 2724.16, "total_tokens": 1108321760} {"current_steps": 6141, "total_steps": 9134, "loss": 0.7775, "learning_rate": 1.2117251575044594e-05, "epoch": 0.672267987629656, "percentage": 67.23, "elapsed_time": "4 days, 17:01:52", "remaining_time": "2 days, 7:05:21", "throughput": 2724.15, "total_tokens": 1108490432} {"current_steps": 6142, "total_steps": 9134, "loss": 0.7001, "learning_rate": 1.2109883284401987e-05, "epoch": 0.6723774597005939, "percentage": 67.24, "elapsed_time": "4 days, 17:02:58", "remaining_time": "2 days, 7:04:14", "throughput": 2724.15, "total_tokens": 1108668960} {"current_steps": 6143, "total_steps": 9134, "loss": 0.686, "learning_rate": 1.2102516518635568e-05, "epoch": 0.6724869317715317, "percentage": 67.25, "elapsed_time": "4 days, 17:04:07", "remaining_time": "2 days, 7:03:09", "throughput": 2724.17, "total_tokens": 1108865408} {"current_steps": 6144, "total_steps": 9134, "loss": 0.6469, "learning_rate": 1.2095151278616768e-05, "epoch": 0.6725964038424697, "percentage": 67.27, "elapsed_time": "4 days, 17:05:09", "remaining_time": "2 days, 7:02:01", "throughput": 2724.12, "total_tokens": 1109015936} {"current_steps": 6145, "total_steps": 9134, "loss": 1.0076, "learning_rate": 1.208778756521691e-05, "epoch": 0.6727058759134076, "percentage": 67.28, "elapsed_time": "4 days, 17:06:14", "remaining_time": "2 days, 7:00:54", "throughput": 2724.13, "total_tokens": 1109195136} {"current_steps": 6146, "total_steps": 9134, "loss": 0.7697, "learning_rate": 1.20804253793071e-05, "epoch": 0.6728153479843455, "percentage": 67.29, "elapsed_time": "4 days, 17:07:22", "remaining_time": "2 days, 6:59:49", "throughput": 2724.18, "total_tokens": 1109403008} {"current_steps": 6147, "total_steps": 9134, "loss": 0.6655, "learning_rate": 1.207306472175827e-05, "epoch": 0.6729248200552834, "percentage": 67.3, "elapsed_time": "4 days, 17:08:29", "remaining_time": "2 days, 6:58:43", "throughput": 2724.19, "total_tokens": 1109590944} {"current_steps": 6148, "total_steps": 9134, "loss": 0.6112, "learning_rate": 1.2065705593441174e-05, "epoch": 0.6730342921262213, "percentage": 67.31, "elapsed_time": "4 days, 17:09:34", "remaining_time": "2 days, 6:57:36", "throughput": 2724.21, "total_tokens": 1109775296} {"current_steps": 6149, "total_steps": 9134, "loss": 0.9071, "learning_rate": 1.2058347995226365e-05, "epoch": 0.6731437641971592, "percentage": 67.32, "elapsed_time": "4 days, 17:10:38", "remaining_time": "2 days, 6:56:29", "throughput": 2724.18, "total_tokens": 1109936576} {"current_steps": 6150, "total_steps": 9134, "loss": 0.9468, "learning_rate": 1.2050991927984273e-05, "epoch": 0.6732532362680971, "percentage": 67.33, "elapsed_time": "4 days, 17:11:43", "remaining_time": "2 days, 6:55:22", "throughput": 2724.22, "total_tokens": 1110130784} {"current_steps": 6151, "total_steps": 9134, "loss": 0.6709, "learning_rate": 1.2043637392585059e-05, "epoch": 0.673362708339035, "percentage": 67.34, "elapsed_time": "4 days, 17:12:48", "remaining_time": "2 days, 6:54:15", "throughput": 2724.2, "total_tokens": 1110298560} {"current_steps": 6152, "total_steps": 9134, "loss": 0.6217, "learning_rate": 1.2036284389898791e-05, "epoch": 0.6734721804099729, "percentage": 67.35, "elapsed_time": "4 days, 17:13:54", "remaining_time": "2 days, 6:53:08", "throughput": 2724.19, "total_tokens": 1110473056} {"current_steps": 6153, "total_steps": 9134, "loss": 0.6576, "learning_rate": 1.2028932920795284e-05, "epoch": 0.6735816524809108, "percentage": 67.36, "elapsed_time": "4 days, 17:14:59", "remaining_time": "2 days, 6:52:02", "throughput": 2724.16, "total_tokens": 1110640384} {"current_steps": 6154, "total_steps": 9134, "loss": 0.8934, "learning_rate": 1.2021582986144229e-05, "epoch": 0.6736911245518488, "percentage": 67.37, "elapsed_time": "4 days, 17:16:05", "remaining_time": "2 days, 6:50:55", "throughput": 2724.18, "total_tokens": 1110826304} {"current_steps": 6155, "total_steps": 9134, "loss": 0.8256, "learning_rate": 1.2014234586815079e-05, "epoch": 0.6738005966227866, "percentage": 67.39, "elapsed_time": "4 days, 17:17:11", "remaining_time": "2 days, 6:49:49", "throughput": 2724.18, "total_tokens": 1111006624} {"current_steps": 6156, "total_steps": 9134, "loss": 0.6484, "learning_rate": 1.2006887723677162e-05, "epoch": 0.6739100686937245, "percentage": 67.4, "elapsed_time": "4 days, 17:18:18", "remaining_time": "2 days, 6:48:43", "throughput": 2724.19, "total_tokens": 1111193216} {"current_steps": 6157, "total_steps": 9134, "loss": 0.6988, "learning_rate": 1.1999542397599589e-05, "epoch": 0.6740195407646624, "percentage": 67.41, "elapsed_time": "4 days, 17:19:21", "remaining_time": "2 days, 6:47:35", "throughput": 2724.18, "total_tokens": 1111359424} {"current_steps": 6158, "total_steps": 9134, "loss": 0.6204, "learning_rate": 1.1992198609451288e-05, "epoch": 0.6741290128356003, "percentage": 67.42, "elapsed_time": "4 days, 17:20:27", "remaining_time": "2 days, 6:46:28", "throughput": 2724.17, "total_tokens": 1111534816} {"current_steps": 6159, "total_steps": 9134, "loss": 0.8895, "learning_rate": 1.1984856360101045e-05, "epoch": 0.6742384849065383, "percentage": 67.43, "elapsed_time": "4 days, 17:21:34", "remaining_time": "2 days, 6:45:22", "throughput": 2724.16, "total_tokens": 1111714464} {"current_steps": 6160, "total_steps": 9134, "loss": 0.7933, "learning_rate": 1.1977515650417396e-05, "epoch": 0.6743479569774761, "percentage": 67.44, "elapsed_time": "4 days, 17:22:41", "remaining_time": "2 days, 6:44:17", "throughput": 2724.17, "total_tokens": 1111899040} {"current_steps": 6161, "total_steps": 9134, "loss": 0.9438, "learning_rate": 1.1970176481268766e-05, "epoch": 0.674457429048414, "percentage": 67.45, "elapsed_time": "4 days, 17:23:47", "remaining_time": "2 days, 6:43:10", "throughput": 2724.16, "total_tokens": 1112076448} {"current_steps": 6162, "total_steps": 9134, "loss": 0.7082, "learning_rate": 1.1962838853523335e-05, "epoch": 0.6745669011193519, "percentage": 67.46, "elapsed_time": "4 days, 17:24:47", "remaining_time": "2 days, 6:42:01", "throughput": 2724.14, "total_tokens": 1112230784} {"current_steps": 6163, "total_steps": 9134, "loss": 0.698, "learning_rate": 1.195550276804915e-05, "epoch": 0.6746763731902898, "percentage": 67.47, "elapsed_time": "4 days, 17:25:53", "remaining_time": "2 days, 6:40:54", "throughput": 2724.16, "total_tokens": 1112420512} {"current_steps": 6164, "total_steps": 9134, "loss": 0.6488, "learning_rate": 1.1948168225714051e-05, "epoch": 0.6747858452612278, "percentage": 67.48, "elapsed_time": "4 days, 17:27:01", "remaining_time": "2 days, 6:39:49", "throughput": 2724.15, "total_tokens": 1112602400} {"current_steps": 6165, "total_steps": 9134, "loss": 0.7395, "learning_rate": 1.1940835227385702e-05, "epoch": 0.6748953173321657, "percentage": 67.5, "elapsed_time": "4 days, 17:28:04", "remaining_time": "2 days, 6:38:41", "throughput": 2724.15, "total_tokens": 1112771744} {"current_steps": 6166, "total_steps": 9134, "loss": 0.9476, "learning_rate": 1.1933503773931581e-05, "epoch": 0.6750047894031035, "percentage": 67.51, "elapsed_time": "4 days, 17:29:13", "remaining_time": "2 days, 6:37:36", "throughput": 2724.2, "total_tokens": 1112982304} {"current_steps": 6167, "total_steps": 9134, "loss": 0.8011, "learning_rate": 1.1926173866218984e-05, "epoch": 0.6751142614740414, "percentage": 67.52, "elapsed_time": "4 days, 17:30:18", "remaining_time": "2 days, 6:36:30", "throughput": 2724.22, "total_tokens": 1113165984} {"current_steps": 6168, "total_steps": 9134, "loss": 0.947, "learning_rate": 1.1918845505115025e-05, "epoch": 0.6752237335449793, "percentage": 67.53, "elapsed_time": "4 days, 17:31:24", "remaining_time": "2 days, 6:35:23", "throughput": 2724.22, "total_tokens": 1113344736} {"current_steps": 6169, "total_steps": 9134, "loss": 0.8513, "learning_rate": 1.1911518691486626e-05, "epoch": 0.6753332056159173, "percentage": 67.54, "elapsed_time": "4 days, 17:32:26", "remaining_time": "2 days, 6:34:15", "throughput": 2724.18, "total_tokens": 1113500416} {"current_steps": 6170, "total_steps": 9134, "loss": 0.866, "learning_rate": 1.1904193426200554e-05, "epoch": 0.6754426776868552, "percentage": 67.55, "elapsed_time": "4 days, 17:33:34", "remaining_time": "2 days, 6:33:10", "throughput": 2724.19, "total_tokens": 1113691040} {"current_steps": 6171, "total_steps": 9134, "loss": 0.9745, "learning_rate": 1.1896869710123368e-05, "epoch": 0.6755521497577931, "percentage": 67.56, "elapsed_time": "4 days, 17:34:41", "remaining_time": "2 days, 6:32:04", "throughput": 2724.18, "total_tokens": 1113865984} {"current_steps": 6172, "total_steps": 9134, "loss": 0.6319, "learning_rate": 1.1889547544121443e-05, "epoch": 0.6756616218287309, "percentage": 67.57, "elapsed_time": "4 days, 17:35:50", "remaining_time": "2 days, 6:30:59", "throughput": 2724.15, "total_tokens": 1114042720} {"current_steps": 6173, "total_steps": 9134, "loss": 0.9203, "learning_rate": 1.1882226929060982e-05, "epoch": 0.6757710938996688, "percentage": 67.58, "elapsed_time": "4 days, 17:36:58", "remaining_time": "2 days, 6:29:53", "throughput": 2724.17, "total_tokens": 1114234688} {"current_steps": 6174, "total_steps": 9134, "loss": 0.7321, "learning_rate": 1.1874907865808e-05, "epoch": 0.6758805659706068, "percentage": 67.59, "elapsed_time": "4 days, 17:38:01", "remaining_time": "2 days, 6:28:45", "throughput": 2724.11, "total_tokens": 1114382528} {"current_steps": 6175, "total_steps": 9134, "loss": 0.8856, "learning_rate": 1.1867590355228326e-05, "epoch": 0.6759900380415447, "percentage": 67.6, "elapsed_time": "4 days, 17:39:07", "remaining_time": "2 days, 6:27:39", "throughput": 2724.1, "total_tokens": 1114561056} {"current_steps": 6176, "total_steps": 9134, "loss": 0.8121, "learning_rate": 1.1860274398187605e-05, "epoch": 0.6760995101124826, "percentage": 67.62, "elapsed_time": "4 days, 17:40:11", "remaining_time": "2 days, 6:26:32", "throughput": 2724.09, "total_tokens": 1114727936} {"current_steps": 6177, "total_steps": 9134, "loss": 0.6789, "learning_rate": 1.1852959995551297e-05, "epoch": 0.6762089821834204, "percentage": 67.63, "elapsed_time": "4 days, 17:41:20", "remaining_time": "2 days, 6:25:27", "throughput": 2724.14, "total_tokens": 1114938048} {"current_steps": 6178, "total_steps": 9134, "loss": 0.9061, "learning_rate": 1.1845647148184696e-05, "epoch": 0.6763184542543583, "percentage": 67.64, "elapsed_time": "4 days, 17:42:26", "remaining_time": "2 days, 6:24:20", "throughput": 2724.13, "total_tokens": 1115113888} {"current_steps": 6179, "total_steps": 9134, "loss": 0.55, "learning_rate": 1.1838335856952893e-05, "epoch": 0.6764279263252962, "percentage": 67.65, "elapsed_time": "4 days, 17:43:30", "remaining_time": "2 days, 6:23:13", "throughput": 2724.14, "total_tokens": 1115291296} {"current_steps": 6180, "total_steps": 9134, "loss": 0.8134, "learning_rate": 1.1831026122720795e-05, "epoch": 0.6765373983962342, "percentage": 67.66, "elapsed_time": "4 days, 17:44:35", "remaining_time": "2 days, 6:22:06", "throughput": 2724.12, "total_tokens": 1115462880} {"current_steps": 6181, "total_steps": 9134, "loss": 0.8201, "learning_rate": 1.1823717946353134e-05, "epoch": 0.6766468704671721, "percentage": 67.67, "elapsed_time": "4 days, 17:45:40", "remaining_time": "2 days, 6:20:59", "throughput": 2724.1, "total_tokens": 1115627968} {"current_steps": 6182, "total_steps": 9134, "loss": 0.8666, "learning_rate": 1.181641132871445e-05, "epoch": 0.67675634253811, "percentage": 67.68, "elapsed_time": "4 days, 17:46:49", "remaining_time": "2 days, 6:19:54", "throughput": 2724.14, "total_tokens": 1115833824} {"current_steps": 6183, "total_steps": 9134, "loss": 0.8388, "learning_rate": 1.1809106270669104e-05, "epoch": 0.6768658146090478, "percentage": 67.69, "elapsed_time": "4 days, 17:47:58", "remaining_time": "2 days, 6:18:50", "throughput": 2724.24, "total_tokens": 1116063200} {"current_steps": 6184, "total_steps": 9134, "loss": 0.6171, "learning_rate": 1.1801802773081258e-05, "epoch": 0.6769752866799857, "percentage": 67.7, "elapsed_time": "4 days, 17:48:57", "remaining_time": "2 days, 6:17:40", "throughput": 2724.2, "total_tokens": 1116205888} {"current_steps": 6185, "total_steps": 9134, "loss": 0.879, "learning_rate": 1.1794500836814933e-05, "epoch": 0.6770847587509237, "percentage": 67.71, "elapsed_time": "4 days, 17:50:00", "remaining_time": "2 days, 6:16:32", "throughput": 2724.17, "total_tokens": 1116367168} {"current_steps": 6186, "total_steps": 9134, "loss": 0.6222, "learning_rate": 1.1787200462733897e-05, "epoch": 0.6771942308218616, "percentage": 67.72, "elapsed_time": "4 days, 17:51:09", "remaining_time": "2 days, 6:15:27", "throughput": 2724.2, "total_tokens": 1116566976} {"current_steps": 6187, "total_steps": 9134, "loss": 0.7331, "learning_rate": 1.1779901651701796e-05, "epoch": 0.6773037028927995, "percentage": 67.74, "elapsed_time": "4 days, 17:52:16", "remaining_time": "2 days, 6:14:21", "throughput": 2724.18, "total_tokens": 1116739904} {"current_steps": 6188, "total_steps": 9134, "loss": 0.8141, "learning_rate": 1.1772604404582057e-05, "epoch": 0.6774131749637374, "percentage": 67.75, "elapsed_time": "4 days, 17:53:25", "remaining_time": "2 days, 6:13:16", "throughput": 2724.22, "total_tokens": 1116943072} {"current_steps": 6189, "total_steps": 9134, "loss": 0.6077, "learning_rate": 1.176530872223793e-05, "epoch": 0.6775226470346752, "percentage": 67.76, "elapsed_time": "4 days, 17:54:31", "remaining_time": "2 days, 6:12:10", "throughput": 2724.22, "total_tokens": 1117128096} {"current_steps": 6190, "total_steps": 9134, "loss": 0.9152, "learning_rate": 1.1758014605532483e-05, "epoch": 0.6776321191056132, "percentage": 67.77, "elapsed_time": "4 days, 17:55:35", "remaining_time": "2 days, 6:11:02", "throughput": 2724.22, "total_tokens": 1117299008} {"current_steps": 6191, "total_steps": 9134, "loss": 0.6609, "learning_rate": 1.1750722055328581e-05, "epoch": 0.6777415911765511, "percentage": 67.78, "elapsed_time": "4 days, 17:56:41", "remaining_time": "2 days, 6:09:56", "throughput": 2724.23, "total_tokens": 1117484704} {"current_steps": 6192, "total_steps": 9134, "loss": 0.7009, "learning_rate": 1.1743431072488952e-05, "epoch": 0.677851063247489, "percentage": 67.79, "elapsed_time": "4 days, 17:57:48", "remaining_time": "2 days, 6:08:50", "throughput": 2724.28, "total_tokens": 1117683840} {"current_steps": 6193, "total_steps": 9134, "loss": 1.1124, "learning_rate": 1.1736141657876068e-05, "epoch": 0.6779605353184269, "percentage": 67.8, "elapsed_time": "4 days, 17:58:56", "remaining_time": "2 days, 6:07:45", "throughput": 2724.28, "total_tokens": 1117873120} {"current_steps": 6194, "total_steps": 9134, "loss": 0.7856, "learning_rate": 1.1728853812352286e-05, "epoch": 0.6780700073893647, "percentage": 67.81, "elapsed_time": "4 days, 17:59:56", "remaining_time": "2 days, 6:06:35", "throughput": 2724.22, "total_tokens": 1118009536} {"current_steps": 6195, "total_steps": 9134, "loss": 0.6702, "learning_rate": 1.172156753677971e-05, "epoch": 0.6781794794603027, "percentage": 67.82, "elapsed_time": "4 days, 18:00:59", "remaining_time": "2 days, 6:05:28", "throughput": 2724.23, "total_tokens": 1118185600} {"current_steps": 6196, "total_steps": 9134, "loss": 1.0739, "learning_rate": 1.1714282832020318e-05, "epoch": 0.6782889515312406, "percentage": 67.83, "elapsed_time": "4 days, 18:02:08", "remaining_time": "2 days, 6:04:23", "throughput": 2724.26, "total_tokens": 1118387872} {"current_steps": 6197, "total_steps": 9134, "loss": 0.674, "learning_rate": 1.170699969893587e-05, "epoch": 0.6783984236021785, "percentage": 67.85, "elapsed_time": "4 days, 18:03:17", "remaining_time": "2 days, 6:03:18", "throughput": 2724.31, "total_tokens": 1118593504} {"current_steps": 6198, "total_steps": 9134, "loss": 0.8084, "learning_rate": 1.1699718138387947e-05, "epoch": 0.6785078956731164, "percentage": 67.86, "elapsed_time": "4 days, 18:04:22", "remaining_time": "2 days, 6:02:11", "throughput": 2724.3, "total_tokens": 1118769568} {"current_steps": 6199, "total_steps": 9134, "loss": 0.8557, "learning_rate": 1.1692438151237942e-05, "epoch": 0.6786173677440543, "percentage": 67.87, "elapsed_time": "4 days, 18:05:25", "remaining_time": "2 days, 6:01:03", "throughput": 2724.32, "total_tokens": 1118948544} {"current_steps": 6200, "total_steps": 9134, "loss": 0.9654, "learning_rate": 1.1685159738347054e-05, "epoch": 0.6787268398149922, "percentage": 67.88, "elapsed_time": "4 days, 18:06:27", "remaining_time": "2 days, 5:59:55", "throughput": 2724.27, "total_tokens": 1119095712} {"current_steps": 6201, "total_steps": 9134, "loss": 0.7937, "learning_rate": 1.1677882900576334e-05, "epoch": 0.6788363118859301, "percentage": 67.89, "elapsed_time": "4 days, 18:07:36", "remaining_time": "2 days, 5:58:50", "throughput": 2724.25, "total_tokens": 1119273568} {"current_steps": 6202, "total_steps": 9134, "loss": 0.925, "learning_rate": 1.1670607638786579e-05, "epoch": 0.678945783956868, "percentage": 67.9, "elapsed_time": "4 days, 18:08:44", "remaining_time": "2 days, 5:57:45", "throughput": 2724.26, "total_tokens": 1119467552} {"current_steps": 6203, "total_steps": 9134, "loss": 0.7855, "learning_rate": 1.166333395383847e-05, "epoch": 0.6790552560278059, "percentage": 67.91, "elapsed_time": "4 days, 18:09:49", "remaining_time": "2 days, 5:56:37", "throughput": 2724.22, "total_tokens": 1119625920} {"current_steps": 6204, "total_steps": 9134, "loss": 0.6556, "learning_rate": 1.1656061846592458e-05, "epoch": 0.6791647280987438, "percentage": 67.92, "elapsed_time": "4 days, 18:10:58", "remaining_time": "2 days, 5:55:32", "throughput": 2724.26, "total_tokens": 1119830432} {"current_steps": 6205, "total_steps": 9134, "loss": 0.8691, "learning_rate": 1.1648791317908822e-05, "epoch": 0.6792742001696818, "percentage": 67.93, "elapsed_time": "4 days, 18:12:00", "remaining_time": "2 days, 5:54:24", "throughput": 2724.2, "total_tokens": 1119971552} {"current_steps": 6206, "total_steps": 9134, "loss": 0.8292, "learning_rate": 1.164152236864765e-05, "epoch": 0.6793836722406196, "percentage": 67.94, "elapsed_time": "4 days, 18:13:07", "remaining_time": "2 days, 5:53:19", "throughput": 2724.2, "total_tokens": 1120157248} {"current_steps": 6207, "total_steps": 9134, "loss": 0.6862, "learning_rate": 1.1634254999668842e-05, "epoch": 0.6794931443115575, "percentage": 67.95, "elapsed_time": "4 days, 18:14:13", "remaining_time": "2 days, 5:52:12", "throughput": 2724.23, "total_tokens": 1120350112} {"current_steps": 6208, "total_steps": 9134, "loss": 0.8896, "learning_rate": 1.162698921183212e-05, "epoch": 0.6796026163824954, "percentage": 67.97, "elapsed_time": "4 days, 18:15:21", "remaining_time": "2 days, 5:51:07", "throughput": 2724.29, "total_tokens": 1120559104} {"current_steps": 6209, "total_steps": 9134, "loss": 0.7586, "learning_rate": 1.1619725005997007e-05, "epoch": 0.6797120884534333, "percentage": 67.98, "elapsed_time": "4 days, 18:16:30", "remaining_time": "2 days, 5:50:01", "throughput": 2724.27, "total_tokens": 1120738304} {"current_steps": 6210, "total_steps": 9134, "loss": 0.9708, "learning_rate": 1.1612462383022838e-05, "epoch": 0.6798215605243713, "percentage": 67.99, "elapsed_time": "4 days, 18:17:37", "remaining_time": "2 days, 5:48:56", "throughput": 2724.31, "total_tokens": 1120937440} {"current_steps": 6211, "total_steps": 9134, "loss": 0.5127, "learning_rate": 1.1605201343768787e-05, "epoch": 0.6799310325953091, "percentage": 68.0, "elapsed_time": "4 days, 18:18:44", "remaining_time": "2 days, 5:47:50", "throughput": 2724.3, "total_tokens": 1121113056} {"current_steps": 6212, "total_steps": 9134, "loss": 0.7639, "learning_rate": 1.1597941889093808e-05, "epoch": 0.680040504666247, "percentage": 68.01, "elapsed_time": "4 days, 18:19:51", "remaining_time": "2 days, 5:46:44", "throughput": 2724.34, "total_tokens": 1121317344} {"current_steps": 6213, "total_steps": 9134, "loss": 0.6956, "learning_rate": 1.1590684019856687e-05, "epoch": 0.6801499767371849, "percentage": 68.02, "elapsed_time": "4 days, 18:20:55", "remaining_time": "2 days, 5:45:37", "throughput": 2724.33, "total_tokens": 1121484672} {"current_steps": 6214, "total_steps": 9134, "loss": 0.866, "learning_rate": 1.1583427736916008e-05, "epoch": 0.6802594488081228, "percentage": 68.03, "elapsed_time": "4 days, 18:22:01", "remaining_time": "2 days, 5:44:30", "throughput": 2724.29, "total_tokens": 1121647744} {"current_steps": 6215, "total_steps": 9134, "loss": 0.6814, "learning_rate": 1.1576173041130184e-05, "epoch": 0.6803689208790608, "percentage": 68.04, "elapsed_time": "4 days, 18:23:10", "remaining_time": "2 days, 5:43:25", "throughput": 2724.33, "total_tokens": 1121851136} {"current_steps": 6216, "total_steps": 9134, "loss": 0.8806, "learning_rate": 1.1568919933357423e-05, "epoch": 0.6804783929499987, "percentage": 68.05, "elapsed_time": "4 days, 18:24:16", "remaining_time": "2 days, 5:42:19", "throughput": 2724.35, "total_tokens": 1122040640} {"current_steps": 6217, "total_steps": 9134, "loss": 0.7274, "learning_rate": 1.1561668414455751e-05, "epoch": 0.6805878650209365, "percentage": 68.06, "elapsed_time": "4 days, 18:25:23", "remaining_time": "2 days, 5:41:13", "throughput": 2724.37, "total_tokens": 1122231712} {"current_steps": 6218, "total_steps": 9134, "loss": 0.7445, "learning_rate": 1.1554418485283033e-05, "epoch": 0.6806973370918744, "percentage": 68.08, "elapsed_time": "4 days, 18:26:27", "remaining_time": "2 days, 5:40:05", "throughput": 2724.33, "total_tokens": 1122389632} {"current_steps": 6219, "total_steps": 9134, "loss": 0.6946, "learning_rate": 1.1547170146696887e-05, "epoch": 0.6808068091628123, "percentage": 68.09, "elapsed_time": "4 days, 18:27:34", "remaining_time": "2 days, 5:39:00", "throughput": 2724.41, "total_tokens": 1122603776} {"current_steps": 6220, "total_steps": 9134, "loss": 0.9101, "learning_rate": 1.1539923399554805e-05, "epoch": 0.6809162812337503, "percentage": 68.1, "elapsed_time": "4 days, 18:28:39", "remaining_time": "2 days, 5:37:53", "throughput": 2724.38, "total_tokens": 1122769760} {"current_steps": 6221, "total_steps": 9134, "loss": 0.7528, "learning_rate": 1.1532678244714055e-05, "epoch": 0.6810257533046882, "percentage": 68.11, "elapsed_time": "4 days, 18:29:42", "remaining_time": "2 days, 5:36:45", "throughput": 2724.38, "total_tokens": 1122940896} {"current_steps": 6222, "total_steps": 9134, "loss": 0.691, "learning_rate": 1.1525434683031718e-05, "epoch": 0.6811352253756261, "percentage": 68.12, "elapsed_time": "4 days, 18:30:44", "remaining_time": "2 days, 5:35:37", "throughput": 2724.36, "total_tokens": 1123101504} {"current_steps": 6223, "total_steps": 9134, "loss": 0.7209, "learning_rate": 1.1518192715364704e-05, "epoch": 0.6812446974465639, "percentage": 68.13, "elapsed_time": "4 days, 18:31:53", "remaining_time": "2 days, 5:34:32", "throughput": 2724.36, "total_tokens": 1123290336} {"current_steps": 6224, "total_steps": 9134, "loss": 0.8309, "learning_rate": 1.1510952342569708e-05, "epoch": 0.6813541695175018, "percentage": 68.14, "elapsed_time": "4 days, 18:33:00", "remaining_time": "2 days, 5:33:26", "throughput": 2724.37, "total_tokens": 1123474912} {"current_steps": 6225, "total_steps": 9134, "loss": 0.7177, "learning_rate": 1.1503713565503282e-05, "epoch": 0.6814636415884398, "percentage": 68.15, "elapsed_time": "4 days, 18:34:04", "remaining_time": "2 days, 5:32:19", "throughput": 2724.36, "total_tokens": 1123648288} {"current_steps": 6226, "total_steps": 9134, "loss": 0.7875, "learning_rate": 1.1496476385021723e-05, "epoch": 0.6815731136593777, "percentage": 68.16, "elapsed_time": "4 days, 18:35:13", "remaining_time": "2 days, 5:31:14", "throughput": 2724.35, "total_tokens": 1123829728} {"current_steps": 6227, "total_steps": 9134, "loss": 0.7414, "learning_rate": 1.148924080198121e-05, "epoch": 0.6816825857303156, "percentage": 68.17, "elapsed_time": "4 days, 18:36:15", "remaining_time": "2 days, 5:30:05", "throughput": 2724.32, "total_tokens": 1123987872} {"current_steps": 6228, "total_steps": 9134, "loss": 0.7983, "learning_rate": 1.1482006817237665e-05, "epoch": 0.6817920578012534, "percentage": 68.18, "elapsed_time": "4 days, 18:37:21", "remaining_time": "2 days, 5:28:59", "throughput": 2724.33, "total_tokens": 1124173792} {"current_steps": 6229, "total_steps": 9134, "loss": 0.7431, "learning_rate": 1.1474774431646878e-05, "epoch": 0.6819015298721913, "percentage": 68.2, "elapsed_time": "4 days, 18:38:25", "remaining_time": "2 days, 5:27:52", "throughput": 2724.32, "total_tokens": 1124341792} {"current_steps": 6230, "total_steps": 9134, "loss": 0.6668, "learning_rate": 1.1467543646064424e-05, "epoch": 0.6820110019431292, "percentage": 68.21, "elapsed_time": "4 days, 18:39:31", "remaining_time": "2 days, 5:26:45", "throughput": 2724.3, "total_tokens": 1124510912} {"current_steps": 6231, "total_steps": 9134, "loss": 0.843, "learning_rate": 1.1460314461345684e-05, "epoch": 0.6821204740140672, "percentage": 68.22, "elapsed_time": "4 days, 18:40:37", "remaining_time": "2 days, 5:25:39", "throughput": 2724.34, "total_tokens": 1124711616} {"current_steps": 6232, "total_steps": 9134, "loss": 0.5774, "learning_rate": 1.1453086878345862e-05, "epoch": 0.6822299460850051, "percentage": 68.23, "elapsed_time": "4 days, 18:41:37", "remaining_time": "2 days, 5:24:30", "throughput": 2724.3, "total_tokens": 1124856992} {"current_steps": 6233, "total_steps": 9134, "loss": 0.7167, "learning_rate": 1.1445860897919951e-05, "epoch": 0.682339418155943, "percentage": 68.24, "elapsed_time": "4 days, 18:42:39", "remaining_time": "2 days, 5:23:21", "throughput": 2724.26, "total_tokens": 1125007296} {"current_steps": 6234, "total_steps": 9134, "loss": 1.0314, "learning_rate": 1.1438636520922807e-05, "epoch": 0.6824488902268808, "percentage": 68.25, "elapsed_time": "4 days, 18:43:45", "remaining_time": "2 days, 5:22:15", "throughput": 2724.3, "total_tokens": 1125205088} {"current_steps": 6235, "total_steps": 9134, "loss": 0.594, "learning_rate": 1.1431413748209021e-05, "epoch": 0.6825583622978187, "percentage": 68.26, "elapsed_time": "4 days, 18:44:50", "remaining_time": "2 days, 5:21:09", "throughput": 2724.32, "total_tokens": 1125390112} {"current_steps": 6236, "total_steps": 9134, "loss": 0.6734, "learning_rate": 1.1424192580633067e-05, "epoch": 0.6826678343687567, "percentage": 68.27, "elapsed_time": "4 days, 18:45:56", "remaining_time": "2 days, 5:20:02", "throughput": 2724.36, "total_tokens": 1125586560} {"current_steps": 6237, "total_steps": 9134, "loss": 0.6722, "learning_rate": 1.1416973019049156e-05, "epoch": 0.6827773064396946, "percentage": 68.28, "elapsed_time": "4 days, 18:47:06", "remaining_time": "2 days, 5:18:57", "throughput": 2724.39, "total_tokens": 1125789728} {"current_steps": 6238, "total_steps": 9134, "loss": 0.7834, "learning_rate": 1.1409755064311384e-05, "epoch": 0.6828867785106325, "percentage": 68.29, "elapsed_time": "4 days, 18:48:11", "remaining_time": "2 days, 5:17:51", "throughput": 2724.41, "total_tokens": 1125974304} {"current_steps": 6239, "total_steps": 9134, "loss": 0.6759, "learning_rate": 1.1402538717273605e-05, "epoch": 0.6829962505815704, "percentage": 68.31, "elapsed_time": "4 days, 18:49:20", "remaining_time": "2 days, 5:16:46", "throughput": 2724.48, "total_tokens": 1126190464} {"current_steps": 6240, "total_steps": 9134, "loss": 0.789, "learning_rate": 1.1395323978789504e-05, "epoch": 0.6831057226525082, "percentage": 68.32, "elapsed_time": "4 days, 18:50:26", "remaining_time": "2 days, 5:15:39", "throughput": 2724.48, "total_tokens": 1126371232} {"current_steps": 6241, "total_steps": 9134, "loss": 0.8276, "learning_rate": 1.138811084971257e-05, "epoch": 0.6832151947234462, "percentage": 68.33, "elapsed_time": "4 days, 18:51:33", "remaining_time": "2 days, 5:14:33", "throughput": 2724.52, "total_tokens": 1126569696} {"current_steps": 6242, "total_steps": 9134, "loss": 0.7347, "learning_rate": 1.1380899330896086e-05, "epoch": 0.6833246667943841, "percentage": 68.34, "elapsed_time": "4 days, 18:52:38", "remaining_time": "2 days, 5:13:27", "throughput": 2724.57, "total_tokens": 1126769280} {"current_steps": 6243, "total_steps": 9134, "loss": 0.7242, "learning_rate": 1.13736894231932e-05, "epoch": 0.683434138865322, "percentage": 68.35, "elapsed_time": "4 days, 18:53:43", "remaining_time": "2 days, 5:12:20", "throughput": 2724.56, "total_tokens": 1126942880} {"current_steps": 6244, "total_steps": 9134, "loss": 0.8621, "learning_rate": 1.1366481127456785e-05, "epoch": 0.6835436109362599, "percentage": 68.36, "elapsed_time": "4 days, 18:54:50", "remaining_time": "2 days, 5:11:14", "throughput": 2724.57, "total_tokens": 1127129024} {"current_steps": 6245, "total_steps": 9134, "loss": 0.8514, "learning_rate": 1.1359274444539596e-05, "epoch": 0.6836530830071977, "percentage": 68.37, "elapsed_time": "4 days, 18:55:54", "remaining_time": "2 days, 5:10:06", "throughput": 2724.58, "total_tokens": 1127304864} {"current_steps": 6246, "total_steps": 9134, "loss": 0.7992, "learning_rate": 1.1352069375294169e-05, "epoch": 0.6837625550781357, "percentage": 68.38, "elapsed_time": "4 days, 18:57:01", "remaining_time": "2 days, 5:09:01", "throughput": 2724.54, "total_tokens": 1127475776} {"current_steps": 6247, "total_steps": 9134, "loss": 0.9037, "learning_rate": 1.1344865920572842e-05, "epoch": 0.6838720271490736, "percentage": 68.39, "elapsed_time": "4 days, 18:58:08", "remaining_time": "2 days, 5:07:55", "throughput": 2724.51, "total_tokens": 1127643552} {"current_steps": 6248, "total_steps": 9134, "loss": 0.6161, "learning_rate": 1.1337664081227773e-05, "epoch": 0.6839814992200115, "percentage": 68.4, "elapsed_time": "4 days, 18:59:12", "remaining_time": "2 days, 5:06:47", "throughput": 2724.48, "total_tokens": 1127804832} {"current_steps": 6249, "total_steps": 9134, "loss": 0.952, "learning_rate": 1.1330463858110927e-05, "epoch": 0.6840909712909494, "percentage": 68.41, "elapsed_time": "4 days, 19:00:19", "remaining_time": "2 days, 5:05:42", "throughput": 2724.48, "total_tokens": 1127989856} {"current_steps": 6250, "total_steps": 9134, "loss": 0.8606, "learning_rate": 1.132326525207406e-05, "epoch": 0.6842004433618873, "percentage": 68.43, "elapsed_time": "4 days, 19:01:29", "remaining_time": "2 days, 5:04:37", "throughput": 2724.48, "total_tokens": 1128178464} {"current_steps": 6251, "total_steps": 9134, "loss": 0.9025, "learning_rate": 1.1316068263968793e-05, "epoch": 0.6843099154328252, "percentage": 68.44, "elapsed_time": "4 days, 19:02:31", "remaining_time": "2 days, 5:03:29", "throughput": 2724.45, "total_tokens": 1128336384} {"current_steps": 6252, "total_steps": 9134, "loss": 0.7587, "learning_rate": 1.130887289464647e-05, "epoch": 0.6844193875037631, "percentage": 68.45, "elapsed_time": "4 days, 19:03:39", "remaining_time": "2 days, 5:02:23", "throughput": 2724.49, "total_tokens": 1128537536} {"current_steps": 6253, "total_steps": 9134, "loss": 0.6645, "learning_rate": 1.1301679144958318e-05, "epoch": 0.684528859574701, "percentage": 68.46, "elapsed_time": "4 days, 19:04:39", "remaining_time": "2 days, 5:01:14", "throughput": 2724.46, "total_tokens": 1128690080} {"current_steps": 6254, "total_steps": 9134, "loss": 0.7183, "learning_rate": 1.1294487015755339e-05, "epoch": 0.6846383316456389, "percentage": 68.47, "elapsed_time": "4 days, 19:05:46", "remaining_time": "2 days, 5:00:08", "throughput": 2724.44, "total_tokens": 1128860096} {"current_steps": 6255, "total_steps": 9134, "loss": 0.8811, "learning_rate": 1.1287296507888345e-05, "epoch": 0.6847478037165768, "percentage": 68.48, "elapsed_time": "4 days, 19:06:55", "remaining_time": "2 days, 4:59:03", "throughput": 2724.46, "total_tokens": 1129056096} {"current_steps": 6256, "total_steps": 9134, "loss": 0.8225, "learning_rate": 1.1280107622207962e-05, "epoch": 0.6848572757875148, "percentage": 68.49, "elapsed_time": "4 days, 19:08:01", "remaining_time": "2 days, 4:57:57", "throughput": 2724.49, "total_tokens": 1129250752} {"current_steps": 6257, "total_steps": 9134, "loss": 0.8315, "learning_rate": 1.1272920359564607e-05, "epoch": 0.6849667478584526, "percentage": 68.5, "elapsed_time": "4 days, 19:09:07", "remaining_time": "2 days, 4:56:51", "throughput": 2724.46, "total_tokens": 1129418528} {"current_steps": 6258, "total_steps": 9134, "loss": 0.8788, "learning_rate": 1.1265734720808549e-05, "epoch": 0.6850762199293905, "percentage": 68.51, "elapsed_time": "4 days, 19:10:13", "remaining_time": "2 days, 4:55:44", "throughput": 2724.46, "total_tokens": 1129597728} {"current_steps": 6259, "total_steps": 9134, "loss": 1.1224, "learning_rate": 1.1258550706789803e-05, "epoch": 0.6851856920003284, "percentage": 68.52, "elapsed_time": "4 days, 19:11:19", "remaining_time": "2 days, 4:54:38", "throughput": 2724.48, "total_tokens": 1129783872} {"current_steps": 6260, "total_steps": 9134, "loss": 0.7769, "learning_rate": 1.1251368318358254e-05, "epoch": 0.6852951640712663, "percentage": 68.54, "elapsed_time": "4 days, 19:12:24", "remaining_time": "2 days, 4:53:31", "throughput": 2724.43, "total_tokens": 1129941792} {"current_steps": 6261, "total_steps": 9134, "loss": 0.8395, "learning_rate": 1.1244187556363536e-05, "epoch": 0.6854046361422043, "percentage": 68.55, "elapsed_time": "4 days, 19:13:32", "remaining_time": "2 days, 4:52:26", "throughput": 2724.47, "total_tokens": 1130145408} {"current_steps": 6262, "total_steps": 9134, "loss": 0.6023, "learning_rate": 1.123700842165514e-05, "epoch": 0.6855141082131421, "percentage": 68.56, "elapsed_time": "4 days, 19:14:39", "remaining_time": "2 days, 4:51:19", "throughput": 2724.53, "total_tokens": 1130351712} {"current_steps": 6263, "total_steps": 9134, "loss": 0.8637, "learning_rate": 1.1229830915082337e-05, "epoch": 0.68562358028408, "percentage": 68.57, "elapsed_time": "4 days, 19:15:47", "remaining_time": "2 days, 4:50:14", "throughput": 2724.55, "total_tokens": 1130546592} {"current_steps": 6264, "total_steps": 9134, "loss": 0.838, "learning_rate": 1.1222655037494215e-05, "epoch": 0.6857330523550179, "percentage": 68.58, "elapsed_time": "4 days, 19:16:52", "remaining_time": "2 days, 4:49:07", "throughput": 2724.56, "total_tokens": 1130727584} {"current_steps": 6265, "total_steps": 9134, "loss": 0.8799, "learning_rate": 1.1215480789739662e-05, "epoch": 0.6858425244259558, "percentage": 68.59, "elapsed_time": "4 days, 19:17:58", "remaining_time": "2 days, 4:48:01", "throughput": 2724.54, "total_tokens": 1130896480} {"current_steps": 6266, "total_steps": 9134, "loss": 0.7976, "learning_rate": 1.120830817266737e-05, "epoch": 0.6859519964968938, "percentage": 68.6, "elapsed_time": "4 days, 19:19:05", "remaining_time": "2 days, 4:46:55", "throughput": 2724.55, "total_tokens": 1131084640} {"current_steps": 6267, "total_steps": 9134, "loss": 0.8153, "learning_rate": 1.1201137187125876e-05, "epoch": 0.6860614685678317, "percentage": 68.61, "elapsed_time": "4 days, 19:20:10", "remaining_time": "2 days, 4:45:48", "throughput": 2724.58, "total_tokens": 1131271008} {"current_steps": 6268, "total_steps": 9134, "loss": 0.7176, "learning_rate": 1.1193967833963455e-05, "epoch": 0.6861709406387695, "percentage": 68.62, "elapsed_time": "4 days, 19:21:11", "remaining_time": "2 days, 4:44:39", "throughput": 2724.56, "total_tokens": 1131432960} {"current_steps": 6269, "total_steps": 9134, "loss": 0.7403, "learning_rate": 1.1186800114028268e-05, "epoch": 0.6862804127097074, "percentage": 68.63, "elapsed_time": "4 days, 19:22:17", "remaining_time": "2 days, 4:43:33", "throughput": 2724.59, "total_tokens": 1131625152} {"current_steps": 6270, "total_steps": 9134, "loss": 0.7302, "learning_rate": 1.1179634028168198e-05, "epoch": 0.6863898847806453, "percentage": 68.64, "elapsed_time": "4 days, 19:23:23", "remaining_time": "2 days, 4:42:27", "throughput": 2724.6, "total_tokens": 1131808384} {"current_steps": 6271, "total_steps": 9134, "loss": 0.6424, "learning_rate": 1.1172469577231016e-05, "epoch": 0.6864993568515833, "percentage": 68.66, "elapsed_time": "4 days, 19:24:23", "remaining_time": "2 days, 4:41:18", "throughput": 2724.52, "total_tokens": 1131938080} {"current_steps": 6272, "total_steps": 9134, "loss": 0.6995, "learning_rate": 1.1165306762064246e-05, "epoch": 0.6866088289225212, "percentage": 68.67, "elapsed_time": "4 days, 19:25:29", "remaining_time": "2 days, 4:40:11", "throughput": 2724.55, "total_tokens": 1132131616} {"current_steps": 6273, "total_steps": 9134, "loss": 0.7676, "learning_rate": 1.115814558351524e-05, "epoch": 0.6867183009934591, "percentage": 68.68, "elapsed_time": "4 days, 19:26:35", "remaining_time": "2 days, 4:39:05", "throughput": 2724.53, "total_tokens": 1132302752} {"current_steps": 6274, "total_steps": 9134, "loss": 0.9329, "learning_rate": 1.1150986042431147e-05, "epoch": 0.6868277730643969, "percentage": 68.69, "elapsed_time": "4 days, 19:27:39", "remaining_time": "2 days, 4:37:58", "throughput": 2724.54, "total_tokens": 1132481504} {"current_steps": 6275, "total_steps": 9134, "loss": 0.979, "learning_rate": 1.1143828139658924e-05, "epoch": 0.6869372451353348, "percentage": 68.7, "elapsed_time": "4 days, 19:28:45", "remaining_time": "2 days, 4:36:52", "throughput": 2724.54, "total_tokens": 1132662048} {"current_steps": 6276, "total_steps": 9134, "loss": 0.7348, "learning_rate": 1.1136671876045363e-05, "epoch": 0.6870467172062728, "percentage": 68.71, "elapsed_time": "4 days, 19:29:51", "remaining_time": "2 days, 4:35:45", "throughput": 2724.57, "total_tokens": 1132854688} {"current_steps": 6277, "total_steps": 9134, "loss": 0.5928, "learning_rate": 1.1129517252436996e-05, "epoch": 0.6871561892772107, "percentage": 68.72, "elapsed_time": "4 days, 19:31:00", "remaining_time": "2 days, 4:34:40", "throughput": 2724.56, "total_tokens": 1133035456} {"current_steps": 6278, "total_steps": 9134, "loss": 0.8864, "learning_rate": 1.1122364269680236e-05, "epoch": 0.6872656613481486, "percentage": 68.73, "elapsed_time": "4 days, 19:32:09", "remaining_time": "2 days, 4:33:35", "throughput": 2724.61, "total_tokens": 1133244448} {"current_steps": 6279, "total_steps": 9134, "loss": 0.7834, "learning_rate": 1.1115212928621249e-05, "epoch": 0.6873751334190864, "percentage": 68.74, "elapsed_time": "4 days, 19:33:12", "remaining_time": "2 days, 4:32:27", "throughput": 2724.54, "total_tokens": 1133388480} {"current_steps": 6280, "total_steps": 9134, "loss": 0.7376, "learning_rate": 1.1108063230106031e-05, "epoch": 0.6874846054900243, "percentage": 68.75, "elapsed_time": "4 days, 19:34:21", "remaining_time": "2 days, 4:31:22", "throughput": 2724.54, "total_tokens": 1133576416} {"current_steps": 6281, "total_steps": 9134, "loss": 0.8915, "learning_rate": 1.1100915174980375e-05, "epoch": 0.6875940775609622, "percentage": 68.77, "elapsed_time": "4 days, 19:35:27", "remaining_time": "2 days, 4:30:16", "throughput": 2724.58, "total_tokens": 1133771072} {"current_steps": 6282, "total_steps": 9134, "loss": 0.814, "learning_rate": 1.1093768764089881e-05, "epoch": 0.6877035496319002, "percentage": 68.78, "elapsed_time": "4 days, 19:36:32", "remaining_time": "2 days, 4:29:09", "throughput": 2724.6, "total_tokens": 1133956096} {"current_steps": 6283, "total_steps": 9134, "loss": 0.7482, "learning_rate": 1.1086623998279963e-05, "epoch": 0.6878130217028381, "percentage": 68.79, "elapsed_time": "4 days, 19:37:38", "remaining_time": "2 days, 4:28:03", "throughput": 2724.6, "total_tokens": 1134137088} {"current_steps": 6284, "total_steps": 9134, "loss": 0.8329, "learning_rate": 1.1079480878395817e-05, "epoch": 0.687922493773776, "percentage": 68.8, "elapsed_time": "4 days, 19:38:44", "remaining_time": "2 days, 4:26:56", "throughput": 2724.59, "total_tokens": 1134311584} {"current_steps": 6285, "total_steps": 9134, "loss": 0.7921, "learning_rate": 1.107233940528248e-05, "epoch": 0.6880319658447138, "percentage": 68.81, "elapsed_time": "4 days, 19:39:52", "remaining_time": "2 days, 4:25:51", "throughput": 2724.62, "total_tokens": 1134512064} {"current_steps": 6286, "total_steps": 9134, "loss": 0.7124, "learning_rate": 1.1065199579784767e-05, "epoch": 0.6881414379156517, "percentage": 68.82, "elapsed_time": "4 days, 19:40:58", "remaining_time": "2 days, 4:24:45", "throughput": 2724.6, "total_tokens": 1134682080} {"current_steps": 6287, "total_steps": 9134, "loss": 0.7193, "learning_rate": 1.1058061402747305e-05, "epoch": 0.6882509099865897, "percentage": 68.83, "elapsed_time": "4 days, 19:42:06", "remaining_time": "2 days, 4:23:39", "throughput": 2724.58, "total_tokens": 1134857696} {"current_steps": 6288, "total_steps": 9134, "loss": 0.6807, "learning_rate": 1.1050924875014527e-05, "epoch": 0.6883603820575276, "percentage": 68.84, "elapsed_time": "4 days, 19:43:12", "remaining_time": "2 days, 4:22:32", "throughput": 2724.59, "total_tokens": 1135041824} {"current_steps": 6289, "total_steps": 9134, "loss": 0.7353, "learning_rate": 1.1043789997430668e-05, "epoch": 0.6884698541284655, "percentage": 68.85, "elapsed_time": "4 days, 19:44:18", "remaining_time": "2 days, 4:21:26", "throughput": 2724.61, "total_tokens": 1135229760} {"current_steps": 6290, "total_steps": 9134, "loss": 0.6339, "learning_rate": 1.1036656770839774e-05, "epoch": 0.6885793261994034, "percentage": 68.86, "elapsed_time": "4 days, 19:45:21", "remaining_time": "2 days, 4:20:18", "throughput": 2724.61, "total_tokens": 1135401792} {"current_steps": 6291, "total_steps": 9134, "loss": 0.7396, "learning_rate": 1.1029525196085691e-05, "epoch": 0.6886887982703412, "percentage": 68.87, "elapsed_time": "4 days, 19:46:23", "remaining_time": "2 days, 4:19:10", "throughput": 2724.6, "total_tokens": 1135569568} {"current_steps": 6292, "total_steps": 9134, "loss": 0.8012, "learning_rate": 1.102239527401206e-05, "epoch": 0.6887982703412792, "percentage": 68.89, "elapsed_time": "4 days, 19:47:24", "remaining_time": "2 days, 4:18:02", "throughput": 2724.59, "total_tokens": 1135728384} {"current_steps": 6293, "total_steps": 9134, "loss": 0.9246, "learning_rate": 1.1015267005462366e-05, "epoch": 0.6889077424122171, "percentage": 68.9, "elapsed_time": "4 days, 19:48:28", "remaining_time": "2 days, 4:16:54", "throughput": 2724.6, "total_tokens": 1135907136} {"current_steps": 6294, "total_steps": 9134, "loss": 0.8184, "learning_rate": 1.1008140391279834e-05, "epoch": 0.689017214483155, "percentage": 68.91, "elapsed_time": "4 days, 19:49:34", "remaining_time": "2 days, 4:15:48", "throughput": 2724.63, "total_tokens": 1136100000} {"current_steps": 6295, "total_steps": 9134, "loss": 0.8115, "learning_rate": 1.1001015432307554e-05, "epoch": 0.6891266865540929, "percentage": 68.92, "elapsed_time": "4 days, 19:50:43", "remaining_time": "2 days, 4:14:43", "throughput": 2724.66, "total_tokens": 1136301376} {"current_steps": 6296, "total_steps": 9134, "loss": 0.8367, "learning_rate": 1.0993892129388385e-05, "epoch": 0.6892361586250307, "percentage": 68.93, "elapsed_time": "4 days, 19:51:48", "remaining_time": "2 days, 4:13:36", "throughput": 2724.67, "total_tokens": 1136484608} {"current_steps": 6297, "total_steps": 9134, "loss": 0.8339, "learning_rate": 1.0986770483365005e-05, "epoch": 0.6893456306959687, "percentage": 68.94, "elapsed_time": "4 days, 19:52:54", "remaining_time": "2 days, 4:12:30", "throughput": 2724.68, "total_tokens": 1136664480} {"current_steps": 6298, "total_steps": 9134, "loss": 0.8491, "learning_rate": 1.0979650495079888e-05, "epoch": 0.6894551027669066, "percentage": 68.95, "elapsed_time": "4 days, 19:53:55", "remaining_time": "2 days, 4:11:21", "throughput": 2724.63, "total_tokens": 1136812320} {"current_steps": 6299, "total_steps": 9134, "loss": 0.7752, "learning_rate": 1.0972532165375305e-05, "epoch": 0.6895645748378445, "percentage": 68.96, "elapsed_time": "4 days, 19:55:04", "remaining_time": "2 days, 4:10:16", "throughput": 2724.68, "total_tokens": 1137021312} {"current_steps": 6300, "total_steps": 9134, "loss": 0.8371, "learning_rate": 1.0965415495093368e-05, "epoch": 0.6896740469087824, "percentage": 68.97, "elapsed_time": "4 days, 19:56:11", "remaining_time": "2 days, 4:09:11", "throughput": 2724.68, "total_tokens": 1137206336} {"current_steps": 6301, "total_steps": 9134, "loss": 0.9483, "learning_rate": 1.0958300485075931e-05, "epoch": 0.6897835189797203, "percentage": 68.98, "elapsed_time": "4 days, 19:57:17", "remaining_time": "2 days, 4:08:04", "throughput": 2724.62, "total_tokens": 1137359104} {"current_steps": 6302, "total_steps": 9134, "loss": 0.6081, "learning_rate": 1.095118713616472e-05, "epoch": 0.6898929910506582, "percentage": 68.99, "elapsed_time": "4 days, 19:58:23", "remaining_time": "2 days, 4:06:58", "throughput": 2724.61, "total_tokens": 1137535392} {"current_steps": 6303, "total_steps": 9134, "loss": 0.6693, "learning_rate": 1.09440754492012e-05, "epoch": 0.6900024631215961, "percentage": 69.01, "elapsed_time": "4 days, 19:59:29", "remaining_time": "2 days, 4:05:51", "throughput": 2724.62, "total_tokens": 1137717280} {"current_steps": 6304, "total_steps": 9134, "loss": 0.8012, "learning_rate": 1.093696542502669e-05, "epoch": 0.690111935192534, "percentage": 69.02, "elapsed_time": "4 days, 20:00:35", "remaining_time": "2 days, 4:04:45", "throughput": 2724.61, "total_tokens": 1137894016} {"current_steps": 6305, "total_steps": 9134, "loss": 0.8489, "learning_rate": 1.0929857064482285e-05, "epoch": 0.6902214072634719, "percentage": 69.03, "elapsed_time": "4 days, 20:01:43", "remaining_time": "2 days, 4:03:39", "throughput": 2724.63, "total_tokens": 1138088448} {"current_steps": 6306, "total_steps": 9134, "loss": 0.6417, "learning_rate": 1.0922750368408896e-05, "epoch": 0.6903308793344098, "percentage": 69.04, "elapsed_time": "4 days, 20:02:50", "remaining_time": "2 days, 4:02:34", "throughput": 2724.6, "total_tokens": 1138257344} {"current_steps": 6307, "total_steps": 9134, "loss": 0.7816, "learning_rate": 1.0915645337647224e-05, "epoch": 0.6904403514053478, "percentage": 69.05, "elapsed_time": "4 days, 20:03:52", "remaining_time": "2 days, 4:01:25", "throughput": 2724.55, "total_tokens": 1138405632} {"current_steps": 6308, "total_steps": 9134, "loss": 0.762, "learning_rate": 1.0908541973037775e-05, "epoch": 0.6905498234762856, "percentage": 69.06, "elapsed_time": "4 days, 20:04:59", "remaining_time": "2 days, 4:00:20", "throughput": 2724.51, "total_tokens": 1138571168} {"current_steps": 6309, "total_steps": 9134, "loss": 0.7214, "learning_rate": 1.090144027542089e-05, "epoch": 0.6906592955472235, "percentage": 69.07, "elapsed_time": "4 days, 20:06:03", "remaining_time": "2 days, 3:59:12", "throughput": 2724.55, "total_tokens": 1138761344} {"current_steps": 6310, "total_steps": 9134, "loss": 0.731, "learning_rate": 1.0894340245636652e-05, "epoch": 0.6907687676181614, "percentage": 69.08, "elapsed_time": "4 days, 20:07:12", "remaining_time": "2 days, 3:58:07", "throughput": 2724.54, "total_tokens": 1138947712} {"current_steps": 6311, "total_steps": 9134, "loss": 0.6828, "learning_rate": 1.0887241884525014e-05, "epoch": 0.6908782396890993, "percentage": 69.09, "elapsed_time": "4 days, 20:08:12", "remaining_time": "2 days, 3:56:58", "throughput": 2724.48, "total_tokens": 1139087040} {"current_steps": 6312, "total_steps": 9134, "loss": 1.0169, "learning_rate": 1.0880145192925666e-05, "epoch": 0.6909877117600373, "percentage": 69.1, "elapsed_time": "4 days, 20:09:20", "remaining_time": "2 days, 3:55:53", "throughput": 2724.53, "total_tokens": 1139290432} {"current_steps": 6313, "total_steps": 9134, "loss": 1.306, "learning_rate": 1.087305017167816e-05, "epoch": 0.6910971838309751, "percentage": 69.12, "elapsed_time": "4 days, 20:10:29", "remaining_time": "2 days, 3:54:48", "throughput": 2724.61, "total_tokens": 1139510624} {"current_steps": 6314, "total_steps": 9134, "loss": 0.6743, "learning_rate": 1.0865956821621808e-05, "epoch": 0.691206655901913, "percentage": 69.13, "elapsed_time": "4 days, 20:11:33", "remaining_time": "2 days, 3:53:41", "throughput": 2724.6, "total_tokens": 1139683552} {"current_steps": 6315, "total_steps": 9134, "loss": 0.6142, "learning_rate": 1.0858865143595749e-05, "epoch": 0.6913161279728509, "percentage": 69.14, "elapsed_time": "4 days, 20:12:43", "remaining_time": "2 days, 3:52:36", "throughput": 2724.61, "total_tokens": 1139876640} {"current_steps": 6316, "total_steps": 9134, "loss": 0.9913, "learning_rate": 1.0851775138438906e-05, "epoch": 0.6914256000437888, "percentage": 69.15, "elapsed_time": "4 days, 20:13:48", "remaining_time": "2 days, 3:51:29", "throughput": 2724.62, "total_tokens": 1140058528} {"current_steps": 6317, "total_steps": 9134, "loss": 0.5566, "learning_rate": 1.084468680699001e-05, "epoch": 0.6915350721147268, "percentage": 69.16, "elapsed_time": "4 days, 20:14:55", "remaining_time": "2 days, 3:50:23", "throughput": 2724.65, "total_tokens": 1140255872} {"current_steps": 6318, "total_steps": 9134, "loss": 0.7737, "learning_rate": 1.0837600150087612e-05, "epoch": 0.6916445441856647, "percentage": 69.17, "elapsed_time": "4 days, 20:16:04", "remaining_time": "2 days, 3:49:18", "throughput": 2724.75, "total_tokens": 1140482560} {"current_steps": 6319, "total_steps": 9134, "loss": 0.889, "learning_rate": 1.0830515168570043e-05, "epoch": 0.6917540162566025, "percentage": 69.18, "elapsed_time": "4 days, 20:17:11", "remaining_time": "2 days, 3:48:12", "throughput": 2724.75, "total_tokens": 1140664224} {"current_steps": 6320, "total_steps": 9134, "loss": 0.8727, "learning_rate": 1.0823431863275443e-05, "epoch": 0.6918634883275404, "percentage": 69.19, "elapsed_time": "4 days, 20:18:19", "remaining_time": "2 days, 3:47:07", "throughput": 2724.74, "total_tokens": 1140848352} {"current_steps": 6321, "total_steps": 9134, "loss": 0.8677, "learning_rate": 1.081635023504175e-05, "epoch": 0.6919729603984783, "percentage": 69.2, "elapsed_time": "4 days, 20:19:23", "remaining_time": "2 days, 3:46:00", "throughput": 2724.76, "total_tokens": 1141030912} {"current_steps": 6322, "total_steps": 9134, "loss": 0.6294, "learning_rate": 1.0809270284706713e-05, "epoch": 0.6920824324694163, "percentage": 69.21, "elapsed_time": "4 days, 20:20:26", "remaining_time": "2 days, 3:44:52", "throughput": 2724.73, "total_tokens": 1141190400} {"current_steps": 6323, "total_steps": 9134, "loss": 0.7092, "learning_rate": 1.0802192013107873e-05, "epoch": 0.6921919045403542, "percentage": 69.22, "elapsed_time": "4 days, 20:21:29", "remaining_time": "2 days, 3:43:44", "throughput": 2724.74, "total_tokens": 1141365344} {"current_steps": 6324, "total_steps": 9134, "loss": 0.8443, "learning_rate": 1.0795115421082574e-05, "epoch": 0.6923013766112921, "percentage": 69.24, "elapsed_time": "4 days, 20:22:37", "remaining_time": "2 days, 3:42:39", "throughput": 2724.74, "total_tokens": 1141551040} {"current_steps": 6325, "total_steps": 9134, "loss": 0.7903, "learning_rate": 1.0788040509467958e-05, "epoch": 0.6924108486822299, "percentage": 69.25, "elapsed_time": "4 days, 20:23:46", "remaining_time": "2 days, 3:41:33", "throughput": 2724.78, "total_tokens": 1141755104} {"current_steps": 6326, "total_steps": 9134, "loss": 0.8951, "learning_rate": 1.078096727910099e-05, "epoch": 0.6925203207531678, "percentage": 69.26, "elapsed_time": "4 days, 20:24:54", "remaining_time": "2 days, 3:40:28", "throughput": 2724.78, "total_tokens": 1141941920} {"current_steps": 6327, "total_steps": 9134, "loss": 0.7337, "learning_rate": 1.0773895730818409e-05, "epoch": 0.6926297928241057, "percentage": 69.27, "elapsed_time": "4 days, 20:25:59", "remaining_time": "2 days, 3:39:21", "throughput": 2724.77, "total_tokens": 1142111040} {"current_steps": 6328, "total_steps": 9134, "loss": 0.8593, "learning_rate": 1.076682586545677e-05, "epoch": 0.6927392648950437, "percentage": 69.28, "elapsed_time": "4 days, 20:27:08", "remaining_time": "2 days, 3:38:16", "throughput": 2724.78, "total_tokens": 1142306368} {"current_steps": 6329, "total_steps": 9134, "loss": 0.7259, "learning_rate": 1.075975768385242e-05, "epoch": 0.6928487369659816, "percentage": 69.29, "elapsed_time": "4 days, 20:28:14", "remaining_time": "2 days, 3:37:10", "throughput": 2724.79, "total_tokens": 1142488928} {"current_steps": 6330, "total_steps": 9134, "loss": 0.6954, "learning_rate": 1.0752691186841516e-05, "epoch": 0.6929582090369194, "percentage": 69.3, "elapsed_time": "4 days, 20:29:14", "remaining_time": "2 days, 3:36:01", "throughput": 2724.76, "total_tokens": 1142641248} {"current_steps": 6331, "total_steps": 9134, "loss": 0.8957, "learning_rate": 1.0745626375260004e-05, "epoch": 0.6930676811078573, "percentage": 69.31, "elapsed_time": "4 days, 20:30:18", "remaining_time": "2 days, 3:34:54", "throughput": 2724.75, "total_tokens": 1142809472} {"current_steps": 6332, "total_steps": 9134, "loss": 0.6792, "learning_rate": 1.0738563249943637e-05, "epoch": 0.6931771531787952, "percentage": 69.32, "elapsed_time": "4 days, 20:31:18", "remaining_time": "2 days, 3:33:45", "throughput": 2724.68, "total_tokens": 1142945888} {"current_steps": 6333, "total_steps": 9134, "loss": 0.7611, "learning_rate": 1.073150181172799e-05, "epoch": 0.6932866252497332, "percentage": 69.33, "elapsed_time": "4 days, 20:32:22", "remaining_time": "2 days, 3:32:38", "throughput": 2724.68, "total_tokens": 1143118368} {"current_steps": 6334, "total_steps": 9134, "loss": 0.8674, "learning_rate": 1.0724442061448383e-05, "epoch": 0.6933960973206711, "percentage": 69.35, "elapsed_time": "4 days, 20:33:27", "remaining_time": "2 days, 3:31:31", "throughput": 2724.67, "total_tokens": 1143291744} {"current_steps": 6335, "total_steps": 9134, "loss": 0.8049, "learning_rate": 1.0717383999940011e-05, "epoch": 0.693505569391609, "percentage": 69.36, "elapsed_time": "4 days, 20:34:34", "remaining_time": "2 days, 3:30:25", "throughput": 2724.69, "total_tokens": 1143481024} {"current_steps": 6336, "total_steps": 9134, "loss": 0.7893, "learning_rate": 1.0710327628037788e-05, "epoch": 0.6936150414625468, "percentage": 69.37, "elapsed_time": "4 days, 20:35:39", "remaining_time": "2 days, 3:29:18", "throughput": 2724.67, "total_tokens": 1143651488} {"current_steps": 6337, "total_steps": 9134, "loss": 0.8885, "learning_rate": 1.0703272946576501e-05, "epoch": 0.6937245135334847, "percentage": 69.38, "elapsed_time": "4 days, 20:36:47", "remaining_time": "2 days, 3:28:12", "throughput": 2724.68, "total_tokens": 1143840768} {"current_steps": 6338, "total_steps": 9134, "loss": 0.9201, "learning_rate": 1.069621995639069e-05, "epoch": 0.6938339856044227, "percentage": 69.39, "elapsed_time": "4 days, 20:37:51", "remaining_time": "2 days, 3:27:05", "throughput": 2724.66, "total_tokens": 1144006752} {"current_steps": 6339, "total_steps": 9134, "loss": 0.7376, "learning_rate": 1.0689168658314708e-05, "epoch": 0.6939434576753606, "percentage": 69.4, "elapsed_time": "4 days, 20:38:55", "remaining_time": "2 days, 3:25:58", "throughput": 2724.66, "total_tokens": 1144179680} {"current_steps": 6340, "total_steps": 9134, "loss": 0.9221, "learning_rate": 1.0682119053182731e-05, "epoch": 0.6940529297462985, "percentage": 69.41, "elapsed_time": "4 days, 20:40:00", "remaining_time": "2 days, 3:24:51", "throughput": 2724.66, "total_tokens": 1144360448} {"current_steps": 6341, "total_steps": 9134, "loss": 1.0042, "learning_rate": 1.0675071141828682e-05, "epoch": 0.6941624018172364, "percentage": 69.42, "elapsed_time": "4 days, 20:41:05", "remaining_time": "2 days, 3:23:44", "throughput": 2724.63, "total_tokens": 1144523968} {"current_steps": 6342, "total_steps": 9134, "loss": 1.052, "learning_rate": 1.0668024925086353e-05, "epoch": 0.6942718738881742, "percentage": 69.43, "elapsed_time": "4 days, 20:42:12", "remaining_time": "2 days, 3:22:38", "throughput": 2724.65, "total_tokens": 1144714368} {"current_steps": 6343, "total_steps": 9134, "loss": 0.5977, "learning_rate": 1.0660980403789256e-05, "epoch": 0.6943813459591122, "percentage": 69.44, "elapsed_time": "4 days, 20:43:16", "remaining_time": "2 days, 3:21:31", "throughput": 2724.69, "total_tokens": 1144902976} {"current_steps": 6344, "total_steps": 9134, "loss": 0.6321, "learning_rate": 1.0653937578770787e-05, "epoch": 0.6944908180300501, "percentage": 69.45, "elapsed_time": "4 days, 20:44:23", "remaining_time": "2 days, 3:20:25", "throughput": 2724.68, "total_tokens": 1145082176} {"current_steps": 6345, "total_steps": 9134, "loss": 0.6477, "learning_rate": 1.0646896450864056e-05, "epoch": 0.694600290100988, "percentage": 69.47, "elapsed_time": "4 days, 20:45:28", "remaining_time": "2 days, 3:19:19", "throughput": 2724.66, "total_tokens": 1145253984} {"current_steps": 6346, "total_steps": 9134, "loss": 0.7436, "learning_rate": 1.0639857020902048e-05, "epoch": 0.6947097621719259, "percentage": 69.48, "elapsed_time": "4 days, 20:46:29", "remaining_time": "2 days, 3:18:10", "throughput": 2724.64, "total_tokens": 1145411904} {"current_steps": 6347, "total_steps": 9134, "loss": 0.7433, "learning_rate": 1.0632819289717499e-05, "epoch": 0.6948192342428637, "percentage": 69.49, "elapsed_time": "4 days, 20:47:34", "remaining_time": "2 days, 3:17:03", "throughput": 2724.66, "total_tokens": 1145597152} {"current_steps": 6348, "total_steps": 9134, "loss": 0.7622, "learning_rate": 1.0625783258142965e-05, "epoch": 0.6949287063138017, "percentage": 69.5, "elapsed_time": "4 days, 20:48:42", "remaining_time": "2 days, 3:15:58", "throughput": 2724.68, "total_tokens": 1145787552} {"current_steps": 6349, "total_steps": 9134, "loss": 1.0516, "learning_rate": 1.0618748927010794e-05, "epoch": 0.6950381783847396, "percentage": 69.51, "elapsed_time": "4 days, 20:49:49", "remaining_time": "2 days, 3:14:52", "throughput": 2724.74, "total_tokens": 1145996544} {"current_steps": 6350, "total_steps": 9134, "loss": 0.7735, "learning_rate": 1.0611716297153121e-05, "epoch": 0.6951476504556775, "percentage": 69.52, "elapsed_time": "4 days, 20:50:54", "remaining_time": "2 days, 3:13:45", "throughput": 2724.72, "total_tokens": 1146165664} {"current_steps": 6351, "total_steps": 9134, "loss": 0.4957, "learning_rate": 1.0604685369401923e-05, "epoch": 0.6952571225266154, "percentage": 69.53, "elapsed_time": "4 days, 20:52:00", "remaining_time": "2 days, 3:12:39", "throughput": 2724.73, "total_tokens": 1146351808} {"current_steps": 6352, "total_steps": 9134, "loss": 0.7416, "learning_rate": 1.059765614458891e-05, "epoch": 0.6953665945975533, "percentage": 69.54, "elapsed_time": "4 days, 20:53:05", "remaining_time": "2 days, 3:11:32", "throughput": 2724.73, "total_tokens": 1146524736} {"current_steps": 6353, "total_steps": 9134, "loss": 0.7054, "learning_rate": 1.059062862354565e-05, "epoch": 0.6954760666684912, "percentage": 69.55, "elapsed_time": "4 days, 20:54:13", "remaining_time": "2 days, 3:10:26", "throughput": 2724.78, "total_tokens": 1146733056} {"current_steps": 6354, "total_steps": 9134, "loss": 1.0509, "learning_rate": 1.0583602807103479e-05, "epoch": 0.6955855387394291, "percentage": 69.56, "elapsed_time": "4 days, 20:55:18", "remaining_time": "2 days, 3:09:20", "throughput": 2724.78, "total_tokens": 1146908896} {"current_steps": 6355, "total_steps": 9134, "loss": 0.7343, "learning_rate": 1.0576578696093536e-05, "epoch": 0.695695010810367, "percentage": 69.58, "elapsed_time": "4 days, 20:56:24", "remaining_time": "2 days, 3:08:13", "throughput": 2724.82, "total_tokens": 1147107808} {"current_steps": 6356, "total_steps": 9134, "loss": 0.7191, "learning_rate": 1.0569556291346761e-05, "epoch": 0.6958044828813049, "percentage": 69.59, "elapsed_time": "4 days, 20:57:33", "remaining_time": "2 days, 3:07:08", "throughput": 2724.84, "total_tokens": 1147302688} {"current_steps": 6357, "total_steps": 9134, "loss": 0.7672, "learning_rate": 1.056253559369389e-05, "epoch": 0.6959139549522428, "percentage": 69.6, "elapsed_time": "4 days, 20:58:37", "remaining_time": "2 days, 3:06:01", "throughput": 2724.83, "total_tokens": 1147474944} {"current_steps": 6358, "total_steps": 9134, "loss": 0.7266, "learning_rate": 1.0555516603965457e-05, "epoch": 0.6960234270231808, "percentage": 69.61, "elapsed_time": "4 days, 20:59:38", "remaining_time": "2 days, 3:04:52", "throughput": 2724.79, "total_tokens": 1147623008} {"current_steps": 6359, "total_steps": 9134, "loss": 0.9644, "learning_rate": 1.0548499322991789e-05, "epoch": 0.6961328990941186, "percentage": 69.62, "elapsed_time": "4 days, 21:00:43", "remaining_time": "2 days, 3:03:46", "throughput": 2724.81, "total_tokens": 1147806464} {"current_steps": 6360, "total_steps": 9134, "loss": 0.6975, "learning_rate": 1.0541483751603031e-05, "epoch": 0.6962423711650565, "percentage": 69.63, "elapsed_time": "4 days, 21:01:49", "remaining_time": "2 days, 3:02:39", "throughput": 2724.8, "total_tokens": 1147986112} {"current_steps": 6361, "total_steps": 9134, "loss": 0.8517, "learning_rate": 1.0534469890629109e-05, "epoch": 0.6963518432359944, "percentage": 69.64, "elapsed_time": "4 days, 21:02:54", "remaining_time": "2 days, 3:01:33", "throughput": 2724.82, "total_tokens": 1148167776} {"current_steps": 6362, "total_steps": 9134, "loss": 0.825, "learning_rate": 1.0527457740899744e-05, "epoch": 0.6964613153069323, "percentage": 69.65, "elapsed_time": "4 days, 21:04:03", "remaining_time": "2 days, 3:00:27", "throughput": 2724.9, "total_tokens": 1148389088} {"current_steps": 6363, "total_steps": 9134, "loss": 0.7819, "learning_rate": 1.0520447303244463e-05, "epoch": 0.6965707873778703, "percentage": 69.66, "elapsed_time": "4 days, 21:05:09", "remaining_time": "2 days, 2:59:21", "throughput": 2724.95, "total_tokens": 1148592928} {"current_steps": 6364, "total_steps": 9134, "loss": 0.6988, "learning_rate": 1.0513438578492582e-05, "epoch": 0.6966802594488081, "percentage": 69.67, "elapsed_time": "4 days, 21:06:10", "remaining_time": "2 days, 2:58:13", "throughput": 2724.91, "total_tokens": 1148741216} {"current_steps": 6365, "total_steps": 9134, "loss": 0.7086, "learning_rate": 1.0506431567473226e-05, "epoch": 0.696789731519746, "percentage": 69.68, "elapsed_time": "4 days, 21:07:19", "remaining_time": "2 days, 2:57:07", "throughput": 2724.95, "total_tokens": 1148943264} {"current_steps": 6366, "total_steps": 9134, "loss": 0.5867, "learning_rate": 1.049942627101531e-05, "epoch": 0.6968992035906839, "percentage": 69.7, "elapsed_time": "4 days, 21:08:24", "remaining_time": "2 days, 2:56:01", "throughput": 2725.0, "total_tokens": 1149144640} {"current_steps": 6367, "total_steps": 9134, "loss": 0.8374, "learning_rate": 1.0492422689947534e-05, "epoch": 0.6970086756616218, "percentage": 69.71, "elapsed_time": "4 days, 21:09:30", "remaining_time": "2 days, 2:54:54", "throughput": 2724.99, "total_tokens": 1149319808} {"current_steps": 6368, "total_steps": 9134, "loss": 0.8275, "learning_rate": 1.048542082509843e-05, "epoch": 0.6971181477325598, "percentage": 69.72, "elapsed_time": "4 days, 21:10:36", "remaining_time": "2 days, 2:53:48", "throughput": 2725.0, "total_tokens": 1149503040} {"current_steps": 6369, "total_steps": 9134, "loss": 0.7418, "learning_rate": 1.0478420677296297e-05, "epoch": 0.6972276198034977, "percentage": 69.73, "elapsed_time": "4 days, 21:11:39", "remaining_time": "2 days, 2:52:41", "throughput": 2724.99, "total_tokens": 1149674400} {"current_steps": 6370, "total_steps": 9134, "loss": 0.8802, "learning_rate": 1.0471422247369233e-05, "epoch": 0.6973370918744355, "percentage": 69.74, "elapsed_time": "4 days, 21:12:46", "remaining_time": "2 days, 2:51:34", "throughput": 2724.95, "total_tokens": 1149838368} {"current_steps": 6371, "total_steps": 9134, "loss": 0.9948, "learning_rate": 1.0464425536145148e-05, "epoch": 0.6974465639453734, "percentage": 69.75, "elapsed_time": "4 days, 21:13:54", "remaining_time": "2 days, 2:50:29", "throughput": 2725.02, "total_tokens": 1150051616} {"current_steps": 6372, "total_steps": 9134, "loss": 0.7484, "learning_rate": 1.0457430544451733e-05, "epoch": 0.6975560360163113, "percentage": 69.76, "elapsed_time": "4 days, 21:14:58", "remaining_time": "2 days, 2:49:22", "throughput": 2725.03, "total_tokens": 1150233728} {"current_steps": 6373, "total_steps": 9134, "loss": 0.857, "learning_rate": 1.0450437273116484e-05, "epoch": 0.6976655080872493, "percentage": 69.77, "elapsed_time": "4 days, 21:16:05", "remaining_time": "2 days, 2:48:16", "throughput": 2725.02, "total_tokens": 1150407104} {"current_steps": 6374, "total_steps": 9134, "loss": 0.6776, "learning_rate": 1.044344572296668e-05, "epoch": 0.6977749801581872, "percentage": 69.78, "elapsed_time": "4 days, 21:17:10", "remaining_time": "2 days, 2:47:09", "throughput": 2725.0, "total_tokens": 1150579584} {"current_steps": 6375, "total_steps": 9134, "loss": 0.9439, "learning_rate": 1.0436455894829442e-05, "epoch": 0.6978844522291251, "percentage": 69.79, "elapsed_time": "4 days, 21:18:16", "remaining_time": "2 days, 2:46:03", "throughput": 2725.0, "total_tokens": 1150759904} {"current_steps": 6376, "total_steps": 9134, "loss": 0.8197, "learning_rate": 1.0429467789531608e-05, "epoch": 0.6979939243000629, "percentage": 69.81, "elapsed_time": "4 days, 21:19:22", "remaining_time": "2 days, 2:44:56", "throughput": 2724.94, "total_tokens": 1150913344} {"current_steps": 6377, "total_steps": 9134, "loss": 0.6964, "learning_rate": 1.04224814078999e-05, "epoch": 0.6981033963710008, "percentage": 69.82, "elapsed_time": "4 days, 21:20:27", "remaining_time": "2 days, 2:43:50", "throughput": 2724.94, "total_tokens": 1151088512} {"current_steps": 6378, "total_steps": 9134, "loss": 0.5428, "learning_rate": 1.041549675076076e-05, "epoch": 0.6982128684419387, "percentage": 69.83, "elapsed_time": "4 days, 21:21:33", "remaining_time": "2 days, 2:42:43", "throughput": 2724.88, "total_tokens": 1151246432} {"current_steps": 6379, "total_steps": 9134, "loss": 0.8796, "learning_rate": 1.0408513818940477e-05, "epoch": 0.6983223405128767, "percentage": 69.84, "elapsed_time": "4 days, 21:22:42", "remaining_time": "2 days, 2:41:38", "throughput": 2724.9, "total_tokens": 1151439744} {"current_steps": 6380, "total_steps": 9134, "loss": 0.7313, "learning_rate": 1.040153261326512e-05, "epoch": 0.6984318125838146, "percentage": 69.85, "elapsed_time": "4 days, 21:23:50", "remaining_time": "2 days, 2:40:33", "throughput": 2724.91, "total_tokens": 1151627456} {"current_steps": 6381, "total_steps": 9134, "loss": 0.8966, "learning_rate": 1.0394553134560533e-05, "epoch": 0.6985412846547524, "percentage": 69.86, "elapsed_time": "4 days, 21:24:59", "remaining_time": "2 days, 2:39:28", "throughput": 2724.97, "total_tokens": 1151844736} {"current_steps": 6382, "total_steps": 9134, "loss": 0.7179, "learning_rate": 1.0387575383652411e-05, "epoch": 0.6986507567256903, "percentage": 69.87, "elapsed_time": "4 days, 21:26:07", "remaining_time": "2 days, 2:38:22", "throughput": 2725.0, "total_tokens": 1152041408} {"current_steps": 6383, "total_steps": 9134, "loss": 0.7517, "learning_rate": 1.0380599361366169e-05, "epoch": 0.6987602287966282, "percentage": 69.88, "elapsed_time": "4 days, 21:27:15", "remaining_time": "2 days, 2:37:17", "throughput": 2725.0, "total_tokens": 1152227776} {"current_steps": 6384, "total_steps": 9134, "loss": 0.6359, "learning_rate": 1.037362506852709e-05, "epoch": 0.6988697008675662, "percentage": 69.89, "elapsed_time": "4 days, 21:28:20", "remaining_time": "2 days, 2:36:10", "throughput": 2724.98, "total_tokens": 1152395776} {"current_steps": 6385, "total_steps": 9134, "loss": 0.8278, "learning_rate": 1.036665250596019e-05, "epoch": 0.6989791729385041, "percentage": 69.9, "elapsed_time": "4 days, 21:29:27", "remaining_time": "2 days, 2:35:04", "throughput": 2725.0, "total_tokens": 1152586400} {"current_steps": 6386, "total_steps": 9134, "loss": 0.8987, "learning_rate": 1.0359681674490332e-05, "epoch": 0.699088645009442, "percentage": 69.91, "elapsed_time": "4 days, 21:30:36", "remaining_time": "2 days, 2:33:59", "throughput": 2725.07, "total_tokens": 1152802336} {"current_steps": 6387, "total_steps": 9134, "loss": 0.734, "learning_rate": 1.0352712574942144e-05, "epoch": 0.6991981170803798, "percentage": 69.93, "elapsed_time": "4 days, 21:31:42", "remaining_time": "2 days, 2:32:52", "throughput": 2725.11, "total_tokens": 1152998112} {"current_steps": 6388, "total_steps": 9134, "loss": 0.6399, "learning_rate": 1.0345745208140056e-05, "epoch": 0.6993075891513177, "percentage": 69.94, "elapsed_time": "4 days, 21:32:49", "remaining_time": "2 days, 2:31:47", "throughput": 2725.13, "total_tokens": 1153192320} {"current_steps": 6389, "total_steps": 9134, "loss": 0.8757, "learning_rate": 1.03387795749083e-05, "epoch": 0.6994170612222557, "percentage": 69.95, "elapsed_time": "4 days, 21:33:57", "remaining_time": "2 days, 2:30:41", "throughput": 2725.15, "total_tokens": 1153385856} {"current_steps": 6390, "total_steps": 9134, "loss": 0.9226, "learning_rate": 1.0331815676070888e-05, "epoch": 0.6995265332931936, "percentage": 69.96, "elapsed_time": "4 days, 21:35:01", "remaining_time": "2 days, 2:29:34", "throughput": 2725.11, "total_tokens": 1153544672} {"current_steps": 6391, "total_steps": 9134, "loss": 0.9723, "learning_rate": 1.0324853512451643e-05, "epoch": 0.6996360053641315, "percentage": 69.97, "elapsed_time": "4 days, 21:36:07", "remaining_time": "2 days, 2:28:28", "throughput": 2725.14, "total_tokens": 1153737088} {"current_steps": 6392, "total_steps": 9134, "loss": 1.0053, "learning_rate": 1.0317893084874167e-05, "epoch": 0.6997454774350694, "percentage": 69.98, "elapsed_time": "4 days, 21:37:16", "remaining_time": "2 days, 2:27:23", "throughput": 2725.18, "total_tokens": 1153938688} {"current_steps": 6393, "total_steps": 9134, "loss": 0.7724, "learning_rate": 1.0310934394161875e-05, "epoch": 0.6998549495060072, "percentage": 69.99, "elapsed_time": "4 days, 21:38:24", "remaining_time": "2 days, 2:26:17", "throughput": 2725.24, "total_tokens": 1154154400} {"current_steps": 6394, "total_steps": 9134, "loss": 0.7241, "learning_rate": 1.0303977441137968e-05, "epoch": 0.6999644215769452, "percentage": 70.0, "elapsed_time": "4 days, 21:39:27", "remaining_time": "2 days, 2:25:10", "throughput": 2725.21, "total_tokens": 1154311648} {"current_steps": 6395, "total_steps": 9134, "loss": 0.7457, "learning_rate": 1.0297022226625434e-05, "epoch": 0.7000738936478831, "percentage": 70.01, "elapsed_time": "4 days, 21:40:33", "remaining_time": "2 days, 2:24:03", "throughput": 2725.19, "total_tokens": 1154482560} {"current_steps": 6396, "total_steps": 9134, "loss": 0.8359, "learning_rate": 1.0290068751447062e-05, "epoch": 0.700183365718821, "percentage": 70.02, "elapsed_time": "4 days, 21:41:35", "remaining_time": "2 days, 2:22:55", "throughput": 2725.16, "total_tokens": 1154640032} {"current_steps": 6397, "total_steps": 9134, "loss": 0.6436, "learning_rate": 1.0283117016425439e-05, "epoch": 0.7002928377897589, "percentage": 70.04, "elapsed_time": "4 days, 21:42:41", "remaining_time": "2 days, 2:21:49", "throughput": 2725.2, "total_tokens": 1154833120} {"current_steps": 6398, "total_steps": 9134, "loss": 0.7168, "learning_rate": 1.0276167022382937e-05, "epoch": 0.7004023098606967, "percentage": 70.05, "elapsed_time": "4 days, 21:43:49", "remaining_time": "2 days, 2:20:43", "throughput": 2725.21, "total_tokens": 1155027104} {"current_steps": 6399, "total_steps": 9134, "loss": 0.628, "learning_rate": 1.0269218770141728e-05, "epoch": 0.7005117819316347, "percentage": 70.06, "elapsed_time": "4 days, 21:44:58", "remaining_time": "2 days, 2:19:38", "throughput": 2725.23, "total_tokens": 1155222208} {"current_steps": 6400, "total_steps": 9134, "loss": 0.777, "learning_rate": 1.0262272260523772e-05, "epoch": 0.7006212540025726, "percentage": 70.07, "elapsed_time": "4 days, 21:46:06", "remaining_time": "2 days, 2:18:33", "throughput": 2725.27, "total_tokens": 1155424032} {"current_steps": 6401, "total_steps": 9134, "loss": 0.7518, "learning_rate": 1.0255327494350841e-05, "epoch": 0.7007307260735105, "percentage": 70.08, "elapsed_time": "4 days, 21:47:11", "remaining_time": "2 days, 2:17:26", "throughput": 2725.26, "total_tokens": 1155594496} {"current_steps": 6402, "total_steps": 9134, "loss": 0.6944, "learning_rate": 1.0248384472444481e-05, "epoch": 0.7008401981444484, "percentage": 70.09, "elapsed_time": "4 days, 21:48:15", "remaining_time": "2 days, 2:16:19", "throughput": 2725.18, "total_tokens": 1155737856} {"current_steps": 6403, "total_steps": 9134, "loss": 0.8583, "learning_rate": 1.0241443195626038e-05, "epoch": 0.7009496702153863, "percentage": 70.1, "elapsed_time": "4 days, 21:49:23", "remaining_time": "2 days, 2:15:13", "throughput": 2725.2, "total_tokens": 1155930048} {"current_steps": 6404, "total_steps": 9134, "loss": 0.7252, "learning_rate": 1.0234503664716649e-05, "epoch": 0.7010591422863242, "percentage": 70.11, "elapsed_time": "4 days, 21:50:25", "remaining_time": "2 days, 2:14:05", "throughput": 2725.13, "total_tokens": 1156068704} {"current_steps": 6405, "total_steps": 9134, "loss": 0.9761, "learning_rate": 1.0227565880537252e-05, "epoch": 0.7011686143572621, "percentage": 70.12, "elapsed_time": "4 days, 21:51:32", "remaining_time": "2 days, 2:12:59", "throughput": 2725.15, "total_tokens": 1156262016} {"current_steps": 6406, "total_steps": 9134, "loss": 0.704, "learning_rate": 1.0220629843908572e-05, "epoch": 0.7012780864282, "percentage": 70.13, "elapsed_time": "4 days, 21:52:35", "remaining_time": "2 days, 2:11:51", "throughput": 2725.13, "total_tokens": 1156424640} {"current_steps": 6407, "total_steps": 9134, "loss": 0.9158, "learning_rate": 1.0213695555651118e-05, "epoch": 0.7013875584991379, "percentage": 70.14, "elapsed_time": "4 days, 21:53:43", "remaining_time": "2 days, 2:10:46", "throughput": 2725.17, "total_tokens": 1156626464} {"current_steps": 6408, "total_steps": 9134, "loss": 0.7378, "learning_rate": 1.020676301658523e-05, "epoch": 0.7014970305700758, "percentage": 70.16, "elapsed_time": "4 days, 21:54:48", "remaining_time": "2 days, 2:09:39", "throughput": 2725.16, "total_tokens": 1156800960} {"current_steps": 6409, "total_steps": 9134, "loss": 0.9443, "learning_rate": 1.0199832227530979e-05, "epoch": 0.7016065026410138, "percentage": 70.17, "elapsed_time": "4 days, 21:55:54", "remaining_time": "2 days, 2:08:33", "throughput": 2725.13, "total_tokens": 1156966048} {"current_steps": 6410, "total_steps": 9134, "loss": 0.9808, "learning_rate": 1.0192903189308293e-05, "epoch": 0.7017159747119516, "percentage": 70.18, "elapsed_time": "4 days, 21:57:03", "remaining_time": "2 days, 2:07:28", "throughput": 2725.22, "total_tokens": 1157192288} {"current_steps": 6411, "total_steps": 9134, "loss": 0.9313, "learning_rate": 1.0185975902736853e-05, "epoch": 0.7018254467828895, "percentage": 70.19, "elapsed_time": "4 days, 21:58:12", "remaining_time": "2 days, 2:06:23", "throughput": 2725.25, "total_tokens": 1157391200} {"current_steps": 6412, "total_steps": 9134, "loss": 0.604, "learning_rate": 1.0179050368636146e-05, "epoch": 0.7019349188538274, "percentage": 70.2, "elapsed_time": "4 days, 21:59:17", "remaining_time": "2 days, 2:05:16", "throughput": 2725.25, "total_tokens": 1157568608} {"current_steps": 6413, "total_steps": 9134, "loss": 0.8807, "learning_rate": 1.0172126587825442e-05, "epoch": 0.7020443909247653, "percentage": 70.21, "elapsed_time": "4 days, 22:00:24", "remaining_time": "2 days, 2:04:10", "throughput": 2725.25, "total_tokens": 1157750944} {"current_steps": 6414, "total_steps": 9134, "loss": 0.6767, "learning_rate": 1.0165204561123811e-05, "epoch": 0.7021538629957033, "percentage": 70.22, "elapsed_time": "4 days, 22:01:32", "remaining_time": "2 days, 2:03:05", "throughput": 2725.34, "total_tokens": 1157974944} {"current_steps": 6415, "total_steps": 9134, "loss": 1.1053, "learning_rate": 1.015828428935014e-05, "epoch": 0.7022633350666411, "percentage": 70.23, "elapsed_time": "4 days, 22:02:39", "remaining_time": "2 days, 2:01:59", "throughput": 2725.37, "total_tokens": 1158170272} {"current_steps": 6416, "total_steps": 9134, "loss": 1.0652, "learning_rate": 1.0151365773323046e-05, "epoch": 0.702372807137579, "percentage": 70.24, "elapsed_time": "4 days, 22:03:46", "remaining_time": "2 days, 2:00:53", "throughput": 2725.38, "total_tokens": 1158357760} {"current_steps": 6417, "total_steps": 9134, "loss": 0.7868, "learning_rate": 1.0144449013861013e-05, "epoch": 0.7024822792085169, "percentage": 70.25, "elapsed_time": "4 days, 22:04:54", "remaining_time": "2 days, 1:59:47", "throughput": 2725.37, "total_tokens": 1158538528} {"current_steps": 6418, "total_steps": 9134, "loss": 0.7195, "learning_rate": 1.0137534011782246e-05, "epoch": 0.7025917512794548, "percentage": 70.26, "elapsed_time": "4 days, 22:06:00", "remaining_time": "2 days, 1:58:41", "throughput": 2725.37, "total_tokens": 1158718848} {"current_steps": 6419, "total_steps": 9134, "loss": 0.9056, "learning_rate": 1.013062076790481e-05, "epoch": 0.7027012233503928, "percentage": 70.28, "elapsed_time": "4 days, 22:07:09", "remaining_time": "2 days, 1:57:36", "throughput": 2725.39, "total_tokens": 1158915968} {"current_steps": 6420, "total_steps": 9134, "loss": 0.819, "learning_rate": 1.0123709283046495e-05, "epoch": 0.7028106954213307, "percentage": 70.29, "elapsed_time": "4 days, 22:08:13", "remaining_time": "2 days, 1:56:29", "throughput": 2725.4, "total_tokens": 1159096288} {"current_steps": 6421, "total_steps": 9134, "loss": 0.7292, "learning_rate": 1.011679955802494e-05, "epoch": 0.7029201674922685, "percentage": 70.3, "elapsed_time": "4 days, 22:09:19", "remaining_time": "2 days, 1:55:22", "throughput": 2725.42, "total_tokens": 1159284000} {"current_steps": 6422, "total_steps": 9134, "loss": 0.7629, "learning_rate": 1.0109891593657547e-05, "epoch": 0.7030296395632064, "percentage": 70.31, "elapsed_time": "4 days, 22:10:27", "remaining_time": "2 days, 1:54:17", "throughput": 2725.43, "total_tokens": 1159471488} {"current_steps": 6423, "total_steps": 9134, "loss": 1.0206, "learning_rate": 1.0102985390761505e-05, "epoch": 0.7031391116341443, "percentage": 70.32, "elapsed_time": "4 days, 22:11:29", "remaining_time": "2 days, 1:53:09", "throughput": 2725.38, "total_tokens": 1159622688} {"current_steps": 6424, "total_steps": 9134, "loss": 0.5952, "learning_rate": 1.009608095015383e-05, "epoch": 0.7032485837050823, "percentage": 70.33, "elapsed_time": "4 days, 22:12:36", "remaining_time": "2 days, 1:52:03", "throughput": 2725.42, "total_tokens": 1159820032} {"current_steps": 6425, "total_steps": 9134, "loss": 0.9418, "learning_rate": 1.0089178272651267e-05, "epoch": 0.7033580557760202, "percentage": 70.34, "elapsed_time": "4 days, 22:13:44", "remaining_time": "2 days, 1:50:58", "throughput": 2725.46, "total_tokens": 1160023872} {"current_steps": 6426, "total_steps": 9134, "loss": 0.7461, "learning_rate": 1.008227735907043e-05, "epoch": 0.7034675278469581, "percentage": 70.35, "elapsed_time": "4 days, 22:14:51", "remaining_time": "2 days, 1:49:51", "throughput": 2725.45, "total_tokens": 1160201056} {"current_steps": 6427, "total_steps": 9134, "loss": 0.7075, "learning_rate": 1.0075378210227645e-05, "epoch": 0.7035769999178959, "percentage": 70.36, "elapsed_time": "4 days, 22:15:55", "remaining_time": "2 days, 1:48:44", "throughput": 2725.46, "total_tokens": 1160381600} {"current_steps": 6428, "total_steps": 9134, "loss": 0.689, "learning_rate": 1.0068480826939097e-05, "epoch": 0.7036864719888338, "percentage": 70.37, "elapsed_time": "4 days, 22:16:59", "remaining_time": "2 days, 1:47:37", "throughput": 2725.48, "total_tokens": 1160564160} {"current_steps": 6429, "total_steps": 9134, "loss": 0.751, "learning_rate": 1.006158521002072e-05, "epoch": 0.7037959440597717, "percentage": 70.39, "elapsed_time": "4 days, 22:18:05", "remaining_time": "2 days, 1:46:31", "throughput": 2725.52, "total_tokens": 1160759712} {"current_steps": 6430, "total_steps": 9134, "loss": 0.7435, "learning_rate": 1.005469136028826e-05, "epoch": 0.7039054161307097, "percentage": 70.4, "elapsed_time": "4 days, 22:19:09", "remaining_time": "2 days, 1:45:24", "throughput": 2725.5, "total_tokens": 1160925920} {"current_steps": 6431, "total_steps": 9134, "loss": 0.864, "learning_rate": 1.0047799278557238e-05, "epoch": 0.7040148882016476, "percentage": 70.41, "elapsed_time": "4 days, 22:20:17", "remaining_time": "2 days, 1:44:18", "throughput": 2725.53, "total_tokens": 1161122592} {"current_steps": 6432, "total_steps": 9134, "loss": 0.9053, "learning_rate": 1.0040908965642979e-05, "epoch": 0.7041243602725854, "percentage": 70.42, "elapsed_time": "4 days, 22:21:26", "remaining_time": "2 days, 1:43:13", "throughput": 2725.52, "total_tokens": 1161308288} {"current_steps": 6433, "total_steps": 9134, "loss": 0.7465, "learning_rate": 1.0034020422360591e-05, "epoch": 0.7042338323435233, "percentage": 70.43, "elapsed_time": "4 days, 22:22:28", "remaining_time": "2 days, 1:42:05", "throughput": 2725.54, "total_tokens": 1161485024} {"current_steps": 6434, "total_steps": 9134, "loss": 1.0233, "learning_rate": 1.002713364952497e-05, "epoch": 0.7043433044144612, "percentage": 70.44, "elapsed_time": "4 days, 22:23:35", "remaining_time": "2 days, 1:40:59", "throughput": 2725.5, "total_tokens": 1161649888} {"current_steps": 6435, "total_steps": 9134, "loss": 0.7132, "learning_rate": 1.0020248647950822e-05, "epoch": 0.7044527764853992, "percentage": 70.45, "elapsed_time": "4 days, 22:24:38", "remaining_time": "2 days, 1:39:51", "throughput": 2725.51, "total_tokens": 1161826176} {"current_steps": 6436, "total_steps": 9134, "loss": 0.7798, "learning_rate": 1.0013365418452625e-05, "epoch": 0.7045622485563371, "percentage": 70.46, "elapsed_time": "4 days, 22:25:47", "remaining_time": "2 days, 1:38:46", "throughput": 2725.55, "total_tokens": 1162030464} {"current_steps": 6437, "total_steps": 9134, "loss": 0.8542, "learning_rate": 1.0006483961844645e-05, "epoch": 0.704671720627275, "percentage": 70.47, "elapsed_time": "4 days, 22:26:50", "remaining_time": "2 days, 1:37:39", "throughput": 2725.54, "total_tokens": 1162197568} {"current_steps": 6438, "total_steps": 9134, "loss": 0.6759, "learning_rate": 9.999604278940956e-06, "epoch": 0.7047811926982128, "percentage": 70.48, "elapsed_time": "4 days, 22:27:54", "remaining_time": "2 days, 1:36:31", "throughput": 2725.54, "total_tokens": 1162371392} {"current_steps": 6439, "total_steps": 9134, "loss": 0.8491, "learning_rate": 9.9927263705554e-06, "epoch": 0.7048906647691507, "percentage": 70.49, "elapsed_time": "4 days, 22:28:59", "remaining_time": "2 days, 1:35:25", "throughput": 2725.54, "total_tokens": 1162552384} {"current_steps": 6440, "total_steps": 9134, "loss": 0.8174, "learning_rate": 9.985850237501618e-06, "epoch": 0.7050001368400887, "percentage": 70.51, "elapsed_time": "4 days, 22:30:06", "remaining_time": "2 days, 1:34:19", "throughput": 2725.56, "total_tokens": 1162740768} {"current_steps": 6441, "total_steps": 9134, "loss": 0.9848, "learning_rate": 9.978975880593067e-06, "epoch": 0.7051096089110266, "percentage": 70.52, "elapsed_time": "4 days, 22:31:14", "remaining_time": "2 days, 1:33:13", "throughput": 2725.53, "total_tokens": 1162915040} {"current_steps": 6442, "total_steps": 9134, "loss": 0.6803, "learning_rate": 9.972103300642937e-06, "epoch": 0.7052190809819645, "percentage": 70.53, "elapsed_time": "4 days, 22:32:14", "remaining_time": "2 days, 1:32:04", "throughput": 2725.51, "total_tokens": 1163070496} {"current_steps": 6443, "total_steps": 9134, "loss": 0.8383, "learning_rate": 9.965232498464266e-06, "epoch": 0.7053285530529024, "percentage": 70.54, "elapsed_time": "4 days, 22:33:21", "remaining_time": "2 days, 1:30:59", "throughput": 2725.5, "total_tokens": 1163247904} {"current_steps": 6444, "total_steps": 9134, "loss": 0.7422, "learning_rate": 9.958363474869853e-06, "epoch": 0.7054380251238402, "percentage": 70.55, "elapsed_time": "4 days, 22:34:26", "remaining_time": "2 days, 1:29:52", "throughput": 2725.52, "total_tokens": 1163432480} {"current_steps": 6445, "total_steps": 9134, "loss": 0.932, "learning_rate": 9.951496230672283e-06, "epoch": 0.7055474971947782, "percentage": 70.56, "elapsed_time": "4 days, 22:35:35", "remaining_time": "2 days, 1:28:46", "throughput": 2725.58, "total_tokens": 1163645728} {"current_steps": 6446, "total_steps": 9134, "loss": 0.8108, "learning_rate": 9.94463076668394e-06, "epoch": 0.7056569692657161, "percentage": 70.57, "elapsed_time": "4 days, 22:36:42", "remaining_time": "2 days, 1:27:41", "throughput": 2725.62, "total_tokens": 1163845536} {"current_steps": 6447, "total_steps": 9134, "loss": 0.7338, "learning_rate": 9.937767083716989e-06, "epoch": 0.705766441336654, "percentage": 70.58, "elapsed_time": "4 days, 22:37:43", "remaining_time": "2 days, 1:26:32", "throughput": 2725.58, "total_tokens": 1163994496} {"current_steps": 6448, "total_steps": 9134, "loss": 0.7519, "learning_rate": 9.930905182583417e-06, "epoch": 0.7058759134075919, "percentage": 70.59, "elapsed_time": "4 days, 22:38:48", "remaining_time": "2 days, 1:25:25", "throughput": 2725.56, "total_tokens": 1164164288} {"current_steps": 6449, "total_steps": 9134, "loss": 0.6995, "learning_rate": 9.924045064094934e-06, "epoch": 0.7059853854785297, "percentage": 70.6, "elapsed_time": "4 days, 22:39:50", "remaining_time": "2 days, 1:24:17", "throughput": 2725.52, "total_tokens": 1164315712} {"current_steps": 6450, "total_steps": 9134, "loss": 0.9028, "learning_rate": 9.917186729063118e-06, "epoch": 0.7060948575494677, "percentage": 70.62, "elapsed_time": "4 days, 22:40:58", "remaining_time": "2 days, 1:23:12", "throughput": 2725.53, "total_tokens": 1164506336} {"current_steps": 6451, "total_steps": 9134, "loss": 0.6168, "learning_rate": 9.910330178299262e-06, "epoch": 0.7062043296204056, "percentage": 70.63, "elapsed_time": "4 days, 22:42:00", "remaining_time": "2 days, 1:22:04", "throughput": 2725.48, "total_tokens": 1164650816} {"current_steps": 6452, "total_steps": 9134, "loss": 0.9615, "learning_rate": 9.903475412614507e-06, "epoch": 0.7063138016913435, "percentage": 70.64, "elapsed_time": "4 days, 22:43:08", "remaining_time": "2 days, 1:20:59", "throughput": 2725.54, "total_tokens": 1164866304} {"current_steps": 6453, "total_steps": 9134, "loss": 0.8257, "learning_rate": 9.896622432819753e-06, "epoch": 0.7064232737622814, "percentage": 70.65, "elapsed_time": "4 days, 22:44:17", "remaining_time": "2 days, 1:19:53", "throughput": 2725.55, "total_tokens": 1165058272} {"current_steps": 6454, "total_steps": 9134, "loss": 0.6831, "learning_rate": 9.889771239725693e-06, "epoch": 0.7065327458332193, "percentage": 70.66, "elapsed_time": "4 days, 22:45:23", "remaining_time": "2 days, 1:18:47", "throughput": 2725.56, "total_tokens": 1165240384} {"current_steps": 6455, "total_steps": 9134, "loss": 0.7427, "learning_rate": 9.882921834142806e-06, "epoch": 0.7066422179041572, "percentage": 70.67, "elapsed_time": "4 days, 22:46:28", "remaining_time": "2 days, 1:17:40", "throughput": 2725.56, "total_tokens": 1165418016} {"current_steps": 6456, "total_steps": 9134, "loss": 0.8651, "learning_rate": 9.876074216881359e-06, "epoch": 0.7067516899750951, "percentage": 70.68, "elapsed_time": "4 days, 22:47:33", "remaining_time": "2 days, 1:16:34", "throughput": 2725.56, "total_tokens": 1165595424} {"current_steps": 6457, "total_steps": 9134, "loss": 0.7917, "learning_rate": 9.86922838875144e-06, "epoch": 0.706861162046033, "percentage": 70.69, "elapsed_time": "4 days, 22:48:37", "remaining_time": "2 days, 1:15:26", "throughput": 2725.59, "total_tokens": 1165781568} {"current_steps": 6458, "total_steps": 9134, "loss": 0.9143, "learning_rate": 9.86238435056286e-06, "epoch": 0.7069706341169709, "percentage": 70.7, "elapsed_time": "4 days, 22:49:45", "remaining_time": "2 days, 1:14:21", "throughput": 2725.6, "total_tokens": 1165971744} {"current_steps": 6459, "total_steps": 9134, "loss": 0.6487, "learning_rate": 9.855542103125286e-06, "epoch": 0.7070801061879088, "percentage": 70.71, "elapsed_time": "4 days, 22:50:51", "remaining_time": "2 days, 1:13:15", "throughput": 2725.62, "total_tokens": 1166159904} {"current_steps": 6460, "total_steps": 9134, "loss": 0.8435, "learning_rate": 9.848701647248118e-06, "epoch": 0.7071895782588468, "percentage": 70.72, "elapsed_time": "4 days, 22:51:54", "remaining_time": "2 days, 1:12:07", "throughput": 2725.63, "total_tokens": 1166335520} {"current_steps": 6461, "total_steps": 9134, "loss": 0.8041, "learning_rate": 9.841862983740584e-06, "epoch": 0.7072990503297846, "percentage": 70.74, "elapsed_time": "4 days, 22:53:02", "remaining_time": "2 days, 1:11:01", "throughput": 2725.66, "total_tokens": 1166534208} {"current_steps": 6462, "total_steps": 9134, "loss": 0.7024, "learning_rate": 9.835026113411685e-06, "epoch": 0.7074085224007225, "percentage": 70.75, "elapsed_time": "4 days, 22:54:07", "remaining_time": "2 days, 1:09:55", "throughput": 2725.7, "total_tokens": 1166728416} {"current_steps": 6463, "total_steps": 9134, "loss": 0.9265, "learning_rate": 9.828191037070208e-06, "epoch": 0.7075179944716604, "percentage": 70.76, "elapsed_time": "4 days, 22:55:11", "remaining_time": "2 days, 1:08:47", "throughput": 2725.63, "total_tokens": 1166874016} {"current_steps": 6464, "total_steps": 9134, "loss": 0.8755, "learning_rate": 9.821357755524727e-06, "epoch": 0.7076274665425983, "percentage": 70.77, "elapsed_time": "4 days, 22:56:16", "remaining_time": "2 days, 1:07:41", "throughput": 2725.61, "total_tokens": 1167041568} {"current_steps": 6465, "total_steps": 9134, "loss": 0.5768, "learning_rate": 9.814526269583596e-06, "epoch": 0.7077369386135363, "percentage": 70.78, "elapsed_time": "4 days, 22:57:23", "remaining_time": "2 days, 1:06:35", "throughput": 2725.63, "total_tokens": 1167231296} {"current_steps": 6466, "total_steps": 9134, "loss": 0.7677, "learning_rate": 9.807696580054994e-06, "epoch": 0.7078464106844741, "percentage": 70.79, "elapsed_time": "4 days, 22:58:31", "remaining_time": "2 days, 1:05:29", "throughput": 2725.64, "total_tokens": 1167423936} {"current_steps": 6467, "total_steps": 9134, "loss": 1.0006, "learning_rate": 9.800868687746832e-06, "epoch": 0.707955882755412, "percentage": 70.8, "elapsed_time": "4 days, 22:59:37", "remaining_time": "2 days, 1:04:23", "throughput": 2725.68, "total_tokens": 1167621728} {"current_steps": 6468, "total_steps": 9134, "loss": 0.7862, "learning_rate": 9.794042593466851e-06, "epoch": 0.7080653548263499, "percentage": 70.81, "elapsed_time": "4 days, 23:00:43", "remaining_time": "2 days, 1:03:17", "throughput": 2725.63, "total_tokens": 1167780768} {"current_steps": 6469, "total_steps": 9134, "loss": 0.791, "learning_rate": 9.787218298022565e-06, "epoch": 0.7081748268972878, "percentage": 70.82, "elapsed_time": "4 days, 23:01:46", "remaining_time": "2 days, 1:02:09", "throughput": 2725.6, "total_tokens": 1167939584} {"current_steps": 6470, "total_steps": 9134, "loss": 1.1715, "learning_rate": 9.780395802221274e-06, "epoch": 0.7082842989682258, "percentage": 70.83, "elapsed_time": "4 days, 23:02:54", "remaining_time": "2 days, 1:01:04", "throughput": 2725.63, "total_tokens": 1168136256} {"current_steps": 6471, "total_steps": 9134, "loss": 0.6974, "learning_rate": 9.773575106870061e-06, "epoch": 0.7083937710391637, "percentage": 70.85, "elapsed_time": "4 days, 23:04:00", "remaining_time": "2 days, 0:59:57", "throughput": 2725.58, "total_tokens": 1168294624} {"current_steps": 6472, "total_steps": 9134, "loss": 0.9761, "learning_rate": 9.766756212775807e-06, "epoch": 0.7085032431101015, "percentage": 70.86, "elapsed_time": "4 days, 23:05:06", "remaining_time": "2 days, 0:58:51", "throughput": 2725.58, "total_tokens": 1168475616} {"current_steps": 6473, "total_steps": 9134, "loss": 0.7774, "learning_rate": 9.759939120745171e-06, "epoch": 0.7086127151810394, "percentage": 70.87, "elapsed_time": "4 days, 23:06:14", "remaining_time": "2 days, 0:57:46", "throughput": 2725.62, "total_tokens": 1168679232} {"current_steps": 6474, "total_steps": 9134, "loss": 0.9091, "learning_rate": 9.753123831584604e-06, "epoch": 0.7087221872519773, "percentage": 70.88, "elapsed_time": "4 days, 23:07:22", "remaining_time": "2 days, 0:56:40", "throughput": 2725.67, "total_tokens": 1168881952} {"current_steps": 6475, "total_steps": 9134, "loss": 0.7007, "learning_rate": 9.746310346100331e-06, "epoch": 0.7088316593229153, "percentage": 70.89, "elapsed_time": "4 days, 23:08:29", "remaining_time": "2 days, 0:55:34", "throughput": 2725.71, "total_tokens": 1169085792} {"current_steps": 6476, "total_steps": 9134, "loss": 0.6447, "learning_rate": 9.739498665098395e-06, "epoch": 0.7089411313938532, "percentage": 70.9, "elapsed_time": "4 days, 23:09:35", "remaining_time": "2 days, 0:54:27", "throughput": 2725.73, "total_tokens": 1169272160} {"current_steps": 6477, "total_steps": 9134, "loss": 0.753, "learning_rate": 9.732688789384593e-06, "epoch": 0.7090506034647911, "percentage": 70.91, "elapsed_time": "4 days, 23:10:43", "remaining_time": "2 days, 0:53:22", "throughput": 2725.75, "total_tokens": 1169463680} {"current_steps": 6478, "total_steps": 9134, "loss": 0.7734, "learning_rate": 9.725880719764519e-06, "epoch": 0.7091600755357289, "percentage": 70.92, "elapsed_time": "4 days, 23:11:50", "remaining_time": "2 days, 0:52:16", "throughput": 2725.77, "total_tokens": 1169657888} {"current_steps": 6479, "total_steps": 9134, "loss": 0.9554, "learning_rate": 9.71907445704356e-06, "epoch": 0.7092695476066668, "percentage": 70.93, "elapsed_time": "4 days, 23:12:58", "remaining_time": "2 days, 0:51:11", "throughput": 2725.78, "total_tokens": 1169844032} {"current_steps": 6480, "total_steps": 9134, "loss": 0.9312, "learning_rate": 9.712270002026877e-06, "epoch": 0.7093790196776047, "percentage": 70.94, "elapsed_time": "4 days, 23:14:03", "remaining_time": "2 days, 0:50:04", "throughput": 2725.77, "total_tokens": 1170018304} {"current_steps": 6481, "total_steps": 9134, "loss": 0.8453, "learning_rate": 9.705467355519428e-06, "epoch": 0.7094884917485427, "percentage": 70.95, "elapsed_time": "4 days, 23:15:10", "remaining_time": "2 days, 0:48:58", "throughput": 2725.75, "total_tokens": 1170192352} {"current_steps": 6482, "total_steps": 9134, "loss": 0.9522, "learning_rate": 9.698666518325943e-06, "epoch": 0.7095979638194806, "percentage": 70.97, "elapsed_time": "4 days, 23:16:14", "remaining_time": "2 days, 0:47:51", "throughput": 2725.69, "total_tokens": 1170342208} {"current_steps": 6483, "total_steps": 9134, "loss": 0.7133, "learning_rate": 9.69186749125098e-06, "epoch": 0.7097074358904184, "percentage": 70.98, "elapsed_time": "4 days, 23:17:21", "remaining_time": "2 days, 0:46:45", "throughput": 2725.68, "total_tokens": 1170519392} {"current_steps": 6484, "total_steps": 9134, "loss": 0.7641, "learning_rate": 9.685070275098806e-06, "epoch": 0.7098169079613563, "percentage": 70.99, "elapsed_time": "4 days, 23:18:27", "remaining_time": "2 days, 0:45:39", "throughput": 2725.69, "total_tokens": 1170706432} {"current_steps": 6485, "total_steps": 9134, "loss": 0.8149, "learning_rate": 9.678274870673555e-06, "epoch": 0.7099263800322942, "percentage": 71.0, "elapsed_time": "4 days, 23:19:30", "remaining_time": "2 days, 0:44:31", "throughput": 2725.7, "total_tokens": 1170879808} {"current_steps": 6486, "total_steps": 9134, "loss": 0.6595, "learning_rate": 9.671481278779094e-06, "epoch": 0.7100358521032322, "percentage": 71.01, "elapsed_time": "4 days, 23:20:38", "remaining_time": "2 days, 0:43:25", "throughput": 2725.68, "total_tokens": 1171057664} {"current_steps": 6487, "total_steps": 9134, "loss": 0.8191, "learning_rate": 9.664689500219092e-06, "epoch": 0.7101453241741701, "percentage": 71.02, "elapsed_time": "4 days, 23:21:44", "remaining_time": "2 days, 0:42:19", "throughput": 2725.72, "total_tokens": 1171255904} {"current_steps": 6488, "total_steps": 9134, "loss": 0.5721, "learning_rate": 9.65789953579701e-06, "epoch": 0.710254796245108, "percentage": 71.03, "elapsed_time": "4 days, 23:22:52", "remaining_time": "2 days, 0:41:14", "throughput": 2725.71, "total_tokens": 1171434432} {"current_steps": 6489, "total_steps": 9134, "loss": 0.6667, "learning_rate": 9.651111386316072e-06, "epoch": 0.7103642683160458, "percentage": 71.04, "elapsed_time": "4 days, 23:23:57", "remaining_time": "2 days, 0:40:07", "throughput": 2725.69, "total_tokens": 1171603552} {"current_steps": 6490, "total_steps": 9134, "loss": 0.7402, "learning_rate": 9.644325052579333e-06, "epoch": 0.7104737403869837, "percentage": 71.05, "elapsed_time": "4 days, 23:25:03", "remaining_time": "2 days, 0:39:00", "throughput": 2725.74, "total_tokens": 1171805600} {"current_steps": 6491, "total_steps": 9134, "loss": 0.696, "learning_rate": 9.63754053538957e-06, "epoch": 0.7105832124579217, "percentage": 71.06, "elapsed_time": "4 days, 23:26:03", "remaining_time": "2 days, 0:37:52", "throughput": 2725.66, "total_tokens": 1171934400} {"current_steps": 6492, "total_steps": 9134, "loss": 0.791, "learning_rate": 9.630757835549412e-06, "epoch": 0.7106926845288596, "percentage": 71.08, "elapsed_time": "4 days, 23:27:08", "remaining_time": "2 days, 0:36:45", "throughput": 2725.65, "total_tokens": 1172109568} {"current_steps": 6493, "total_steps": 9134, "loss": 0.6513, "learning_rate": 9.623976953861199e-06, "epoch": 0.7108021565997975, "percentage": 71.09, "elapsed_time": "4 days, 23:28:15", "remaining_time": "2 days, 0:35:39", "throughput": 2725.65, "total_tokens": 1172289440} {"current_steps": 6494, "total_steps": 9134, "loss": 0.8444, "learning_rate": 9.617197891127131e-06, "epoch": 0.7109116286707354, "percentage": 71.1, "elapsed_time": "4 days, 23:29:21", "remaining_time": "2 days, 0:34:33", "throughput": 2725.68, "total_tokens": 1172480960} {"current_steps": 6495, "total_steps": 9134, "loss": 0.556, "learning_rate": 9.610420648149144e-06, "epoch": 0.7110211007416732, "percentage": 71.11, "elapsed_time": "4 days, 23:30:26", "remaining_time": "2 days, 0:33:26", "throughput": 2725.67, "total_tokens": 1172656352} {"current_steps": 6496, "total_steps": 9134, "loss": 1.0299, "learning_rate": 9.603645225728975e-06, "epoch": 0.7111305728126112, "percentage": 71.12, "elapsed_time": "4 days, 23:31:32", "remaining_time": "2 days, 0:32:20", "throughput": 2725.71, "total_tokens": 1172854368} {"current_steps": 6497, "total_steps": 9134, "loss": 0.9438, "learning_rate": 9.59687162466814e-06, "epoch": 0.7112400448835491, "percentage": 71.13, "elapsed_time": "4 days, 23:32:41", "remaining_time": "2 days, 0:31:14", "throughput": 2725.75, "total_tokens": 1173058880} {"current_steps": 6498, "total_steps": 9134, "loss": 0.7718, "learning_rate": 9.590099845767941e-06, "epoch": 0.711349516954487, "percentage": 71.14, "elapsed_time": "4 days, 23:33:45", "remaining_time": "2 days, 0:30:07", "throughput": 2725.67, "total_tokens": 1173198432} {"current_steps": 6499, "total_steps": 9134, "loss": 0.6266, "learning_rate": 9.583329889829486e-06, "epoch": 0.7114589890254249, "percentage": 71.15, "elapsed_time": "4 days, 23:34:52", "remaining_time": "2 days, 0:29:01", "throughput": 2725.67, "total_tokens": 1173377184} {"current_steps": 6500, "total_steps": 9134, "loss": 0.9927, "learning_rate": 9.576561757653618e-06, "epoch": 0.7115684610963627, "percentage": 71.16, "elapsed_time": "4 days, 23:35:56", "remaining_time": "2 days, 0:27:54", "throughput": 2725.64, "total_tokens": 1173543616} {"current_steps": 6501, "total_steps": 9134, "loss": 0.8954, "learning_rate": 9.569795450041028e-06, "epoch": 0.7116779331673007, "percentage": 71.17, "elapsed_time": "4 days, 23:37:02", "remaining_time": "2 days, 0:26:48", "throughput": 2725.61, "total_tokens": 1173708256} {"current_steps": 6502, "total_steps": 9134, "loss": 0.8229, "learning_rate": 9.563030967792119e-06, "epoch": 0.7117874052382386, "percentage": 71.18, "elapsed_time": "4 days, 23:38:08", "remaining_time": "2 days, 0:25:42", "throughput": 2725.67, "total_tokens": 1173914560} {"current_steps": 6503, "total_steps": 9134, "loss": 0.8115, "learning_rate": 9.556268311707145e-06, "epoch": 0.7118968773091765, "percentage": 71.2, "elapsed_time": "4 days, 23:39:11", "remaining_time": "2 days, 0:24:34", "throughput": 2725.66, "total_tokens": 1174079872} {"current_steps": 6504, "total_steps": 9134, "loss": 0.6053, "learning_rate": 9.549507482586107e-06, "epoch": 0.7120063493801144, "percentage": 71.21, "elapsed_time": "4 days, 23:40:14", "remaining_time": "2 days, 0:23:26", "throughput": 2725.61, "total_tokens": 1174231744} {"current_steps": 6505, "total_steps": 9134, "loss": 0.7187, "learning_rate": 9.542748481228796e-06, "epoch": 0.7121158214510523, "percentage": 71.22, "elapsed_time": "4 days, 23:41:19", "remaining_time": "2 days, 0:22:20", "throughput": 2725.66, "total_tokens": 1174430656} {"current_steps": 6506, "total_steps": 9134, "loss": 1.0123, "learning_rate": 9.535991308434795e-06, "epoch": 0.7122252935219902, "percentage": 71.23, "elapsed_time": "4 days, 23:42:28", "remaining_time": "2 days, 0:21:14", "throughput": 2725.7, "total_tokens": 1174636288} {"current_steps": 6507, "total_steps": 9134, "loss": 0.8889, "learning_rate": 9.529235965003447e-06, "epoch": 0.7123347655929281, "percentage": 71.24, "elapsed_time": "4 days, 23:43:33", "remaining_time": "2 days, 0:20:08", "throughput": 2725.73, "total_tokens": 1174825568} {"current_steps": 6508, "total_steps": 9134, "loss": 0.8864, "learning_rate": 9.52248245173392e-06, "epoch": 0.712444237663866, "percentage": 71.25, "elapsed_time": "4 days, 23:44:33", "remaining_time": "2 days, 0:18:59", "throughput": 2725.71, "total_tokens": 1174979680} {"current_steps": 6509, "total_steps": 9134, "loss": 0.785, "learning_rate": 9.51573076942513e-06, "epoch": 0.7125537097348039, "percentage": 71.26, "elapsed_time": "4 days, 23:45:38", "remaining_time": "2 days, 0:17:52", "throughput": 2725.69, "total_tokens": 1175151040} {"current_steps": 6510, "total_steps": 9134, "loss": 0.9181, "learning_rate": 9.508980918875787e-06, "epoch": 0.7126631818057418, "percentage": 71.27, "elapsed_time": "4 days, 23:46:45", "remaining_time": "2 days, 0:16:46", "throughput": 2725.71, "total_tokens": 1175339424} {"current_steps": 6511, "total_steps": 9134, "loss": 0.8352, "learning_rate": 9.50223290088439e-06, "epoch": 0.7127726538766798, "percentage": 71.28, "elapsed_time": "4 days, 23:47:50", "remaining_time": "2 days, 0:15:40", "throughput": 2725.71, "total_tokens": 1175518176} {"current_steps": 6512, "total_steps": 9134, "loss": 0.9036, "learning_rate": 9.495486716249213e-06, "epoch": 0.7128821259476176, "percentage": 71.29, "elapsed_time": "4 days, 23:48:56", "remaining_time": "2 days, 0:14:33", "throughput": 2725.69, "total_tokens": 1175688192} {"current_steps": 6513, "total_steps": 9134, "loss": 0.9446, "learning_rate": 9.48874236576832e-06, "epoch": 0.7129915980185555, "percentage": 71.31, "elapsed_time": "4 days, 23:50:01", "remaining_time": "2 days, 0:13:27", "throughput": 2725.68, "total_tokens": 1175863808} {"current_steps": 6514, "total_steps": 9134, "loss": 0.7969, "learning_rate": 9.48199985023955e-06, "epoch": 0.7131010700894934, "percentage": 71.32, "elapsed_time": "4 days, 23:51:10", "remaining_time": "2 days, 0:12:21", "throughput": 2725.75, "total_tokens": 1176081088} {"current_steps": 6515, "total_steps": 9134, "loss": 0.5672, "learning_rate": 9.475259170460527e-06, "epoch": 0.7132105421604313, "percentage": 71.33, "elapsed_time": "4 days, 23:52:18", "remaining_time": "2 days, 0:11:16", "throughput": 2725.78, "total_tokens": 1176278208} {"current_steps": 6516, "total_steps": 9134, "loss": 0.6445, "learning_rate": 9.468520327228681e-06, "epoch": 0.7133200142313693, "percentage": 71.34, "elapsed_time": "4 days, 23:53:21", "remaining_time": "2 days, 0:10:08", "throughput": 2725.77, "total_tokens": 1176446432} {"current_steps": 6517, "total_steps": 9134, "loss": 0.6244, "learning_rate": 9.46178332134117e-06, "epoch": 0.7134294863023071, "percentage": 71.35, "elapsed_time": "4 days, 23:54:26", "remaining_time": "2 days, 0:09:02", "throughput": 2725.71, "total_tokens": 1176598976} {"current_steps": 6518, "total_steps": 9134, "loss": 0.772, "learning_rate": 9.455048153594998e-06, "epoch": 0.713538958373245, "percentage": 71.36, "elapsed_time": "4 days, 23:55:23", "remaining_time": "2 days, 0:07:52", "throughput": 2725.65, "total_tokens": 1176727552} {"current_steps": 6519, "total_steps": 9134, "loss": 0.7132, "learning_rate": 9.448314824786913e-06, "epoch": 0.7136484304441829, "percentage": 71.37, "elapsed_time": "4 days, 23:56:31", "remaining_time": "2 days, 0:06:46", "throughput": 2725.68, "total_tokens": 1176926016} {"current_steps": 6520, "total_steps": 9134, "loss": 0.9246, "learning_rate": 9.441583335713455e-06, "epoch": 0.7137579025151208, "percentage": 71.38, "elapsed_time": "4 days, 23:57:39", "remaining_time": "2 days, 0:05:41", "throughput": 2725.74, "total_tokens": 1177139264} {"current_steps": 6521, "total_steps": 9134, "loss": 0.696, "learning_rate": 9.434853687170947e-06, "epoch": 0.7138673745860588, "percentage": 71.39, "elapsed_time": "4 days, 23:58:45", "remaining_time": "2 days, 0:04:34", "throughput": 2725.76, "total_tokens": 1177325856} {"current_steps": 6522, "total_steps": 9134, "loss": 0.8583, "learning_rate": 9.42812587995548e-06, "epoch": 0.7139768466569967, "percentage": 71.4, "elapsed_time": "4 days, 23:59:54", "remaining_time": "2 days, 0:03:29", "throughput": 2725.79, "total_tokens": 1177524096} {"current_steps": 6523, "total_steps": 9134, "loss": 0.7706, "learning_rate": 9.421399914862975e-06, "epoch": 0.7140863187279345, "percentage": 71.41, "elapsed_time": "5 days, 0:00:57", "remaining_time": "2 days, 0:02:22", "throughput": 2725.79, "total_tokens": 1177697024} {"current_steps": 6524, "total_steps": 9134, "loss": 0.8262, "learning_rate": 9.414675792689056e-06, "epoch": 0.7141957907988724, "percentage": 71.43, "elapsed_time": "5 days, 0:02:01", "remaining_time": "2 days, 0:01:15", "throughput": 2725.79, "total_tokens": 1177872416} {"current_steps": 6525, "total_steps": 9134, "loss": 0.751, "learning_rate": 9.407953514229218e-06, "epoch": 0.7143052628698103, "percentage": 71.44, "elapsed_time": "5 days, 0:03:08", "remaining_time": "2 days, 0:00:08", "throughput": 2725.83, "total_tokens": 1178070656} {"current_steps": 6526, "total_steps": 9134, "loss": 0.8409, "learning_rate": 9.401233080278655e-06, "epoch": 0.7144147349407483, "percentage": 71.45, "elapsed_time": "5 days, 0:04:16", "remaining_time": "1 day, 23:59:03", "throughput": 2725.87, "total_tokens": 1178272256} {"current_steps": 6527, "total_steps": 9134, "loss": 1.0876, "learning_rate": 9.394514491632406e-06, "epoch": 0.7145242070116862, "percentage": 71.46, "elapsed_time": "5 days, 0:05:24", "remaining_time": "1 day, 23:57:58", "throughput": 2725.93, "total_tokens": 1178485280} {"current_steps": 6528, "total_steps": 9134, "loss": 0.7362, "learning_rate": 9.38779774908526e-06, "epoch": 0.7146336790826241, "percentage": 71.47, "elapsed_time": "5 days, 0:06:26", "remaining_time": "1 day, 23:56:50", "throughput": 2725.94, "total_tokens": 1178662240} {"current_steps": 6529, "total_steps": 9134, "loss": 0.7825, "learning_rate": 9.381082853431795e-06, "epoch": 0.7147431511535619, "percentage": 71.48, "elapsed_time": "5 days, 0:07:29", "remaining_time": "1 day, 23:55:42", "throughput": 2725.89, "total_tokens": 1178811200} {"current_steps": 6530, "total_steps": 9134, "loss": 0.847, "learning_rate": 9.374369805466369e-06, "epoch": 0.7148526232244998, "percentage": 71.49, "elapsed_time": "5 days, 0:08:37", "remaining_time": "1 day, 23:54:37", "throughput": 2725.9, "total_tokens": 1179000480} {"current_steps": 6531, "total_steps": 9134, "loss": 1.0344, "learning_rate": 9.367658605983117e-06, "epoch": 0.7149620952954377, "percentage": 71.5, "elapsed_time": "5 days, 0:09:45", "remaining_time": "1 day, 23:53:31", "throughput": 2725.87, "total_tokens": 1179169600} {"current_steps": 6532, "total_steps": 9134, "loss": 0.9918, "learning_rate": 9.360949255775986e-06, "epoch": 0.7150715673663757, "percentage": 71.51, "elapsed_time": "5 days, 0:10:52", "remaining_time": "1 day, 23:52:25", "throughput": 2725.91, "total_tokens": 1179371648} {"current_steps": 6533, "total_steps": 9134, "loss": 0.7314, "learning_rate": 9.354241755638641e-06, "epoch": 0.7151810394373136, "percentage": 71.52, "elapsed_time": "5 days, 0:12:01", "remaining_time": "1 day, 23:51:20", "throughput": 2725.97, "total_tokens": 1179583328} {"current_steps": 6534, "total_steps": 9134, "loss": 0.7905, "learning_rate": 9.347536106364607e-06, "epoch": 0.7152905115082514, "percentage": 71.53, "elapsed_time": "5 days, 0:13:07", "remaining_time": "1 day, 23:50:14", "throughput": 2725.95, "total_tokens": 1179756928} {"current_steps": 6535, "total_steps": 9134, "loss": 0.7886, "learning_rate": 9.34083230874711e-06, "epoch": 0.7153999835791893, "percentage": 71.55, "elapsed_time": "5 days, 0:14:08", "remaining_time": "1 day, 23:49:05", "throughput": 2725.93, "total_tokens": 1179916416} {"current_steps": 6536, "total_steps": 9134, "loss": 0.5847, "learning_rate": 9.334130363579224e-06, "epoch": 0.7155094556501272, "percentage": 71.56, "elapsed_time": "5 days, 0:15:12", "remaining_time": "1 day, 23:47:58", "throughput": 2725.95, "total_tokens": 1180097184} {"current_steps": 6537, "total_steps": 9134, "loss": 0.67, "learning_rate": 9.32743027165377e-06, "epoch": 0.7156189277210652, "percentage": 71.57, "elapsed_time": "5 days, 0:16:14", "remaining_time": "1 day, 23:46:50", "throughput": 2725.91, "total_tokens": 1180249952} {"current_steps": 6538, "total_steps": 9134, "loss": 0.7916, "learning_rate": 9.320732033763351e-06, "epoch": 0.7157283997920031, "percentage": 71.58, "elapsed_time": "5 days, 0:17:22", "remaining_time": "1 day, 23:45:45", "throughput": 2725.93, "total_tokens": 1180444608} {"current_steps": 6539, "total_steps": 9134, "loss": 0.7682, "learning_rate": 9.314035650700361e-06, "epoch": 0.715837871862941, "percentage": 71.59, "elapsed_time": "5 days, 0:18:24", "remaining_time": "1 day, 23:44:37", "throughput": 2725.92, "total_tokens": 1180609024} {"current_steps": 6540, "total_steps": 9134, "loss": 0.9032, "learning_rate": 9.307341123256957e-06, "epoch": 0.7159473439338788, "percentage": 71.6, "elapsed_time": "5 days, 0:19:32", "remaining_time": "1 day, 23:43:31", "throughput": 2725.97, "total_tokens": 1180815552} {"current_steps": 6541, "total_steps": 9134, "loss": 0.7888, "learning_rate": 9.300648452225119e-06, "epoch": 0.7160568160048167, "percentage": 71.61, "elapsed_time": "5 days, 0:20:40", "remaining_time": "1 day, 23:42:26", "throughput": 2726.02, "total_tokens": 1181021408} {"current_steps": 6542, "total_steps": 9134, "loss": 0.6452, "learning_rate": 9.293957638396535e-06, "epoch": 0.7161662880757547, "percentage": 71.62, "elapsed_time": "5 days, 0:21:45", "remaining_time": "1 day, 23:41:19", "throughput": 2726.01, "total_tokens": 1181194336} {"current_steps": 6543, "total_steps": 9134, "loss": 0.7183, "learning_rate": 9.28726868256275e-06, "epoch": 0.7162757601466926, "percentage": 71.63, "elapsed_time": "5 days, 0:22:50", "remaining_time": "1 day, 23:40:13", "throughput": 2726.02, "total_tokens": 1181378688} {"current_steps": 6544, "total_steps": 9134, "loss": 1.0053, "learning_rate": 9.280581585515042e-06, "epoch": 0.7163852322176305, "percentage": 71.64, "elapsed_time": "5 days, 0:23:59", "remaining_time": "1 day, 23:39:07", "throughput": 2726.01, "total_tokens": 1181557216} {"current_steps": 6545, "total_steps": 9134, "loss": 0.9864, "learning_rate": 9.273896348044481e-06, "epoch": 0.7164947042885684, "percentage": 71.66, "elapsed_time": "5 days, 0:25:05", "remaining_time": "1 day, 23:38:01", "throughput": 2726.07, "total_tokens": 1181766656} {"current_steps": 6546, "total_steps": 9134, "loss": 0.7048, "learning_rate": 9.267212970941919e-06, "epoch": 0.7166041763595062, "percentage": 71.67, "elapsed_time": "5 days, 0:26:10", "remaining_time": "1 day, 23:36:54", "throughput": 2726.04, "total_tokens": 1181931296} {"current_steps": 6547, "total_steps": 9134, "loss": 0.7509, "learning_rate": 9.260531454997987e-06, "epoch": 0.7167136484304442, "percentage": 71.68, "elapsed_time": "5 days, 0:27:16", "remaining_time": "1 day, 23:35:48", "throughput": 2726.01, "total_tokens": 1182099296} {"current_steps": 6548, "total_steps": 9134, "loss": 0.8319, "learning_rate": 9.253851801003094e-06, "epoch": 0.7168231205013821, "percentage": 71.69, "elapsed_time": "5 days, 0:28:24", "remaining_time": "1 day, 23:34:42", "throughput": 2726.03, "total_tokens": 1182291264} {"current_steps": 6549, "total_steps": 9134, "loss": 1.0581, "learning_rate": 9.247174009747422e-06, "epoch": 0.71693259257232, "percentage": 71.7, "elapsed_time": "5 days, 0:29:33", "remaining_time": "1 day, 23:33:37", "throughput": 2726.0, "total_tokens": 1182467552} {"current_steps": 6550, "total_steps": 9134, "loss": 0.7627, "learning_rate": 9.240498082020962e-06, "epoch": 0.7170420646432579, "percentage": 71.71, "elapsed_time": "5 days, 0:30:38", "remaining_time": "1 day, 23:32:31", "throughput": 2726.02, "total_tokens": 1182653472} {"current_steps": 6551, "total_steps": 9134, "loss": 0.6753, "learning_rate": 9.23382401861345e-06, "epoch": 0.7171515367141957, "percentage": 71.72, "elapsed_time": "5 days, 0:31:42", "remaining_time": "1 day, 23:31:23", "throughput": 2726.03, "total_tokens": 1182831552} {"current_steps": 6552, "total_steps": 9134, "loss": 1.2305, "learning_rate": 9.227151820314417e-06, "epoch": 0.7172610087851337, "percentage": 71.73, "elapsed_time": "5 days, 0:32:50", "remaining_time": "1 day, 23:30:18", "throughput": 2726.12, "total_tokens": 1183056896} {"current_steps": 6553, "total_steps": 9134, "loss": 0.768, "learning_rate": 9.22048148791317e-06, "epoch": 0.7173704808560716, "percentage": 71.74, "elapsed_time": "5 days, 0:33:57", "remaining_time": "1 day, 23:29:12", "throughput": 2726.1, "total_tokens": 1183232288} {"current_steps": 6554, "total_steps": 9134, "loss": 0.8484, "learning_rate": 9.2138130221988e-06, "epoch": 0.7174799529270095, "percentage": 71.75, "elapsed_time": "5 days, 0:34:59", "remaining_time": "1 day, 23:28:04", "throughput": 2726.07, "total_tokens": 1183384160} {"current_steps": 6555, "total_steps": 9134, "loss": 0.9022, "learning_rate": 9.20714642396017e-06, "epoch": 0.7175894249979474, "percentage": 71.76, "elapsed_time": "5 days, 0:36:04", "remaining_time": "1 day, 23:26:57", "throughput": 2726.08, "total_tokens": 1183568736} {"current_steps": 6556, "total_steps": 9134, "loss": 0.8375, "learning_rate": 9.200481693985928e-06, "epoch": 0.7176988970688853, "percentage": 71.78, "elapsed_time": "5 days, 0:37:09", "remaining_time": "1 day, 23:25:51", "throughput": 2726.05, "total_tokens": 1183730912} {"current_steps": 6557, "total_steps": 9134, "loss": 0.757, "learning_rate": 9.193818833064489e-06, "epoch": 0.7178083691398232, "percentage": 71.79, "elapsed_time": "5 days, 0:38:14", "remaining_time": "1 day, 23:24:44", "throughput": 2726.1, "total_tokens": 1183927584} {"current_steps": 6558, "total_steps": 9134, "loss": 0.6658, "learning_rate": 9.187157841984082e-06, "epoch": 0.7179178412107611, "percentage": 71.8, "elapsed_time": "5 days, 0:39:22", "remaining_time": "1 day, 23:23:38", "throughput": 2726.06, "total_tokens": 1184099392} {"current_steps": 6559, "total_steps": 9134, "loss": 0.7983, "learning_rate": 9.180498721532657e-06, "epoch": 0.718027313281699, "percentage": 71.81, "elapsed_time": "5 days, 0:40:31", "remaining_time": "1 day, 23:22:33", "throughput": 2726.14, "total_tokens": 1184320480} {"current_steps": 6560, "total_steps": 9134, "loss": 0.9572, "learning_rate": 9.173841472498001e-06, "epoch": 0.7181367853526369, "percentage": 71.82, "elapsed_time": "5 days, 0:41:35", "remaining_time": "1 day, 23:21:26", "throughput": 2726.13, "total_tokens": 1184491616} {"current_steps": 6561, "total_steps": 9134, "loss": 0.7051, "learning_rate": 9.167186095667643e-06, "epoch": 0.7182462574235748, "percentage": 71.83, "elapsed_time": "5 days, 0:42:38", "remaining_time": "1 day, 23:20:19", "throughput": 2726.11, "total_tokens": 1184654464} {"current_steps": 6562, "total_steps": 9134, "loss": 0.6713, "learning_rate": 9.160532591828902e-06, "epoch": 0.7183557294945128, "percentage": 71.84, "elapsed_time": "5 days, 0:43:42", "remaining_time": "1 day, 23:19:11", "throughput": 2726.13, "total_tokens": 1184837472} {"current_steps": 6563, "total_steps": 9134, "loss": 0.7939, "learning_rate": 9.153880961768877e-06, "epoch": 0.7184652015654506, "percentage": 71.85, "elapsed_time": "5 days, 0:44:50", "remaining_time": "1 day, 23:18:06", "throughput": 2726.2, "total_tokens": 1185054080} {"current_steps": 6564, "total_steps": 9134, "loss": 0.7731, "learning_rate": 9.147231206274431e-06, "epoch": 0.7185746736363885, "percentage": 71.86, "elapsed_time": "5 days, 0:45:54", "remaining_time": "1 day, 23:16:59", "throughput": 2726.2, "total_tokens": 1185227232} {"current_steps": 6565, "total_steps": 9134, "loss": 0.7692, "learning_rate": 9.140583326132249e-06, "epoch": 0.7186841457073264, "percentage": 71.87, "elapsed_time": "5 days, 0:46:55", "remaining_time": "1 day, 23:15:50", "throughput": 2726.15, "total_tokens": 1185370368} {"current_steps": 6566, "total_steps": 9134, "loss": 0.6939, "learning_rate": 9.133937322128722e-06, "epoch": 0.7187936177782643, "percentage": 71.89, "elapsed_time": "5 days, 0:48:00", "remaining_time": "1 day, 23:14:44", "throughput": 2726.14, "total_tokens": 1185543744} {"current_steps": 6567, "total_steps": 9134, "loss": 1.0002, "learning_rate": 9.127293195050096e-06, "epoch": 0.7189030898492023, "percentage": 71.9, "elapsed_time": "5 days, 0:49:03", "remaining_time": "1 day, 23:13:36", "throughput": 2726.15, "total_tokens": 1185722720} {"current_steps": 6568, "total_steps": 9134, "loss": 0.5654, "learning_rate": 9.120650945682325e-06, "epoch": 0.7190125619201401, "percentage": 71.91, "elapsed_time": "5 days, 0:50:09", "remaining_time": "1 day, 23:12:30", "throughput": 2726.18, "total_tokens": 1185913792} {"current_steps": 6569, "total_steps": 9134, "loss": 0.6868, "learning_rate": 9.114010574811197e-06, "epoch": 0.719122033991078, "percentage": 71.92, "elapsed_time": "5 days, 0:51:16", "remaining_time": "1 day, 23:11:24", "throughput": 2726.17, "total_tokens": 1186092768} {"current_steps": 6570, "total_steps": 9134, "loss": 0.8304, "learning_rate": 9.107372083222251e-06, "epoch": 0.7192315060620159, "percentage": 71.93, "elapsed_time": "5 days, 0:52:17", "remaining_time": "1 day, 23:10:16", "throughput": 2726.16, "total_tokens": 1186254720} {"current_steps": 6571, "total_steps": 9134, "loss": 0.8053, "learning_rate": 9.100735471700805e-06, "epoch": 0.7193409781329538, "percentage": 71.94, "elapsed_time": "5 days, 0:53:24", "remaining_time": "1 day, 23:09:10", "throughput": 2726.19, "total_tokens": 1186450944} {"current_steps": 6572, "total_steps": 9134, "loss": 0.5698, "learning_rate": 9.094100741031961e-06, "epoch": 0.7194504502038918, "percentage": 71.95, "elapsed_time": "5 days, 0:54:29", "remaining_time": "1 day, 23:08:03", "throughput": 2726.21, "total_tokens": 1186634400} {"current_steps": 6573, "total_steps": 9134, "loss": 0.6843, "learning_rate": 9.087467892000582e-06, "epoch": 0.7195599222748297, "percentage": 71.96, "elapsed_time": "5 days, 0:55:34", "remaining_time": "1 day, 23:06:56", "throughput": 2726.13, "total_tokens": 1186778432} {"current_steps": 6574, "total_steps": 9134, "loss": 0.7123, "learning_rate": 9.08083692539135e-06, "epoch": 0.7196693943457675, "percentage": 71.97, "elapsed_time": "5 days, 0:56:39", "remaining_time": "1 day, 23:05:50", "throughput": 2726.15, "total_tokens": 1186964128} {"current_steps": 6575, "total_steps": 9134, "loss": 0.8055, "learning_rate": 9.07420784198866e-06, "epoch": 0.7197788664167054, "percentage": 71.98, "elapsed_time": "5 days, 0:57:40", "remaining_time": "1 day, 23:04:41", "throughput": 2726.13, "total_tokens": 1187123392} {"current_steps": 6576, "total_steps": 9134, "loss": 0.7627, "learning_rate": 9.067580642576746e-06, "epoch": 0.7198883384876433, "percentage": 71.99, "elapsed_time": "5 days, 0:58:43", "remaining_time": "1 day, 23:03:34", "throughput": 2726.11, "total_tokens": 1187283552} {"current_steps": 6577, "total_steps": 9134, "loss": 0.9206, "learning_rate": 9.060955327939582e-06, "epoch": 0.7199978105585813, "percentage": 72.01, "elapsed_time": "5 days, 0:59:49", "remaining_time": "1 day, 23:02:28", "throughput": 2726.13, "total_tokens": 1187473952} {"current_steps": 6578, "total_steps": 9134, "loss": 0.7725, "learning_rate": 9.054331898860935e-06, "epoch": 0.7201072826295192, "percentage": 72.02, "elapsed_time": "5 days, 1:00:52", "remaining_time": "1 day, 23:01:20", "throughput": 2726.11, "total_tokens": 1187635456} {"current_steps": 6579, "total_steps": 9134, "loss": 0.9809, "learning_rate": 9.047710356124342e-06, "epoch": 0.7202167547004571, "percentage": 72.03, "elapsed_time": "5 days, 1:01:55", "remaining_time": "1 day, 23:00:13", "throughput": 2726.11, "total_tokens": 1187807712} {"current_steps": 6580, "total_steps": 9134, "loss": 0.6504, "learning_rate": 9.041090700513117e-06, "epoch": 0.7203262267713949, "percentage": 72.04, "elapsed_time": "5 days, 1:03:02", "remaining_time": "1 day, 22:59:07", "throughput": 2726.1, "total_tokens": 1187987360} {"current_steps": 6581, "total_steps": 9134, "loss": 0.7909, "learning_rate": 9.034472932810354e-06, "epoch": 0.7204356988423328, "percentage": 72.05, "elapsed_time": "5 days, 1:04:09", "remaining_time": "1 day, 22:58:01", "throughput": 2726.16, "total_tokens": 1188194112} {"current_steps": 6582, "total_steps": 9134, "loss": 0.9215, "learning_rate": 9.027857053798913e-06, "epoch": 0.7205451709132707, "percentage": 72.06, "elapsed_time": "5 days, 1:05:16", "remaining_time": "1 day, 22:56:55", "throughput": 2726.22, "total_tokens": 1188406912} {"current_steps": 6583, "total_steps": 9134, "loss": 1.0656, "learning_rate": 9.02124306426146e-06, "epoch": 0.7206546429842087, "percentage": 72.07, "elapsed_time": "5 days, 1:06:24", "remaining_time": "1 day, 22:55:49", "throughput": 2726.28, "total_tokens": 1188616576} {"current_steps": 6584, "total_steps": 9134, "loss": 0.9511, "learning_rate": 9.014630964980404e-06, "epoch": 0.7207641150551466, "percentage": 72.08, "elapsed_time": "5 days, 1:07:31", "remaining_time": "1 day, 22:54:43", "throughput": 2726.34, "total_tokens": 1188824448} {"current_steps": 6585, "total_steps": 9134, "loss": 0.8529, "learning_rate": 9.008020756737945e-06, "epoch": 0.7208735871260844, "percentage": 72.09, "elapsed_time": "5 days, 1:08:39", "remaining_time": "1 day, 22:53:38", "throughput": 2726.35, "total_tokens": 1189011936} {"current_steps": 6586, "total_steps": 9134, "loss": 0.9814, "learning_rate": 9.001412440316059e-06, "epoch": 0.7209830591970223, "percentage": 72.1, "elapsed_time": "5 days, 1:09:43", "remaining_time": "1 day, 22:52:31", "throughput": 2726.38, "total_tokens": 1189202336} {"current_steps": 6587, "total_steps": 9134, "loss": 0.7476, "learning_rate": 8.994806016496499e-06, "epoch": 0.7210925312679602, "percentage": 72.12, "elapsed_time": "5 days, 1:10:50", "remaining_time": "1 day, 22:51:25", "throughput": 2726.37, "total_tokens": 1189381536} {"current_steps": 6588, "total_steps": 9134, "loss": 0.7003, "learning_rate": 8.988201486060791e-06, "epoch": 0.7212020033388982, "percentage": 72.13, "elapsed_time": "5 days, 1:11:58", "remaining_time": "1 day, 22:50:19", "throughput": 2726.4, "total_tokens": 1189580224} {"current_steps": 6589, "total_steps": 9134, "loss": 0.6302, "learning_rate": 8.981598849790238e-06, "epoch": 0.7213114754098361, "percentage": 72.14, "elapsed_time": "5 days, 1:13:03", "remaining_time": "1 day, 22:49:12", "throughput": 2726.4, "total_tokens": 1189753376} {"current_steps": 6590, "total_steps": 9134, "loss": 0.9024, "learning_rate": 8.974998108465907e-06, "epoch": 0.721420947480774, "percentage": 72.15, "elapsed_time": "5 days, 1:14:08", "remaining_time": "1 day, 22:48:06", "throughput": 2726.39, "total_tokens": 1189929664} {"current_steps": 6591, "total_steps": 9134, "loss": 0.6359, "learning_rate": 8.968399262868677e-06, "epoch": 0.7215304195517118, "percentage": 72.16, "elapsed_time": "5 days, 1:15:14", "remaining_time": "1 day, 22:46:59", "throughput": 2726.42, "total_tokens": 1190118720} {"current_steps": 6592, "total_steps": 9134, "loss": 0.7358, "learning_rate": 8.961802313779166e-06, "epoch": 0.7216398916226497, "percentage": 72.17, "elapsed_time": "5 days, 1:16:19", "remaining_time": "1 day, 22:45:53", "throughput": 2726.43, "total_tokens": 1190302624} {"current_steps": 6593, "total_steps": 9134, "loss": 0.768, "learning_rate": 8.955207261977783e-06, "epoch": 0.7217493636935877, "percentage": 72.18, "elapsed_time": "5 days, 1:17:27", "remaining_time": "1 day, 22:44:47", "throughput": 2726.48, "total_tokens": 1190510720} {"current_steps": 6594, "total_steps": 9134, "loss": 0.83, "learning_rate": 8.948614108244705e-06, "epoch": 0.7218588357645256, "percentage": 72.19, "elapsed_time": "5 days, 1:18:34", "remaining_time": "1 day, 22:43:42", "throughput": 2726.54, "total_tokens": 1190721952} {"current_steps": 6595, "total_steps": 9134, "loss": 0.6181, "learning_rate": 8.942022853359896e-06, "epoch": 0.7219683078354635, "percentage": 72.2, "elapsed_time": "5 days, 1:19:40", "remaining_time": "1 day, 22:42:35", "throughput": 2726.51, "total_tokens": 1190887264} {"current_steps": 6596, "total_steps": 9134, "loss": 0.837, "learning_rate": 8.935433498103086e-06, "epoch": 0.7220777799064014, "percentage": 72.21, "elapsed_time": "5 days, 1:20:40", "remaining_time": "1 day, 22:41:27", "throughput": 2726.5, "total_tokens": 1191047872} {"current_steps": 6597, "total_steps": 9134, "loss": 0.5566, "learning_rate": 8.928846043253772e-06, "epoch": 0.7221872519773392, "percentage": 72.22, "elapsed_time": "5 days, 1:21:48", "remaining_time": "1 day, 22:40:21", "throughput": 2726.57, "total_tokens": 1191261344} {"current_steps": 6598, "total_steps": 9134, "loss": 0.7768, "learning_rate": 8.922260489591266e-06, "epoch": 0.7222967240482772, "percentage": 72.24, "elapsed_time": "5 days, 1:22:54", "remaining_time": "1 day, 22:39:15", "throughput": 2726.55, "total_tokens": 1191432032} {"current_steps": 6599, "total_steps": 9134, "loss": 0.7494, "learning_rate": 8.915676837894593e-06, "epoch": 0.7224061961192151, "percentage": 72.25, "elapsed_time": "5 days, 1:24:01", "remaining_time": "1 day, 22:38:09", "throughput": 2726.53, "total_tokens": 1191609216} {"current_steps": 6600, "total_steps": 9134, "loss": 0.624, "learning_rate": 8.909095088942617e-06, "epoch": 0.722515668190153, "percentage": 72.26, "elapsed_time": "5 days, 1:25:06", "remaining_time": "1 day, 22:37:02", "throughput": 2726.56, "total_tokens": 1191799392} {"current_steps": 6601, "total_steps": 9134, "loss": 0.658, "learning_rate": 8.902515243513918e-06, "epoch": 0.7226251402610909, "percentage": 72.27, "elapsed_time": "5 days, 1:26:14", "remaining_time": "1 day, 22:35:56", "throughput": 2726.59, "total_tokens": 1191994048} {"current_steps": 6602, "total_steps": 9134, "loss": 0.6592, "learning_rate": 8.895937302386898e-06, "epoch": 0.7227346123320287, "percentage": 72.28, "elapsed_time": "5 days, 1:27:16", "remaining_time": "1 day, 22:34:49", "throughput": 2726.56, "total_tokens": 1192150176} {"current_steps": 6603, "total_steps": 9134, "loss": 0.8872, "learning_rate": 8.88936126633971e-06, "epoch": 0.7228440844029667, "percentage": 72.29, "elapsed_time": "5 days, 1:28:24", "remaining_time": "1 day, 22:33:43", "throughput": 2726.6, "total_tokens": 1192355136} {"current_steps": 6604, "total_steps": 9134, "loss": 0.8755, "learning_rate": 8.882787136150275e-06, "epoch": 0.7229535564739046, "percentage": 72.3, "elapsed_time": "5 days, 1:29:29", "remaining_time": "1 day, 22:32:36", "throughput": 2726.62, "total_tokens": 1192540832} {"current_steps": 6605, "total_steps": 9134, "loss": 0.6953, "learning_rate": 8.876214912596331e-06, "epoch": 0.7230630285448425, "percentage": 72.31, "elapsed_time": "5 days, 1:30:37", "remaining_time": "1 day, 22:31:31", "throughput": 2726.67, "total_tokens": 1192746240} {"current_steps": 6606, "total_steps": 9134, "loss": 0.7222, "learning_rate": 8.869644596455324e-06, "epoch": 0.7231725006157804, "percentage": 72.32, "elapsed_time": "5 days, 1:31:45", "remaining_time": "1 day, 22:30:25", "throughput": 2726.71, "total_tokens": 1192951648} {"current_steps": 6607, "total_steps": 9134, "loss": 0.7606, "learning_rate": 8.863076188504537e-06, "epoch": 0.7232819726867183, "percentage": 72.33, "elapsed_time": "5 days, 1:32:53", "remaining_time": "1 day, 22:29:20", "throughput": 2726.74, "total_tokens": 1193149440} {"current_steps": 6608, "total_steps": 9134, "loss": 0.7701, "learning_rate": 8.856509689520976e-06, "epoch": 0.7233914447576562, "percentage": 72.35, "elapsed_time": "5 days, 1:33:59", "remaining_time": "1 day, 22:28:13", "throughput": 2726.73, "total_tokens": 1193323488} {"current_steps": 6609, "total_steps": 9134, "loss": 0.6302, "learning_rate": 8.849945100281474e-06, "epoch": 0.7235009168285941, "percentage": 72.36, "elapsed_time": "5 days, 1:35:02", "remaining_time": "1 day, 22:27:06", "throughput": 2726.71, "total_tokens": 1193487456} {"current_steps": 6610, "total_steps": 9134, "loss": 0.7829, "learning_rate": 8.843382421562573e-06, "epoch": 0.723610388899532, "percentage": 72.37, "elapsed_time": "5 days, 1:36:05", "remaining_time": "1 day, 22:25:58", "throughput": 2726.72, "total_tokens": 1193662400} {"current_steps": 6611, "total_steps": 9134, "loss": 1.2094, "learning_rate": 8.836821654140656e-06, "epoch": 0.7237198609704699, "percentage": 72.38, "elapsed_time": "5 days, 1:37:12", "remaining_time": "1 day, 22:24:52", "throughput": 2726.77, "total_tokens": 1193868704} {"current_steps": 6612, "total_steps": 9134, "loss": 0.8877, "learning_rate": 8.830262798791838e-06, "epoch": 0.7238293330414078, "percentage": 72.39, "elapsed_time": "5 days, 1:38:19", "remaining_time": "1 day, 22:23:47", "throughput": 2726.79, "total_tokens": 1194062464} {"current_steps": 6613, "total_steps": 9134, "loss": 0.644, "learning_rate": 8.823705856292019e-06, "epoch": 0.7239388051123458, "percentage": 72.4, "elapsed_time": "5 days, 1:39:23", "remaining_time": "1 day, 22:22:39", "throughput": 2726.77, "total_tokens": 1194226432} {"current_steps": 6614, "total_steps": 9134, "loss": 0.7796, "learning_rate": 8.817150827416876e-06, "epoch": 0.7240482771832836, "percentage": 72.41, "elapsed_time": "5 days, 1:40:30", "remaining_time": "1 day, 22:21:33", "throughput": 2726.77, "total_tokens": 1194406976} {"current_steps": 6615, "total_steps": 9134, "loss": 0.8061, "learning_rate": 8.810597712941843e-06, "epoch": 0.7241577492542215, "percentage": 72.42, "elapsed_time": "5 days, 1:41:33", "remaining_time": "1 day, 22:20:26", "throughput": 2726.78, "total_tokens": 1194581696} {"current_steps": 6616, "total_steps": 9134, "loss": 0.9857, "learning_rate": 8.80404651364217e-06, "epoch": 0.7242672213251594, "percentage": 72.43, "elapsed_time": "5 days, 1:42:40", "remaining_time": "1 day, 22:19:20", "throughput": 2726.76, "total_tokens": 1194760000} {"current_steps": 6617, "total_steps": 9134, "loss": 0.9998, "learning_rate": 8.797497230292814e-06, "epoch": 0.7243766933960973, "percentage": 72.44, "elapsed_time": "5 days, 1:43:45", "remaining_time": "1 day, 22:18:13", "throughput": 2726.69, "total_tokens": 1194905600} {"current_steps": 6618, "total_steps": 9134, "loss": 1.0156, "learning_rate": 8.790949863668571e-06, "epoch": 0.7244861654670353, "percentage": 72.45, "elapsed_time": "5 days, 1:44:52", "remaining_time": "1 day, 22:17:08", "throughput": 2726.74, "total_tokens": 1195112352} {"current_steps": 6619, "total_steps": 9134, "loss": 0.8343, "learning_rate": 8.784404414543973e-06, "epoch": 0.7245956375379731, "percentage": 72.47, "elapsed_time": "5 days, 1:45:56", "remaining_time": "1 day, 22:16:01", "throughput": 2726.68, "total_tokens": 1195259296} {"current_steps": 6620, "total_steps": 9134, "loss": 0.9077, "learning_rate": 8.777860883693335e-06, "epoch": 0.724705109608911, "percentage": 72.48, "elapsed_time": "5 days, 1:47:03", "remaining_time": "1 day, 22:14:55", "throughput": 2726.69, "total_tokens": 1195444544} {"current_steps": 6621, "total_steps": 9134, "loss": 0.7657, "learning_rate": 8.771319271890741e-06, "epoch": 0.7248145816798489, "percentage": 72.49, "elapsed_time": "5 days, 1:48:11", "remaining_time": "1 day, 22:13:49", "throughput": 2726.72, "total_tokens": 1195644576} {"current_steps": 6622, "total_steps": 9134, "loss": 0.6545, "learning_rate": 8.764779579910054e-06, "epoch": 0.7249240537507868, "percentage": 72.5, "elapsed_time": "5 days, 1:49:16", "remaining_time": "1 day, 22:12:42", "throughput": 2726.71, "total_tokens": 1195815040} {"current_steps": 6623, "total_steps": 9134, "loss": 0.9177, "learning_rate": 8.758241808524906e-06, "epoch": 0.7250335258217248, "percentage": 72.51, "elapsed_time": "5 days, 1:50:21", "remaining_time": "1 day, 22:11:36", "throughput": 2726.7, "total_tokens": 1195992224} {"current_steps": 6624, "total_steps": 9134, "loss": 1.0859, "learning_rate": 8.751705958508697e-06, "epoch": 0.7251429978926627, "percentage": 72.52, "elapsed_time": "5 days, 1:51:30", "remaining_time": "1 day, 22:10:30", "throughput": 2726.72, "total_tokens": 1196187328} {"current_steps": 6625, "total_steps": 9134, "loss": 0.9452, "learning_rate": 8.745172030634616e-06, "epoch": 0.7252524699636005, "percentage": 72.53, "elapsed_time": "5 days, 1:52:35", "remaining_time": "1 day, 22:09:24", "throughput": 2726.69, "total_tokens": 1196350624} {"current_steps": 6626, "total_steps": 9134, "loss": 0.9741, "learning_rate": 8.738640025675612e-06, "epoch": 0.7253619420345384, "percentage": 72.54, "elapsed_time": "5 days, 1:53:39", "remaining_time": "1 day, 22:08:16", "throughput": 2726.71, "total_tokens": 1196531616} {"current_steps": 6627, "total_steps": 9134, "loss": 0.6813, "learning_rate": 8.732109944404408e-06, "epoch": 0.7254714141054763, "percentage": 72.55, "elapsed_time": "5 days, 1:54:46", "remaining_time": "1 day, 22:07:11", "throughput": 2726.72, "total_tokens": 1196722240} {"current_steps": 6628, "total_steps": 9134, "loss": 0.9786, "learning_rate": 8.725581787593496e-06, "epoch": 0.7255808861764143, "percentage": 72.56, "elapsed_time": "5 days, 1:55:55", "remaining_time": "1 day, 22:06:05", "throughput": 2726.8, "total_tokens": 1196941312} {"current_steps": 6629, "total_steps": 9134, "loss": 0.9005, "learning_rate": 8.719055556015149e-06, "epoch": 0.7256903582473522, "percentage": 72.57, "elapsed_time": "5 days, 1:56:57", "remaining_time": "1 day, 22:04:58", "throughput": 2726.76, "total_tokens": 1197095872} {"current_steps": 6630, "total_steps": 9134, "loss": 0.8307, "learning_rate": 8.712531250441394e-06, "epoch": 0.7257998303182901, "percentage": 72.59, "elapsed_time": "5 days, 1:58:06", "remaining_time": "1 day, 22:03:52", "throughput": 2726.76, "total_tokens": 1197283808} {"current_steps": 6631, "total_steps": 9134, "loss": 0.8498, "learning_rate": 8.706008871644075e-06, "epoch": 0.7259093023892279, "percentage": 72.6, "elapsed_time": "5 days, 1:59:12", "remaining_time": "1 day, 22:02:46", "throughput": 2726.76, "total_tokens": 1197463904} {"current_steps": 6632, "total_steps": 9134, "loss": 0.6923, "learning_rate": 8.699488420394741e-06, "epoch": 0.7260187744601658, "percentage": 72.61, "elapsed_time": "5 days, 2:00:17", "remaining_time": "1 day, 22:01:39", "throughput": 2726.74, "total_tokens": 1197631904} {"current_steps": 6633, "total_steps": 9134, "loss": 0.7962, "learning_rate": 8.692969897464775e-06, "epoch": 0.7261282465311037, "percentage": 72.62, "elapsed_time": "5 days, 2:01:21", "remaining_time": "1 day, 22:00:33", "throughput": 2726.78, "total_tokens": 1197826560} {"current_steps": 6634, "total_steps": 9134, "loss": 0.8388, "learning_rate": 8.686453303625294e-06, "epoch": 0.7262377186020417, "percentage": 72.63, "elapsed_time": "5 days, 2:02:26", "remaining_time": "1 day, 21:59:26", "throughput": 2726.79, "total_tokens": 1198005088} {"current_steps": 6635, "total_steps": 9134, "loss": 0.9238, "learning_rate": 8.679938639647203e-06, "epoch": 0.7263471906729796, "percentage": 72.64, "elapsed_time": "5 days, 2:03:30", "remaining_time": "1 day, 21:58:19", "throughput": 2726.78, "total_tokens": 1198174656} {"current_steps": 6636, "total_steps": 9134, "loss": 0.7076, "learning_rate": 8.673425906301171e-06, "epoch": 0.7264566627439174, "percentage": 72.65, "elapsed_time": "5 days, 2:04:36", "remaining_time": "1 day, 21:57:12", "throughput": 2726.83, "total_tokens": 1198376704} {"current_steps": 6637, "total_steps": 9134, "loss": 0.8841, "learning_rate": 8.666915104357637e-06, "epoch": 0.7265661348148553, "percentage": 72.66, "elapsed_time": "5 days, 2:05:40", "remaining_time": "1 day, 21:56:05", "throughput": 2726.81, "total_tokens": 1198542016} {"current_steps": 6638, "total_steps": 9134, "loss": 0.7606, "learning_rate": 8.660406234586838e-06, "epoch": 0.7266756068857932, "percentage": 72.67, "elapsed_time": "5 days, 2:06:43", "remaining_time": "1 day, 21:54:58", "throughput": 2726.8, "total_tokens": 1198709568} {"current_steps": 6639, "total_steps": 9134, "loss": 0.6159, "learning_rate": 8.653899297758728e-06, "epoch": 0.7267850789567312, "percentage": 72.68, "elapsed_time": "5 days, 2:07:51", "remaining_time": "1 day, 21:53:52", "throughput": 2726.82, "total_tokens": 1198902432} {"current_steps": 6640, "total_steps": 9134, "loss": 0.8114, "learning_rate": 8.647394294643099e-06, "epoch": 0.7268945510276691, "percentage": 72.7, "elapsed_time": "5 days, 2:08:56", "remaining_time": "1 day, 21:52:46", "throughput": 2726.85, "total_tokens": 1199097088} {"current_steps": 6641, "total_steps": 9134, "loss": 0.7512, "learning_rate": 8.640891226009449e-06, "epoch": 0.727004023098607, "percentage": 72.71, "elapsed_time": "5 days, 2:09:58", "remaining_time": "1 day, 21:51:38", "throughput": 2726.83, "total_tokens": 1199253664} {"current_steps": 6642, "total_steps": 9134, "loss": 0.7364, "learning_rate": 8.63439009262711e-06, "epoch": 0.7271134951695448, "percentage": 72.72, "elapsed_time": "5 days, 2:11:03", "remaining_time": "1 day, 21:50:31", "throughput": 2726.85, "total_tokens": 1199444064} {"current_steps": 6643, "total_steps": 9134, "loss": 0.8733, "learning_rate": 8.62789089526512e-06, "epoch": 0.7272229672404827, "percentage": 72.73, "elapsed_time": "5 days, 2:12:12", "remaining_time": "1 day, 21:49:26", "throughput": 2726.88, "total_tokens": 1199642304} {"current_steps": 6644, "total_steps": 9134, "loss": 0.9894, "learning_rate": 8.621393634692346e-06, "epoch": 0.7273324393114207, "percentage": 72.74, "elapsed_time": "5 days, 2:13:20", "remaining_time": "1 day, 21:48:20", "throughput": 2726.94, "total_tokens": 1199855104} {"current_steps": 6645, "total_steps": 9134, "loss": 0.7521, "learning_rate": 8.614898311677397e-06, "epoch": 0.7274419113823586, "percentage": 72.75, "elapsed_time": "5 days, 2:14:29", "remaining_time": "1 day, 21:47:15", "throughput": 2726.93, "total_tokens": 1200036320} {"current_steps": 6646, "total_steps": 9134, "loss": 0.8166, "learning_rate": 8.608404926988644e-06, "epoch": 0.7275513834532965, "percentage": 72.76, "elapsed_time": "5 days, 2:15:32", "remaining_time": "1 day, 21:46:08", "throughput": 2726.89, "total_tokens": 1200191776} {"current_steps": 6647, "total_steps": 9134, "loss": 0.5999, "learning_rate": 8.601913481394273e-06, "epoch": 0.7276608555242344, "percentage": 72.77, "elapsed_time": "5 days, 2:16:30", "remaining_time": "1 day, 21:44:59", "throughput": 2726.82, "total_tokens": 1200319904} {"current_steps": 6648, "total_steps": 9134, "loss": 0.6633, "learning_rate": 8.595423975662168e-06, "epoch": 0.7277703275951722, "percentage": 72.78, "elapsed_time": "5 days, 2:17:36", "remaining_time": "1 day, 21:43:52", "throughput": 2726.83, "total_tokens": 1200505376} {"current_steps": 6649, "total_steps": 9134, "loss": 0.7045, "learning_rate": 8.588936410560065e-06, "epoch": 0.7278797996661102, "percentage": 72.79, "elapsed_time": "5 days, 2:18:42", "remaining_time": "1 day, 21:42:46", "throughput": 2726.78, "total_tokens": 1200663296} {"current_steps": 6650, "total_steps": 9134, "loss": 0.8198, "learning_rate": 8.582450786855394e-06, "epoch": 0.7279892717370481, "percentage": 72.8, "elapsed_time": "5 days, 2:19:45", "remaining_time": "1 day, 21:41:38", "throughput": 2726.79, "total_tokens": 1200840704} {"current_steps": 6651, "total_steps": 9134, "loss": 0.6319, "learning_rate": 8.575967105315422e-06, "epoch": 0.728098743807986, "percentage": 72.82, "elapsed_time": "5 days, 2:20:49", "remaining_time": "1 day, 21:40:31", "throughput": 2726.75, "total_tokens": 1200995488} {"current_steps": 6652, "total_steps": 9134, "loss": 0.9258, "learning_rate": 8.569485366707142e-06, "epoch": 0.7282082158789239, "percentage": 72.83, "elapsed_time": "5 days, 2:21:54", "remaining_time": "1 day, 21:39:25", "throughput": 2726.72, "total_tokens": 1201162144} {"current_steps": 6653, "total_steps": 9134, "loss": 0.7841, "learning_rate": 8.563005571797334e-06, "epoch": 0.7283176879498617, "percentage": 72.84, "elapsed_time": "5 days, 2:23:00", "remaining_time": "1 day, 21:38:18", "throughput": 2726.68, "total_tokens": 1201322528} {"current_steps": 6654, "total_steps": 9134, "loss": 0.932, "learning_rate": 8.556527721352542e-06, "epoch": 0.7284271600207997, "percentage": 72.85, "elapsed_time": "5 days, 2:24:05", "remaining_time": "1 day, 21:37:12", "throughput": 2726.7, "total_tokens": 1201507104} {"current_steps": 6655, "total_steps": 9134, "loss": 0.9286, "learning_rate": 8.550051816139088e-06, "epoch": 0.7285366320917376, "percentage": 72.86, "elapsed_time": "5 days, 2:25:09", "remaining_time": "1 day, 21:36:04", "throughput": 2726.7, "total_tokens": 1201679808} {"current_steps": 6656, "total_steps": 9134, "loss": 0.9688, "learning_rate": 8.543577856923058e-06, "epoch": 0.7286461041626755, "percentage": 72.87, "elapsed_time": "5 days, 2:26:12", "remaining_time": "1 day, 21:34:57", "throughput": 2726.69, "total_tokens": 1201852288} {"current_steps": 6657, "total_steps": 9134, "loss": 0.8774, "learning_rate": 8.537105844470297e-06, "epoch": 0.7287555762336134, "percentage": 72.88, "elapsed_time": "5 days, 2:27:18", "remaining_time": "1 day, 21:33:51", "throughput": 2726.66, "total_tokens": 1202016032} {"current_steps": 6658, "total_steps": 9134, "loss": 0.9674, "learning_rate": 8.530635779546453e-06, "epoch": 0.7288650483045513, "percentage": 72.89, "elapsed_time": "5 days, 2:28:25", "remaining_time": "1 day, 21:32:45", "throughput": 2726.66, "total_tokens": 1202197920} {"current_steps": 6659, "total_steps": 9134, "loss": 0.8467, "learning_rate": 8.524167662916913e-06, "epoch": 0.7289745203754892, "percentage": 72.9, "elapsed_time": "5 days, 2:29:29", "remaining_time": "1 day, 21:31:38", "throughput": 2726.64, "total_tokens": 1202364128} {"current_steps": 6660, "total_steps": 9134, "loss": 0.8004, "learning_rate": 8.517701495346842e-06, "epoch": 0.7290839924464271, "percentage": 72.91, "elapsed_time": "5 days, 2:30:31", "remaining_time": "1 day, 21:30:30", "throughput": 2726.63, "total_tokens": 1202526976} {"current_steps": 6661, "total_steps": 9134, "loss": 0.7838, "learning_rate": 8.511237277601174e-06, "epoch": 0.729193464517365, "percentage": 72.93, "elapsed_time": "5 days, 2:31:30", "remaining_time": "1 day, 21:29:21", "throughput": 2726.61, "total_tokens": 1202679296} {"current_steps": 6662, "total_steps": 9134, "loss": 0.6777, "learning_rate": 8.504775010444616e-06, "epoch": 0.7293029365883029, "percentage": 72.94, "elapsed_time": "5 days, 2:32:37", "remaining_time": "1 day, 21:28:15", "throughput": 2726.58, "total_tokens": 1202850880} {"current_steps": 6663, "total_steps": 9134, "loss": 0.9366, "learning_rate": 8.49831469464164e-06, "epoch": 0.7294124086592408, "percentage": 72.95, "elapsed_time": "5 days, 2:33:39", "remaining_time": "1 day, 21:27:08", "throughput": 2726.57, "total_tokens": 1203017536} {"current_steps": 6664, "total_steps": 9134, "loss": 1.0457, "learning_rate": 8.491856330956491e-06, "epoch": 0.7295218807301788, "percentage": 72.96, "elapsed_time": "5 days, 2:34:40", "remaining_time": "1 day, 21:25:59", "throughput": 2726.55, "total_tokens": 1203173888} {"current_steps": 6665, "total_steps": 9134, "loss": 0.8974, "learning_rate": 8.48539992015317e-06, "epoch": 0.7296313528011166, "percentage": 72.97, "elapsed_time": "5 days, 2:35:45", "remaining_time": "1 day, 21:24:53", "throughput": 2726.53, "total_tokens": 1203339872} {"current_steps": 6666, "total_steps": 9134, "loss": 0.6084, "learning_rate": 8.478945462995477e-06, "epoch": 0.7297408248720545, "percentage": 72.98, "elapsed_time": "5 days, 2:36:51", "remaining_time": "1 day, 21:23:47", "throughput": 2726.49, "total_tokens": 1203505632} {"current_steps": 6667, "total_steps": 9134, "loss": 0.8562, "learning_rate": 8.472492960246953e-06, "epoch": 0.7298502969429924, "percentage": 72.99, "elapsed_time": "5 days, 2:37:58", "remaining_time": "1 day, 21:22:40", "throughput": 2726.49, "total_tokens": 1203686848} {"current_steps": 6668, "total_steps": 9134, "loss": 0.7483, "learning_rate": 8.466042412670916e-06, "epoch": 0.7299597690139303, "percentage": 73.0, "elapsed_time": "5 days, 2:38:58", "remaining_time": "1 day, 21:21:32", "throughput": 2726.45, "total_tokens": 1203832448} {"current_steps": 6669, "total_steps": 9134, "loss": 0.5752, "learning_rate": 8.459593821030454e-06, "epoch": 0.7300692410848683, "percentage": 73.01, "elapsed_time": "5 days, 2:40:02", "remaining_time": "1 day, 21:20:25", "throughput": 2726.48, "total_tokens": 1204020608} {"current_steps": 6670, "total_steps": 9134, "loss": 0.7345, "learning_rate": 8.453147186088423e-06, "epoch": 0.7301787131558061, "percentage": 73.02, "elapsed_time": "5 days, 2:41:05", "remaining_time": "1 day, 21:19:17", "throughput": 2726.49, "total_tokens": 1204195104} {"current_steps": 6671, "total_steps": 9134, "loss": 1.0612, "learning_rate": 8.446702508607449e-06, "epoch": 0.730288185226744, "percentage": 73.03, "elapsed_time": "5 days, 2:42:09", "remaining_time": "1 day, 21:18:11", "throughput": 2726.48, "total_tokens": 1204366688} {"current_steps": 6672, "total_steps": 9134, "loss": 0.6685, "learning_rate": 8.440259789349913e-06, "epoch": 0.7303976572976819, "percentage": 73.05, "elapsed_time": "5 days, 2:43:15", "remaining_time": "1 day, 21:17:04", "throughput": 2726.5, "total_tokens": 1204555744} {"current_steps": 6673, "total_steps": 9134, "loss": 0.9997, "learning_rate": 8.433819029078005e-06, "epoch": 0.7305071293686198, "percentage": 73.06, "elapsed_time": "5 days, 2:44:23", "remaining_time": "1 day, 21:15:58", "throughput": 2726.51, "total_tokens": 1204745920} {"current_steps": 6674, "total_steps": 9134, "loss": 0.6609, "learning_rate": 8.42738022855362e-06, "epoch": 0.7306166014395578, "percentage": 73.07, "elapsed_time": "5 days, 2:45:31", "remaining_time": "1 day, 21:14:53", "throughput": 2726.51, "total_tokens": 1204930496} {"current_steps": 6675, "total_steps": 9134, "loss": 0.8714, "learning_rate": 8.42094338853848e-06, "epoch": 0.7307260735104957, "percentage": 73.08, "elapsed_time": "5 days, 2:46:36", "remaining_time": "1 day, 21:13:47", "throughput": 2726.5, "total_tokens": 1205102528} {"current_steps": 6676, "total_steps": 9134, "loss": 0.9924, "learning_rate": 8.414508509794044e-06, "epoch": 0.7308355455814335, "percentage": 73.09, "elapsed_time": "5 days, 2:47:44", "remaining_time": "1 day, 21:12:41", "throughput": 2726.55, "total_tokens": 1205309952} {"current_steps": 6677, "total_steps": 9134, "loss": 0.6985, "learning_rate": 8.408075593081546e-06, "epoch": 0.7309450176523714, "percentage": 73.1, "elapsed_time": "5 days, 2:48:51", "remaining_time": "1 day, 21:11:35", "throughput": 2726.53, "total_tokens": 1205486240} {"current_steps": 6678, "total_steps": 9134, "loss": 1.0486, "learning_rate": 8.401644639161987e-06, "epoch": 0.7310544897233093, "percentage": 73.11, "elapsed_time": "5 days, 2:50:00", "remaining_time": "1 day, 21:10:30", "throughput": 2726.52, "total_tokens": 1205669024} {"current_steps": 6679, "total_steps": 9134, "loss": 0.7749, "learning_rate": 8.39521564879613e-06, "epoch": 0.7311639617942473, "percentage": 73.12, "elapsed_time": "5 days, 2:51:04", "remaining_time": "1 day, 21:09:23", "throughput": 2726.48, "total_tokens": 1205823808} {"current_steps": 6680, "total_steps": 9134, "loss": 0.8423, "learning_rate": 8.38878862274453e-06, "epoch": 0.7312734338651852, "percentage": 73.13, "elapsed_time": "5 days, 2:52:06", "remaining_time": "1 day, 21:08:15", "throughput": 2726.47, "total_tokens": 1205988000} {"current_steps": 6681, "total_steps": 9134, "loss": 0.7935, "learning_rate": 8.382363561767467e-06, "epoch": 0.7313829059361231, "percentage": 73.14, "elapsed_time": "5 days, 2:53:11", "remaining_time": "1 day, 21:07:08", "throughput": 2726.51, "total_tokens": 1206185792} {"current_steps": 6682, "total_steps": 9134, "loss": 0.9047, "learning_rate": 8.375940466625047e-06, "epoch": 0.7314923780070609, "percentage": 73.16, "elapsed_time": "5 days, 2:54:19", "remaining_time": "1 day, 21:06:03", "throughput": 2726.53, "total_tokens": 1206380448} {"current_steps": 6683, "total_steps": 9134, "loss": 0.7655, "learning_rate": 8.369519338077067e-06, "epoch": 0.7316018500779988, "percentage": 73.17, "elapsed_time": "5 days, 2:55:25", "remaining_time": "1 day, 21:04:56", "throughput": 2726.54, "total_tokens": 1206564800} {"current_steps": 6684, "total_steps": 9134, "loss": 0.7353, "learning_rate": 8.36310017688318e-06, "epoch": 0.7317113221489367, "percentage": 73.18, "elapsed_time": "5 days, 2:56:26", "remaining_time": "1 day, 21:03:48", "throughput": 2726.51, "total_tokens": 1206716448} {"current_steps": 6685, "total_steps": 9134, "loss": 0.9517, "learning_rate": 8.356682983802717e-06, "epoch": 0.7318207942198747, "percentage": 73.19, "elapsed_time": "5 days, 2:57:34", "remaining_time": "1 day, 21:02:43", "throughput": 2726.57, "total_tokens": 1206926560} {"current_steps": 6686, "total_steps": 9134, "loss": 0.7143, "learning_rate": 8.35026775959485e-06, "epoch": 0.7319302662908126, "percentage": 73.2, "elapsed_time": "5 days, 2:58:38", "remaining_time": "1 day, 21:01:36", "throughput": 2726.57, "total_tokens": 1207103296} {"current_steps": 6687, "total_steps": 9134, "loss": 0.8815, "learning_rate": 8.343854505018477e-06, "epoch": 0.7320397383617505, "percentage": 73.21, "elapsed_time": "5 days, 2:59:44", "remaining_time": "1 day, 21:00:29", "throughput": 2726.56, "total_tokens": 1207278912} {"current_steps": 6688, "total_steps": 9134, "loss": 0.8753, "learning_rate": 8.337443220832267e-06, "epoch": 0.7321492104326883, "percentage": 73.22, "elapsed_time": "5 days, 3:00:46", "remaining_time": "1 day, 20:59:22", "throughput": 2726.54, "total_tokens": 1207440864} {"current_steps": 6689, "total_steps": 9134, "loss": 0.7774, "learning_rate": 8.331033907794689e-06, "epoch": 0.7322586825036262, "percentage": 73.23, "elapsed_time": "5 days, 3:01:49", "remaining_time": "1 day, 20:58:14", "throughput": 2726.56, "total_tokens": 1207619168} {"current_steps": 6690, "total_steps": 9134, "loss": 0.9379, "learning_rate": 8.324626566663914e-06, "epoch": 0.7323681545745642, "percentage": 73.24, "elapsed_time": "5 days, 3:02:56", "remaining_time": "1 day, 20:57:08", "throughput": 2726.57, "total_tokens": 1207806880} {"current_steps": 6691, "total_steps": 9134, "loss": 0.8858, "learning_rate": 8.31822119819796e-06, "epoch": 0.7324776266455021, "percentage": 73.25, "elapsed_time": "5 days, 3:04:02", "remaining_time": "1 day, 20:56:02", "throughput": 2726.6, "total_tokens": 1207997952} {"current_steps": 6692, "total_steps": 9134, "loss": 0.7763, "learning_rate": 8.311817803154525e-06, "epoch": 0.73258709871644, "percentage": 73.26, "elapsed_time": "5 days, 3:05:07", "remaining_time": "1 day, 20:54:55", "throughput": 2726.57, "total_tokens": 1208164384} {"current_steps": 6693, "total_steps": 9134, "loss": 0.9212, "learning_rate": 8.305416382291157e-06, "epoch": 0.7326965707873778, "percentage": 73.28, "elapsed_time": "5 days, 3:06:14", "remaining_time": "1 day, 20:53:50", "throughput": 2726.62, "total_tokens": 1208371360} {"current_steps": 6694, "total_steps": 9134, "loss": 0.7534, "learning_rate": 8.299016936365111e-06, "epoch": 0.7328060428583157, "percentage": 73.29, "elapsed_time": "5 days, 3:07:22", "remaining_time": "1 day, 20:52:44", "throughput": 2726.64, "total_tokens": 1208562432} {"current_steps": 6695, "total_steps": 9134, "loss": 0.9269, "learning_rate": 8.292619466133437e-06, "epoch": 0.7329155149292537, "percentage": 73.3, "elapsed_time": "5 days, 3:08:29", "remaining_time": "1 day, 20:51:38", "throughput": 2726.68, "total_tokens": 1208761792} {"current_steps": 6696, "total_steps": 9134, "loss": 0.7216, "learning_rate": 8.286223972352939e-06, "epoch": 0.7330249870001916, "percentage": 73.31, "elapsed_time": "5 days, 3:09:35", "remaining_time": "1 day, 20:50:32", "throughput": 2726.69, "total_tokens": 1208947936} {"current_steps": 6697, "total_steps": 9134, "loss": 1.0054, "learning_rate": 8.279830455780196e-06, "epoch": 0.7331344590711295, "percentage": 73.32, "elapsed_time": "5 days, 3:10:41", "remaining_time": "1 day, 20:49:25", "throughput": 2726.68, "total_tokens": 1209122656} {"current_steps": 6698, "total_steps": 9134, "loss": 0.9168, "learning_rate": 8.273438917171536e-06, "epoch": 0.7332439311420674, "percentage": 73.33, "elapsed_time": "5 days, 3:11:44", "remaining_time": "1 day, 20:48:18", "throughput": 2726.64, "total_tokens": 1209277440} {"current_steps": 6699, "total_steps": 9134, "loss": 0.739, "learning_rate": 8.267049357283088e-06, "epoch": 0.7333534032130052, "percentage": 73.34, "elapsed_time": "5 days, 3:12:50", "remaining_time": "1 day, 20:47:12", "throughput": 2726.63, "total_tokens": 1209453952} {"current_steps": 6700, "total_steps": 9134, "loss": 0.8182, "learning_rate": 8.26066177687071e-06, "epoch": 0.7334628752839432, "percentage": 73.35, "elapsed_time": "5 days, 3:13:56", "remaining_time": "1 day, 20:46:05", "throughput": 2726.66, "total_tokens": 1209643904} {"current_steps": 6701, "total_steps": 9134, "loss": 0.7026, "learning_rate": 8.254276176690045e-06, "epoch": 0.7335723473548811, "percentage": 73.36, "elapsed_time": "5 days, 3:15:01", "remaining_time": "1 day, 20:44:59", "throughput": 2726.65, "total_tokens": 1209818624} {"current_steps": 6702, "total_steps": 9134, "loss": 0.6626, "learning_rate": 8.247892557496495e-06, "epoch": 0.733681819425819, "percentage": 73.37, "elapsed_time": "5 days, 3:16:03", "remaining_time": "1 day, 20:43:51", "throughput": 2726.66, "total_tokens": 1209992224} {"current_steps": 6703, "total_steps": 9134, "loss": 0.959, "learning_rate": 8.241510920045232e-06, "epoch": 0.7337912914967569, "percentage": 73.39, "elapsed_time": "5 days, 3:17:08", "remaining_time": "1 day, 20:42:44", "throughput": 2726.72, "total_tokens": 1210194944} {"current_steps": 6704, "total_steps": 9134, "loss": 0.8675, "learning_rate": 8.235131265091189e-06, "epoch": 0.7339007635676948, "percentage": 73.4, "elapsed_time": "5 days, 3:18:16", "remaining_time": "1 day, 20:41:39", "throughput": 2726.71, "total_tokens": 1210379072} {"current_steps": 6705, "total_steps": 9134, "loss": 0.8466, "learning_rate": 8.22875359338906e-06, "epoch": 0.7340102356386327, "percentage": 73.41, "elapsed_time": "5 days, 3:19:24", "remaining_time": "1 day, 20:40:33", "throughput": 2726.7, "total_tokens": 1210559392} {"current_steps": 6706, "total_steps": 9134, "loss": 0.5915, "learning_rate": 8.222377905693338e-06, "epoch": 0.7341197077095706, "percentage": 73.42, "elapsed_time": "5 days, 3:20:31", "remaining_time": "1 day, 20:39:27", "throughput": 2726.74, "total_tokens": 1210756512} {"current_steps": 6707, "total_steps": 9134, "loss": 1.0757, "learning_rate": 8.21600420275822e-06, "epoch": 0.7342291797805085, "percentage": 73.43, "elapsed_time": "5 days, 3:21:39", "remaining_time": "1 day, 20:38:22", "throughput": 2726.8, "total_tokens": 1210969312} {"current_steps": 6708, "total_steps": 9134, "loss": 0.9046, "learning_rate": 8.209632485337727e-06, "epoch": 0.7343386518514464, "percentage": 73.44, "elapsed_time": "5 days, 3:22:42", "remaining_time": "1 day, 20:37:14", "throughput": 2726.81, "total_tokens": 1211147840} {"current_steps": 6709, "total_steps": 9134, "loss": 0.822, "learning_rate": 8.203262754185611e-06, "epoch": 0.7344481239223843, "percentage": 73.45, "elapsed_time": "5 days, 3:23:48", "remaining_time": "1 day, 20:36:08", "throughput": 2726.89, "total_tokens": 1211362208} {"current_steps": 6710, "total_steps": 9134, "loss": 0.6619, "learning_rate": 8.196895010055403e-06, "epoch": 0.7345575959933222, "percentage": 73.46, "elapsed_time": "5 days, 3:24:55", "remaining_time": "1 day, 20:35:02", "throughput": 2726.89, "total_tokens": 1211544992} {"current_steps": 6711, "total_steps": 9134, "loss": 0.6354, "learning_rate": 8.190529253700393e-06, "epoch": 0.7346670680642601, "percentage": 73.47, "elapsed_time": "5 days, 3:25:56", "remaining_time": "1 day, 20:33:54", "throughput": 2726.89, "total_tokens": 1211710080} {"current_steps": 6712, "total_steps": 9134, "loss": 1.0866, "learning_rate": 8.184165485873633e-06, "epoch": 0.734776540135198, "percentage": 73.48, "elapsed_time": "5 days, 3:27:00", "remaining_time": "1 day, 20:32:47", "throughput": 2726.89, "total_tokens": 1211886368} {"current_steps": 6713, "total_steps": 9134, "loss": 0.8596, "learning_rate": 8.177803707327961e-06, "epoch": 0.7348860122061359, "percentage": 73.49, "elapsed_time": "5 days, 3:28:07", "remaining_time": "1 day, 20:31:41", "throughput": 2726.87, "total_tokens": 1212058848} {"current_steps": 6714, "total_steps": 9134, "loss": 0.8312, "learning_rate": 8.171443918815939e-06, "epoch": 0.7349954842770738, "percentage": 73.51, "elapsed_time": "5 days, 3:29:12", "remaining_time": "1 day, 20:30:35", "throughput": 2726.91, "total_tokens": 1212255744} {"current_steps": 6715, "total_steps": 9134, "loss": 0.7439, "learning_rate": 8.165086121089944e-06, "epoch": 0.7351049563480118, "percentage": 73.52, "elapsed_time": "5 days, 3:30:20", "remaining_time": "1 day, 20:29:29", "throughput": 2726.92, "total_tokens": 1212444352} {"current_steps": 6716, "total_steps": 9134, "loss": 0.8844, "learning_rate": 8.158730314902063e-06, "epoch": 0.7352144284189496, "percentage": 73.53, "elapsed_time": "5 days, 3:31:25", "remaining_time": "1 day, 20:28:22", "throughput": 2726.93, "total_tokens": 1212627136} {"current_steps": 6717, "total_steps": 9134, "loss": 0.8864, "learning_rate": 8.152376501004199e-06, "epoch": 0.7353239004898875, "percentage": 73.54, "elapsed_time": "5 days, 3:32:31", "remaining_time": "1 day, 20:27:16", "throughput": 2726.96, "total_tokens": 1212820896} {"current_steps": 6718, "total_steps": 9134, "loss": 0.8577, "learning_rate": 8.146024680147987e-06, "epoch": 0.7354333725608254, "percentage": 73.55, "elapsed_time": "5 days, 3:33:39", "remaining_time": "1 day, 20:26:10", "throughput": 2726.96, "total_tokens": 1213006368} {"current_steps": 6719, "total_steps": 9134, "loss": 0.9356, "learning_rate": 8.139674853084838e-06, "epoch": 0.7355428446317633, "percentage": 73.56, "elapsed_time": "5 days, 3:34:46", "remaining_time": "1 day, 20:25:04", "throughput": 2726.96, "total_tokens": 1213188480} {"current_steps": 6720, "total_steps": 9134, "loss": 0.857, "learning_rate": 8.13332702056592e-06, "epoch": 0.7356523167027013, "percentage": 73.57, "elapsed_time": "5 days, 3:35:51", "remaining_time": "1 day, 20:23:58", "throughput": 2726.92, "total_tokens": 1213347744} {"current_steps": 6721, "total_steps": 9134, "loss": 0.6646, "learning_rate": 8.126981183342167e-06, "epoch": 0.7357617887736392, "percentage": 73.58, "elapsed_time": "5 days, 3:36:54", "remaining_time": "1 day, 20:22:50", "throughput": 2726.94, "total_tokens": 1213526496} {"current_steps": 6722, "total_steps": 9134, "loss": 1.0344, "learning_rate": 8.120637342164298e-06, "epoch": 0.735871260844577, "percentage": 73.59, "elapsed_time": "5 days, 3:37:59", "remaining_time": "1 day, 20:21:44", "throughput": 2726.97, "total_tokens": 1213721600} {"current_steps": 6723, "total_steps": 9134, "loss": 0.7786, "learning_rate": 8.114295497782748e-06, "epoch": 0.7359807329155149, "percentage": 73.6, "elapsed_time": "5 days, 3:39:05", "remaining_time": "1 day, 20:20:38", "throughput": 2726.98, "total_tokens": 1213906176} {"current_steps": 6724, "total_steps": 9134, "loss": 0.8771, "learning_rate": 8.107955650947777e-06, "epoch": 0.7360902049864528, "percentage": 73.62, "elapsed_time": "5 days, 3:40:07", "remaining_time": "1 day, 20:19:30", "throughput": 2726.98, "total_tokens": 1214069248} {"current_steps": 6725, "total_steps": 9134, "loss": 0.9971, "learning_rate": 8.101617802409343e-06, "epoch": 0.7361996770573908, "percentage": 73.63, "elapsed_time": "5 days, 3:41:14", "remaining_time": "1 day, 20:18:24", "throughput": 2726.95, "total_tokens": 1214238368} {"current_steps": 6726, "total_steps": 9134, "loss": 0.6737, "learning_rate": 8.095281952917227e-06, "epoch": 0.7363091491283287, "percentage": 73.64, "elapsed_time": "5 days, 3:42:15", "remaining_time": "1 day, 20:17:16", "throughput": 2726.89, "total_tokens": 1214379712} {"current_steps": 6727, "total_steps": 9134, "loss": 0.758, "learning_rate": 8.088948103220942e-06, "epoch": 0.7364186211992665, "percentage": 73.65, "elapsed_time": "5 days, 3:43:15", "remaining_time": "1 day, 20:16:07", "throughput": 2726.83, "total_tokens": 1214520384} {"current_steps": 6728, "total_steps": 9134, "loss": 0.9206, "learning_rate": 8.082616254069767e-06, "epoch": 0.7365280932702044, "percentage": 73.66, "elapsed_time": "5 days, 3:44:19", "remaining_time": "1 day, 20:15:00", "throughput": 2726.84, "total_tokens": 1214699136} {"current_steps": 6729, "total_steps": 9134, "loss": 0.8122, "learning_rate": 8.076286406212747e-06, "epoch": 0.7366375653411423, "percentage": 73.67, "elapsed_time": "5 days, 3:45:27", "remaining_time": "1 day, 20:13:55", "throughput": 2726.82, "total_tokens": 1214875648} {"current_steps": 6730, "total_steps": 9134, "loss": 0.8615, "learning_rate": 8.069958560398686e-06, "epoch": 0.7367470374120803, "percentage": 73.68, "elapsed_time": "5 days, 3:46:32", "remaining_time": "1 day, 20:12:48", "throughput": 2726.87, "total_tokens": 1215072544} {"current_steps": 6731, "total_steps": 9134, "loss": 0.7409, "learning_rate": 8.063632717376177e-06, "epoch": 0.7368565094830182, "percentage": 73.69, "elapsed_time": "5 days, 3:47:36", "remaining_time": "1 day, 20:11:41", "throughput": 2726.83, "total_tokens": 1215232032} {"current_steps": 6732, "total_steps": 9134, "loss": 0.7533, "learning_rate": 8.057308877893524e-06, "epoch": 0.7369659815539561, "percentage": 73.7, "elapsed_time": "5 days, 3:48:40", "remaining_time": "1 day, 20:10:34", "throughput": 2726.85, "total_tokens": 1215415040} {"current_steps": 6733, "total_steps": 9134, "loss": 0.5853, "learning_rate": 8.050987042698852e-06, "epoch": 0.7370754536248939, "percentage": 73.71, "elapsed_time": "5 days, 3:49:43", "remaining_time": "1 day, 20:09:27", "throughput": 2726.87, "total_tokens": 1215594016} {"current_steps": 6734, "total_steps": 9134, "loss": 0.7491, "learning_rate": 8.04466721254001e-06, "epoch": 0.7371849256958318, "percentage": 73.72, "elapsed_time": "5 days, 3:50:50", "remaining_time": "1 day, 20:08:21", "throughput": 2726.9, "total_tokens": 1215788000} {"current_steps": 6735, "total_steps": 9134, "loss": 0.8814, "learning_rate": 8.038349388164627e-06, "epoch": 0.7372943977667697, "percentage": 73.74, "elapsed_time": "5 days, 3:51:53", "remaining_time": "1 day, 20:07:13", "throughput": 2726.9, "total_tokens": 1215961600} {"current_steps": 6736, "total_steps": 9134, "loss": 0.8221, "learning_rate": 8.032033570320083e-06, "epoch": 0.7374038698377077, "percentage": 73.75, "elapsed_time": "5 days, 3:52:55", "remaining_time": "1 day, 20:06:06", "throughput": 2726.83, "total_tokens": 1216098688} {"current_steps": 6737, "total_steps": 9134, "loss": 0.66, "learning_rate": 8.025719759753531e-06, "epoch": 0.7375133419086456, "percentage": 73.76, "elapsed_time": "5 days, 3:54:00", "remaining_time": "1 day, 20:04:59", "throughput": 2726.83, "total_tokens": 1216277216} {"current_steps": 6738, "total_steps": 9134, "loss": 1.0393, "learning_rate": 8.019407957211883e-06, "epoch": 0.7376228139795835, "percentage": 73.77, "elapsed_time": "5 days, 3:55:08", "remaining_time": "1 day, 20:03:53", "throughput": 2726.83, "total_tokens": 1216462688} {"current_steps": 6739, "total_steps": 9134, "loss": 0.9223, "learning_rate": 8.013098163441813e-06, "epoch": 0.7377322860505213, "percentage": 73.78, "elapsed_time": "5 days, 3:56:12", "remaining_time": "1 day, 20:02:47", "throughput": 2726.87, "total_tokens": 1216653984} {"current_steps": 6740, "total_steps": 9134, "loss": 1.2815, "learning_rate": 8.006790379189746e-06, "epoch": 0.7378417581214592, "percentage": 73.79, "elapsed_time": "5 days, 3:57:21", "remaining_time": "1 day, 20:01:41", "throughput": 2726.92, "total_tokens": 1216865440} {"current_steps": 6741, "total_steps": 9134, "loss": 1.0093, "learning_rate": 8.000484605201902e-06, "epoch": 0.7379512301923972, "percentage": 73.8, "elapsed_time": "5 days, 3:58:29", "remaining_time": "1 day, 20:00:36", "throughput": 2726.96, "total_tokens": 1217068160} {"current_steps": 6742, "total_steps": 9134, "loss": 0.9698, "learning_rate": 7.99418084222423e-06, "epoch": 0.7380607022633351, "percentage": 73.81, "elapsed_time": "5 days, 3:59:32", "remaining_time": "1 day, 19:59:28", "throughput": 2726.91, "total_tokens": 1217218912} {"current_steps": 6743, "total_steps": 9134, "loss": 0.7231, "learning_rate": 7.987879091002456e-06, "epoch": 0.738170174334273, "percentage": 73.82, "elapsed_time": "5 days, 4:00:35", "remaining_time": "1 day, 19:58:21", "throughput": 2726.9, "total_tokens": 1217382656} {"current_steps": 6744, "total_steps": 9134, "loss": 0.7381, "learning_rate": 7.981579352282064e-06, "epoch": 0.7382796464052108, "percentage": 73.83, "elapsed_time": "5 days, 4:01:41", "remaining_time": "1 day, 19:57:15", "throughput": 2726.86, "total_tokens": 1217549312} {"current_steps": 6745, "total_steps": 9134, "loss": 0.7621, "learning_rate": 7.9752816268083e-06, "epoch": 0.7383891184761487, "percentage": 73.84, "elapsed_time": "5 days, 4:02:47", "remaining_time": "1 day, 19:56:08", "throughput": 2726.89, "total_tokens": 1217738144} {"current_steps": 6746, "total_steps": 9134, "loss": 0.978, "learning_rate": 7.968985915326175e-06, "epoch": 0.7384985905470867, "percentage": 73.86, "elapsed_time": "5 days, 4:03:55", "remaining_time": "1 day, 19:55:03", "throughput": 2726.91, "total_tokens": 1217935936} {"current_steps": 6747, "total_steps": 9134, "loss": 0.8273, "learning_rate": 7.962692218580451e-06, "epoch": 0.7386080626180246, "percentage": 73.87, "elapsed_time": "5 days, 4:05:03", "remaining_time": "1 day, 19:53:57", "throughput": 2726.91, "total_tokens": 1218120064} {"current_steps": 6748, "total_steps": 9134, "loss": 1.0233, "learning_rate": 7.956400537315681e-06, "epoch": 0.7387175346889625, "percentage": 73.88, "elapsed_time": "5 days, 4:06:07", "remaining_time": "1 day, 19:52:50", "throughput": 2726.87, "total_tokens": 1218276864} {"current_steps": 6749, "total_steps": 9134, "loss": 0.6925, "learning_rate": 7.950110872276131e-06, "epoch": 0.7388270067599004, "percentage": 73.89, "elapsed_time": "5 days, 4:07:14", "remaining_time": "1 day, 19:51:45", "throughput": 2726.84, "total_tokens": 1218446880} {"current_steps": 6750, "total_steps": 9134, "loss": 0.7661, "learning_rate": 7.943823224205879e-06, "epoch": 0.7389364788308382, "percentage": 73.9, "elapsed_time": "5 days, 4:08:20", "remaining_time": "1 day, 19:50:38", "throughput": 2726.81, "total_tokens": 1218612192} {"current_steps": 6751, "total_steps": 9134, "loss": 0.9334, "learning_rate": 7.937537593848734e-06, "epoch": 0.7390459509017762, "percentage": 73.91, "elapsed_time": "5 days, 4:09:28", "remaining_time": "1 day, 19:49:33", "throughput": 2726.84, "total_tokens": 1218814240} {"current_steps": 6752, "total_steps": 9134, "loss": 0.6535, "learning_rate": 7.931253981948275e-06, "epoch": 0.7391554229727141, "percentage": 73.92, "elapsed_time": "5 days, 4:10:32", "remaining_time": "1 day, 19:48:26", "throughput": 2726.87, "total_tokens": 1218999264} {"current_steps": 6753, "total_steps": 9134, "loss": 0.6463, "learning_rate": 7.924972389247836e-06, "epoch": 0.739264895043652, "percentage": 73.93, "elapsed_time": "5 days, 4:11:35", "remaining_time": "1 day, 19:47:18", "throughput": 2726.85, "total_tokens": 1219163904} {"current_steps": 6754, "total_steps": 9134, "loss": 1.0891, "learning_rate": 7.918692816490517e-06, "epoch": 0.7393743671145899, "percentage": 73.94, "elapsed_time": "5 days, 4:12:43", "remaining_time": "1 day, 19:46:13", "throughput": 2726.87, "total_tokens": 1219355424} {"current_steps": 6755, "total_steps": 9134, "loss": 0.8389, "learning_rate": 7.912415264419198e-06, "epoch": 0.7394838391855278, "percentage": 73.95, "elapsed_time": "5 days, 4:13:52", "remaining_time": "1 day, 19:45:07", "throughput": 2726.91, "total_tokens": 1219561056} {"current_steps": 6756, "total_steps": 9134, "loss": 0.7436, "learning_rate": 7.906139733776474e-06, "epoch": 0.7395933112564657, "percentage": 73.97, "elapsed_time": "5 days, 4:14:55", "remaining_time": "1 day, 19:44:00", "throughput": 2726.9, "total_tokens": 1219731520} {"current_steps": 6757, "total_steps": 9134, "loss": 0.9019, "learning_rate": 7.899866225304756e-06, "epoch": 0.7397027833274036, "percentage": 73.98, "elapsed_time": "5 days, 4:16:01", "remaining_time": "1 day, 19:42:54", "throughput": 2726.91, "total_tokens": 1219912736} {"current_steps": 6758, "total_steps": 9134, "loss": 0.6783, "learning_rate": 7.893594739746157e-06, "epoch": 0.7398122553983415, "percentage": 73.99, "elapsed_time": "5 days, 4:17:09", "remaining_time": "1 day, 19:41:48", "throughput": 2726.95, "total_tokens": 1220117024} {"current_steps": 6759, "total_steps": 9134, "loss": 0.7174, "learning_rate": 7.887325277842605e-06, "epoch": 0.7399217274692794, "percentage": 74.0, "elapsed_time": "5 days, 4:18:14", "remaining_time": "1 day, 19:40:42", "throughput": 2726.94, "total_tokens": 1220292416} {"current_steps": 6760, "total_steps": 9134, "loss": 0.9755, "learning_rate": 7.881057840335762e-06, "epoch": 0.7400311995402173, "percentage": 74.01, "elapsed_time": "5 days, 4:19:22", "remaining_time": "1 day, 19:39:36", "throughput": 2727.02, "total_tokens": 1220511264} {"current_steps": 6761, "total_steps": 9134, "loss": 0.6291, "learning_rate": 7.874792427967048e-06, "epoch": 0.7401406716111552, "percentage": 74.02, "elapsed_time": "5 days, 4:20:29", "remaining_time": "1 day, 19:38:30", "throughput": 2727.06, "total_tokens": 1220711296} {"current_steps": 6762, "total_steps": 9134, "loss": 0.8917, "learning_rate": 7.868529041477654e-06, "epoch": 0.7402501436820931, "percentage": 74.03, "elapsed_time": "5 days, 4:21:36", "remaining_time": "1 day, 19:37:24", "throughput": 2727.04, "total_tokens": 1220884896} {"current_steps": 6763, "total_steps": 9134, "loss": 0.7946, "learning_rate": 7.862267681608514e-06, "epoch": 0.740359615753031, "percentage": 74.04, "elapsed_time": "5 days, 4:22:40", "remaining_time": "1 day, 19:36:17", "throughput": 2727.01, "total_tokens": 1221047520} {"current_steps": 6764, "total_steps": 9134, "loss": 0.8309, "learning_rate": 7.856008349100366e-06, "epoch": 0.7404690878239689, "percentage": 74.05, "elapsed_time": "5 days, 4:23:46", "remaining_time": "1 day, 19:35:11", "throughput": 2727.03, "total_tokens": 1221237696} {"current_steps": 6765, "total_steps": 9134, "loss": 0.8358, "learning_rate": 7.849751044693637e-06, "epoch": 0.7405785598949068, "percentage": 74.06, "elapsed_time": "5 days, 4:24:54", "remaining_time": "1 day, 19:34:05", "throughput": 2727.05, "total_tokens": 1221433024} {"current_steps": 6766, "total_steps": 9134, "loss": 0.73, "learning_rate": 7.843495769128584e-06, "epoch": 0.7406880319658448, "percentage": 74.07, "elapsed_time": "5 days, 4:25:58", "remaining_time": "1 day, 19:32:58", "throughput": 2727.07, "total_tokens": 1221616256} {"current_steps": 6767, "total_steps": 9134, "loss": 0.8665, "learning_rate": 7.83724252314518e-06, "epoch": 0.7407975040367826, "percentage": 74.09, "elapsed_time": "5 days, 4:27:06", "remaining_time": "1 day, 19:31:53", "throughput": 2727.13, "total_tokens": 1221827712} {"current_steps": 6768, "total_steps": 9134, "loss": 1.1668, "learning_rate": 7.830991307483179e-06, "epoch": 0.7409069761077205, "percentage": 74.1, "elapsed_time": "5 days, 4:28:09", "remaining_time": "1 day, 19:30:46", "throughput": 2727.12, "total_tokens": 1221996608} {"current_steps": 6769, "total_steps": 9134, "loss": 0.73, "learning_rate": 7.824742122882083e-06, "epoch": 0.7410164481786584, "percentage": 74.11, "elapsed_time": "5 days, 4:29:13", "remaining_time": "1 day, 19:29:39", "throughput": 2727.12, "total_tokens": 1222167744} {"current_steps": 6770, "total_steps": 9134, "loss": 0.8455, "learning_rate": 7.818494970081161e-06, "epoch": 0.7411259202495963, "percentage": 74.12, "elapsed_time": "5 days, 4:30:16", "remaining_time": "1 day, 19:28:31", "throughput": 2727.11, "total_tokens": 1222335072} {"current_steps": 6771, "total_steps": 9134, "loss": 0.6304, "learning_rate": 7.812249849819439e-06, "epoch": 0.7412353923205343, "percentage": 74.13, "elapsed_time": "5 days, 4:31:23", "remaining_time": "1 day, 19:27:25", "throughput": 2727.11, "total_tokens": 1222520544} {"current_steps": 6772, "total_steps": 9134, "loss": 0.7753, "learning_rate": 7.806006762835696e-06, "epoch": 0.7413448643914722, "percentage": 74.14, "elapsed_time": "5 days, 4:32:30", "remaining_time": "1 day, 19:26:19", "throughput": 2727.1, "total_tokens": 1222695040} {"current_steps": 6773, "total_steps": 9134, "loss": 0.9039, "learning_rate": 7.79976570986849e-06, "epoch": 0.74145433646241, "percentage": 74.15, "elapsed_time": "5 days, 4:33:38", "remaining_time": "1 day, 19:25:14", "throughput": 2727.08, "total_tokens": 1222873568} {"current_steps": 6774, "total_steps": 9134, "loss": 0.8444, "learning_rate": 7.793526691656117e-06, "epoch": 0.7415638085333479, "percentage": 74.16, "elapsed_time": "5 days, 4:34:46", "remaining_time": "1 day, 19:24:08", "throughput": 2727.1, "total_tokens": 1223068896} {"current_steps": 6775, "total_steps": 9134, "loss": 0.7585, "learning_rate": 7.787289708936645e-06, "epoch": 0.7416732806042858, "percentage": 74.17, "elapsed_time": "5 days, 4:35:53", "remaining_time": "1 day, 19:23:02", "throughput": 2727.15, "total_tokens": 1223273184} {"current_steps": 6776, "total_steps": 9134, "loss": 0.7415, "learning_rate": 7.781054762447898e-06, "epoch": 0.7417827526752238, "percentage": 74.18, "elapsed_time": "5 days, 4:36:57", "remaining_time": "1 day, 19:21:55", "throughput": 2727.19, "total_tokens": 1223463584} {"current_steps": 6777, "total_steps": 9134, "loss": 0.8687, "learning_rate": 7.774821852927453e-06, "epoch": 0.7418922247461617, "percentage": 74.2, "elapsed_time": "5 days, 4:38:04", "remaining_time": "1 day, 19:20:49", "throughput": 2727.22, "total_tokens": 1223660032} {"current_steps": 6778, "total_steps": 9134, "loss": 0.7623, "learning_rate": 7.768590981112654e-06, "epoch": 0.7420016968170995, "percentage": 74.21, "elapsed_time": "5 days, 4:39:12", "remaining_time": "1 day, 19:19:44", "throughput": 2727.25, "total_tokens": 1223858496} {"current_steps": 6779, "total_steps": 9134, "loss": 0.8207, "learning_rate": 7.762362147740601e-06, "epoch": 0.7421111688880374, "percentage": 74.22, "elapsed_time": "5 days, 4:40:15", "remaining_time": "1 day, 19:18:36", "throughput": 2727.22, "total_tokens": 1224017088} {"current_steps": 6780, "total_steps": 9134, "loss": 0.6315, "learning_rate": 7.756135353548145e-06, "epoch": 0.7422206409589753, "percentage": 74.23, "elapsed_time": "5 days, 4:41:23", "remaining_time": "1 day, 19:17:31", "throughput": 2727.24, "total_tokens": 1224211296} {"current_steps": 6781, "total_steps": 9134, "loss": 0.7878, "learning_rate": 7.749910599271928e-06, "epoch": 0.7423301130299133, "percentage": 74.24, "elapsed_time": "5 days, 4:42:29", "remaining_time": "1 day, 19:16:24", "throughput": 2727.24, "total_tokens": 1224394080} {"current_steps": 6782, "total_steps": 9134, "loss": 0.7693, "learning_rate": 7.743687885648293e-06, "epoch": 0.7424395851008512, "percentage": 74.25, "elapsed_time": "5 days, 4:43:30", "remaining_time": "1 day, 19:15:17", "throughput": 2727.2, "total_tokens": 1224540800} {"current_steps": 6783, "total_steps": 9134, "loss": 0.9423, "learning_rate": 7.737467213413405e-06, "epoch": 0.7425490571717891, "percentage": 74.26, "elapsed_time": "5 days, 4:44:38", "remaining_time": "1 day, 19:14:11", "throughput": 2727.19, "total_tokens": 1224720224} {"current_steps": 6784, "total_steps": 9134, "loss": 0.8774, "learning_rate": 7.731248583303142e-06, "epoch": 0.7426585292427269, "percentage": 74.27, "elapsed_time": "5 days, 4:45:42", "remaining_time": "1 day, 19:13:04", "throughput": 2727.17, "total_tokens": 1224890016} {"current_steps": 6785, "total_steps": 9134, "loss": 1.0115, "learning_rate": 7.725031996053159e-06, "epoch": 0.7427680013136648, "percentage": 74.28, "elapsed_time": "5 days, 4:46:49", "remaining_time": "1 day, 19:11:58", "throughput": 2727.19, "total_tokens": 1225078848} {"current_steps": 6786, "total_steps": 9134, "loss": 0.8412, "learning_rate": 7.718817452398869e-06, "epoch": 0.7428774733846027, "percentage": 74.29, "elapsed_time": "5 days, 4:47:55", "remaining_time": "1 day, 19:10:52", "throughput": 2727.22, "total_tokens": 1225271936} {"current_steps": 6787, "total_steps": 9134, "loss": 0.9265, "learning_rate": 7.712604953075428e-06, "epoch": 0.7429869454555407, "percentage": 74.3, "elapsed_time": "5 days, 4:49:03", "remaining_time": "1 day, 19:09:46", "throughput": 2727.22, "total_tokens": 1225457632} {"current_steps": 6788, "total_steps": 9134, "loss": 0.621, "learning_rate": 7.70639449881779e-06, "epoch": 0.7430964175264786, "percentage": 74.32, "elapsed_time": "5 days, 4:50:06", "remaining_time": "1 day, 19:08:39", "throughput": 2727.2, "total_tokens": 1225619360} {"current_steps": 6789, "total_steps": 9134, "loss": 0.8448, "learning_rate": 7.700186090360609e-06, "epoch": 0.7432058895974165, "percentage": 74.33, "elapsed_time": "5 days, 4:51:07", "remaining_time": "1 day, 19:07:31", "throughput": 2727.17, "total_tokens": 1225774144} {"current_steps": 6790, "total_steps": 9134, "loss": 0.997, "learning_rate": 7.693979728438355e-06, "epoch": 0.7433153616683543, "percentage": 74.34, "elapsed_time": "5 days, 4:52:12", "remaining_time": "1 day, 19:06:24", "throughput": 2727.19, "total_tokens": 1225961184} {"current_steps": 6791, "total_steps": 9134, "loss": 0.6648, "learning_rate": 7.687775413785201e-06, "epoch": 0.7434248337392922, "percentage": 74.35, "elapsed_time": "5 days, 4:53:14", "remaining_time": "1 day, 19:05:16", "throughput": 2727.19, "total_tokens": 1226130304} {"current_steps": 6792, "total_steps": 9134, "loss": 0.8546, "learning_rate": 7.681573147135126e-06, "epoch": 0.7435343058102302, "percentage": 74.36, "elapsed_time": "5 days, 4:54:21", "remaining_time": "1 day, 19:04:11", "throughput": 2727.2, "total_tokens": 1226317792} {"current_steps": 6793, "total_steps": 9134, "loss": 1.0252, "learning_rate": 7.675372929221844e-06, "epoch": 0.7436437778811681, "percentage": 74.37, "elapsed_time": "5 days, 4:55:24", "remaining_time": "1 day, 19:03:03", "throughput": 2727.19, "total_tokens": 1226485568} {"current_steps": 6794, "total_steps": 9134, "loss": 0.6643, "learning_rate": 7.669174760778825e-06, "epoch": 0.743753249952106, "percentage": 74.38, "elapsed_time": "5 days, 4:56:30", "remaining_time": "1 day, 19:01:57", "throughput": 2727.19, "total_tokens": 1226661408} {"current_steps": 6795, "total_steps": 9134, "loss": 0.6442, "learning_rate": 7.662978642539298e-06, "epoch": 0.7438627220230438, "percentage": 74.39, "elapsed_time": "5 days, 4:57:35", "remaining_time": "1 day, 19:00:50", "throughput": 2727.21, "total_tokens": 1226851584} {"current_steps": 6796, "total_steps": 9134, "loss": 0.7448, "learning_rate": 7.65678457523625e-06, "epoch": 0.7439721940939817, "percentage": 74.4, "elapsed_time": "5 days, 4:58:39", "remaining_time": "1 day, 18:59:44", "throughput": 2727.24, "total_tokens": 1227038400} {"current_steps": 6797, "total_steps": 9134, "loss": 0.6665, "learning_rate": 7.650592559602446e-06, "epoch": 0.7440816661649197, "percentage": 74.41, "elapsed_time": "5 days, 4:59:40", "remaining_time": "1 day, 18:58:35", "throughput": 2727.22, "total_tokens": 1227194528} {"current_steps": 6798, "total_steps": 9134, "loss": 1.1128, "learning_rate": 7.644402596370361e-06, "epoch": 0.7441911382358576, "percentage": 74.43, "elapsed_time": "5 days, 5:00:47", "remaining_time": "1 day, 18:57:30", "throughput": 2727.22, "total_tokens": 1227379104} {"current_steps": 6799, "total_steps": 9134, "loss": 0.6007, "learning_rate": 7.638214686272285e-06, "epoch": 0.7443006103067955, "percentage": 74.44, "elapsed_time": "5 days, 5:01:48", "remaining_time": "1 day, 18:56:22", "throughput": 2727.19, "total_tokens": 1227529856} {"current_steps": 6800, "total_steps": 9134, "loss": 0.8588, "learning_rate": 7.632028830040208e-06, "epoch": 0.7444100823777334, "percentage": 74.45, "elapsed_time": "5 days, 5:02:54", "remaining_time": "1 day, 18:55:15", "throughput": 2727.22, "total_tokens": 1227724512} {"current_steps": 6801, "total_steps": 9134, "loss": 0.8388, "learning_rate": 7.6258450284059255e-06, "epoch": 0.7445195544486712, "percentage": 74.46, "elapsed_time": "5 days, 5:03:57", "remaining_time": "1 day, 18:54:08", "throughput": 2727.21, "total_tokens": 1227891168} {"current_steps": 6802, "total_steps": 9134, "loss": 0.6731, "learning_rate": 7.619663282100961e-06, "epoch": 0.7446290265196092, "percentage": 74.47, "elapsed_time": "5 days, 5:05:03", "remaining_time": "1 day, 18:53:02", "throughput": 2727.2, "total_tokens": 1228069696} {"current_steps": 6803, "total_steps": 9134, "loss": 0.8809, "learning_rate": 7.613483591856605e-06, "epoch": 0.7447384985905471, "percentage": 74.48, "elapsed_time": "5 days, 5:06:08", "remaining_time": "1 day, 18:51:55", "throughput": 2727.23, "total_tokens": 1228255840} {"current_steps": 6804, "total_steps": 9134, "loss": 0.7567, "learning_rate": 7.607305958403904e-06, "epoch": 0.744847970661485, "percentage": 74.49, "elapsed_time": "5 days, 5:07:13", "remaining_time": "1 day, 18:50:49", "throughput": 2727.27, "total_tokens": 1228453408} {"current_steps": 6805, "total_steps": 9134, "loss": 0.8681, "learning_rate": 7.601130382473651e-06, "epoch": 0.7449574427324229, "percentage": 74.5, "elapsed_time": "5 days, 5:08:19", "remaining_time": "1 day, 18:49:42", "throughput": 2727.28, "total_tokens": 1228635296} {"current_steps": 6806, "total_steps": 9134, "loss": 0.8736, "learning_rate": 7.5949568647964265e-06, "epoch": 0.7450669148033608, "percentage": 74.51, "elapsed_time": "5 days, 5:09:27", "remaining_time": "1 day, 18:48:37", "throughput": 2727.31, "total_tokens": 1228836224} {"current_steps": 6807, "total_steps": 9134, "loss": 0.8627, "learning_rate": 7.58878540610252e-06, "epoch": 0.7451763868742987, "percentage": 74.52, "elapsed_time": "5 days, 5:10:34", "remaining_time": "1 day, 18:47:31", "throughput": 2727.35, "total_tokens": 1229037152} {"current_steps": 6808, "total_steps": 9134, "loss": 0.7538, "learning_rate": 7.58261600712202e-06, "epoch": 0.7452858589452366, "percentage": 74.53, "elapsed_time": "5 days, 5:11:42", "remaining_time": "1 day, 18:46:25", "throughput": 2727.34, "total_tokens": 1229217248} {"current_steps": 6809, "total_steps": 9134, "loss": 0.6557, "learning_rate": 7.576448668584752e-06, "epoch": 0.7453953310161745, "percentage": 74.55, "elapsed_time": "5 days, 5:12:47", "remaining_time": "1 day, 18:45:18", "throughput": 2727.36, "total_tokens": 1229405184} {"current_steps": 6810, "total_steps": 9134, "loss": 0.8186, "learning_rate": 7.570283391220295e-06, "epoch": 0.7455048030871124, "percentage": 74.56, "elapsed_time": "5 days, 5:13:55", "remaining_time": "1 day, 18:44:13", "throughput": 2727.4, "total_tokens": 1229609920} {"current_steps": 6811, "total_steps": 9134, "loss": 0.7368, "learning_rate": 7.564120175757996e-06, "epoch": 0.7456142751580503, "percentage": 74.57, "elapsed_time": "5 days, 5:14:58", "remaining_time": "1 day, 18:43:06", "throughput": 2727.38, "total_tokens": 1229770528} {"current_steps": 6812, "total_steps": 9134, "loss": 0.883, "learning_rate": 7.557959022926947e-06, "epoch": 0.7457237472289882, "percentage": 74.58, "elapsed_time": "5 days, 5:16:02", "remaining_time": "1 day, 18:41:59", "throughput": 2727.38, "total_tokens": 1229946368} {"current_steps": 6813, "total_steps": 9134, "loss": 0.8674, "learning_rate": 7.551799933456003e-06, "epoch": 0.7458332192999261, "percentage": 74.59, "elapsed_time": "5 days, 5:17:09", "remaining_time": "1 day, 18:40:53", "throughput": 2727.42, "total_tokens": 1230145728} {"current_steps": 6814, "total_steps": 9134, "loss": 0.7522, "learning_rate": 7.5456429080737635e-06, "epoch": 0.745942691370864, "percentage": 74.6, "elapsed_time": "5 days, 5:18:15", "remaining_time": "1 day, 18:39:46", "throughput": 2727.41, "total_tokens": 1230323136} {"current_steps": 6815, "total_steps": 9134, "loss": 0.5962, "learning_rate": 7.5394879475086085e-06, "epoch": 0.7460521634418019, "percentage": 74.61, "elapsed_time": "5 days, 5:19:17", "remaining_time": "1 day, 18:38:39", "throughput": 2727.38, "total_tokens": 1230479040} {"current_steps": 6816, "total_steps": 9134, "loss": 0.6823, "learning_rate": 7.533335052488652e-06, "epoch": 0.7461616355127398, "percentage": 74.62, "elapsed_time": "5 days, 5:20:22", "remaining_time": "1 day, 18:37:32", "throughput": 2727.38, "total_tokens": 1230657344} {"current_steps": 6817, "total_steps": 9134, "loss": 0.5537, "learning_rate": 7.527184223741765e-06, "epoch": 0.7462711075836778, "percentage": 74.63, "elapsed_time": "5 days, 5:21:27", "remaining_time": "1 day, 18:36:26", "throughput": 2727.37, "total_tokens": 1230829152} {"current_steps": 6818, "total_steps": 9134, "loss": 0.8846, "learning_rate": 7.521035461995585e-06, "epoch": 0.7463805796546156, "percentage": 74.64, "elapsed_time": "5 days, 5:22:26", "remaining_time": "1 day, 18:35:17", "throughput": 2727.34, "total_tokens": 1230977440} {"current_steps": 6819, "total_steps": 9134, "loss": 0.9078, "learning_rate": 7.514888767977493e-06, "epoch": 0.7464900517255535, "percentage": 74.66, "elapsed_time": "5 days, 5:23:31", "remaining_time": "1 day, 18:34:11", "throughput": 2727.34, "total_tokens": 1231151712} {"current_steps": 6820, "total_steps": 9134, "loss": 0.6792, "learning_rate": 7.508744142414629e-06, "epoch": 0.7465995237964914, "percentage": 74.67, "elapsed_time": "5 days, 5:24:33", "remaining_time": "1 day, 18:33:03", "throughput": 2727.32, "total_tokens": 1231312768} {"current_steps": 6821, "total_steps": 9134, "loss": 0.701, "learning_rate": 7.502601586033908e-06, "epoch": 0.7467089958674293, "percentage": 74.68, "elapsed_time": "5 days, 5:25:39", "remaining_time": "1 day, 18:31:57", "throughput": 2727.33, "total_tokens": 1231495776} {"current_steps": 6822, "total_steps": 9134, "loss": 0.9869, "learning_rate": 7.496461099561958e-06, "epoch": 0.7468184679383673, "percentage": 74.69, "elapsed_time": "5 days, 5:26:40", "remaining_time": "1 day, 18:30:49", "throughput": 2727.33, "total_tokens": 1231663104} {"current_steps": 6823, "total_steps": 9134, "loss": 0.8417, "learning_rate": 7.490322683725204e-06, "epoch": 0.7469279400093052, "percentage": 74.7, "elapsed_time": "5 days, 5:27:47", "remaining_time": "1 day, 18:29:42", "throughput": 2727.35, "total_tokens": 1231853952} {"current_steps": 6824, "total_steps": 9134, "loss": 0.9362, "learning_rate": 7.484186339249804e-06, "epoch": 0.747037412080243, "percentage": 74.71, "elapsed_time": "5 days, 5:28:52", "remaining_time": "1 day, 18:28:36", "throughput": 2727.35, "total_tokens": 1232032480} {"current_steps": 6825, "total_steps": 9134, "loss": 0.8023, "learning_rate": 7.4780520668616765e-06, "epoch": 0.7471468841511809, "percentage": 74.72, "elapsed_time": "5 days, 5:29:57", "remaining_time": "1 day, 18:27:29", "throughput": 2727.36, "total_tokens": 1232213920} {"current_steps": 6826, "total_steps": 9134, "loss": 0.7166, "learning_rate": 7.471919867286492e-06, "epoch": 0.7472563562221188, "percentage": 74.73, "elapsed_time": "5 days, 5:31:05", "remaining_time": "1 day, 18:26:24", "throughput": 2727.36, "total_tokens": 1232398272} {"current_steps": 6827, "total_steps": 9134, "loss": 0.8036, "learning_rate": 7.465789741249671e-06, "epoch": 0.7473658282930568, "percentage": 74.74, "elapsed_time": "5 days, 5:32:09", "remaining_time": "1 day, 18:25:17", "throughput": 2727.37, "total_tokens": 1232577920} {"current_steps": 6828, "total_steps": 9134, "loss": 0.8175, "learning_rate": 7.4596616894764215e-06, "epoch": 0.7474753003639947, "percentage": 74.75, "elapsed_time": "5 days, 5:33:13", "remaining_time": "1 day, 18:24:10", "throughput": 2727.35, "total_tokens": 1232743680} {"current_steps": 6829, "total_steps": 9134, "loss": 0.8717, "learning_rate": 7.4535357126916446e-06, "epoch": 0.7475847724349325, "percentage": 74.76, "elapsed_time": "5 days, 5:34:21", "remaining_time": "1 day, 18:23:04", "throughput": 2727.34, "total_tokens": 1232926688} {"current_steps": 6830, "total_steps": 9134, "loss": 0.6184, "learning_rate": 7.447411811620067e-06, "epoch": 0.7476942445058704, "percentage": 74.78, "elapsed_time": "5 days, 5:35:27", "remaining_time": "1 day, 18:21:58", "throughput": 2727.35, "total_tokens": 1233110368} {"current_steps": 6831, "total_steps": 9134, "loss": 0.6001, "learning_rate": 7.441289986986102e-06, "epoch": 0.7478037165768083, "percentage": 74.79, "elapsed_time": "5 days, 5:36:29", "remaining_time": "1 day, 18:20:50", "throughput": 2727.31, "total_tokens": 1233260896} {"current_steps": 6832, "total_steps": 9134, "loss": 0.8753, "learning_rate": 7.43517023951398e-06, "epoch": 0.7479131886477463, "percentage": 74.8, "elapsed_time": "5 days, 5:37:37", "remaining_time": "1 day, 18:19:45", "throughput": 2727.34, "total_tokens": 1233459808} {"current_steps": 6833, "total_steps": 9134, "loss": 1.1509, "learning_rate": 7.429052569927625e-06, "epoch": 0.7480226607186842, "percentage": 74.81, "elapsed_time": "5 days, 5:38:45", "remaining_time": "1 day, 18:18:39", "throughput": 2727.42, "total_tokens": 1233681120} {"current_steps": 6834, "total_steps": 9134, "loss": 0.9619, "learning_rate": 7.4229369789507706e-06, "epoch": 0.7481321327896221, "percentage": 74.82, "elapsed_time": "5 days, 5:39:48", "remaining_time": "1 day, 18:17:32", "throughput": 2727.46, "total_tokens": 1233870624} {"current_steps": 6835, "total_steps": 9134, "loss": 1.0941, "learning_rate": 7.416823467306866e-06, "epoch": 0.7482416048605599, "percentage": 74.83, "elapsed_time": "5 days, 5:40:56", "remaining_time": "1 day, 18:16:26", "throughput": 2727.5, "total_tokens": 1234074912} {"current_steps": 6836, "total_steps": 9134, "loss": 0.9603, "learning_rate": 7.410712035719133e-06, "epoch": 0.7483510769314978, "percentage": 74.84, "elapsed_time": "5 days, 5:42:02", "remaining_time": "1 day, 18:15:20", "throughput": 2727.54, "total_tokens": 1234270464} {"current_steps": 6837, "total_steps": 9134, "loss": 1.1083, "learning_rate": 7.4046026849105445e-06, "epoch": 0.7484605490024357, "percentage": 74.85, "elapsed_time": "5 days, 5:43:09", "remaining_time": "1 day, 18:14:14", "throughput": 2727.55, "total_tokens": 1234458624} {"current_steps": 6838, "total_steps": 9134, "loss": 0.8416, "learning_rate": 7.3984954156038095e-06, "epoch": 0.7485700210733737, "percentage": 74.86, "elapsed_time": "5 days, 5:44:10", "remaining_time": "1 day, 18:13:06", "throughput": 2727.55, "total_tokens": 1234628416} {"current_steps": 6839, "total_steps": 9134, "loss": 0.6634, "learning_rate": 7.392390228521437e-06, "epoch": 0.7486794931443116, "percentage": 74.87, "elapsed_time": "5 days, 5:45:12", "remaining_time": "1 day, 18:11:59", "throughput": 2727.54, "total_tokens": 1234793504} {"current_steps": 6840, "total_steps": 9134, "loss": 0.8972, "learning_rate": 7.386287124385624e-06, "epoch": 0.7487889652152495, "percentage": 74.89, "elapsed_time": "5 days, 5:46:18", "remaining_time": "1 day, 18:10:52", "throughput": 2727.53, "total_tokens": 1234967104} {"current_steps": 6841, "total_steps": 9134, "loss": 0.8314, "learning_rate": 7.3801861039183796e-06, "epoch": 0.7488984372861873, "percentage": 74.9, "elapsed_time": "5 days, 5:47:25", "remaining_time": "1 day, 18:09:47", "throughput": 2727.55, "total_tokens": 1235159520} {"current_steps": 6842, "total_steps": 9134, "loss": 0.9452, "learning_rate": 7.374087167841437e-06, "epoch": 0.7490079093571252, "percentage": 74.91, "elapsed_time": "5 days, 5:48:30", "remaining_time": "1 day, 18:08:40", "throughput": 2727.56, "total_tokens": 1235341856} {"current_steps": 6843, "total_steps": 9134, "loss": 0.8712, "learning_rate": 7.367990316876286e-06, "epoch": 0.7491173814280632, "percentage": 74.92, "elapsed_time": "5 days, 5:49:32", "remaining_time": "1 day, 18:07:32", "throughput": 2727.54, "total_tokens": 1235501120} {"current_steps": 6844, "total_steps": 9134, "loss": 0.6424, "learning_rate": 7.361895551744175e-06, "epoch": 0.7492268534990011, "percentage": 74.93, "elapsed_time": "5 days, 5:50:40", "remaining_time": "1 day, 18:06:27", "throughput": 2727.6, "total_tokens": 1235711456} {"current_steps": 6845, "total_steps": 9134, "loss": 1.0514, "learning_rate": 7.355802873166101e-06, "epoch": 0.749336325569939, "percentage": 74.94, "elapsed_time": "5 days, 5:51:46", "remaining_time": "1 day, 18:05:20", "throughput": 2727.62, "total_tokens": 1235903648} {"current_steps": 6846, "total_steps": 9134, "loss": 1.1335, "learning_rate": 7.349712281862817e-06, "epoch": 0.7494457976408768, "percentage": 74.95, "elapsed_time": "5 days, 5:52:54", "remaining_time": "1 day, 18:04:15", "throughput": 2727.66, "total_tokens": 1236106144} {"current_steps": 6847, "total_steps": 9134, "loss": 0.6468, "learning_rate": 7.34362377855482e-06, "epoch": 0.7495552697118147, "percentage": 74.96, "elapsed_time": "5 days, 5:53:59", "remaining_time": "1 day, 18:03:08", "throughput": 2727.64, "total_tokens": 1236276160} {"current_steps": 6848, "total_steps": 9134, "loss": 0.7023, "learning_rate": 7.3375373639623876e-06, "epoch": 0.7496647417827527, "percentage": 74.97, "elapsed_time": "5 days, 5:54:58", "remaining_time": "1 day, 18:02:00", "throughput": 2727.64, "total_tokens": 1236434304} {"current_steps": 6849, "total_steps": 9134, "loss": 0.5547, "learning_rate": 7.331453038805517e-06, "epoch": 0.7497742138536906, "percentage": 74.98, "elapsed_time": "5 days, 5:56:02", "remaining_time": "1 day, 18:00:53", "throughput": 2727.65, "total_tokens": 1236612160} {"current_steps": 6850, "total_steps": 9134, "loss": 0.8195, "learning_rate": 7.325370803803977e-06, "epoch": 0.7498836859246285, "percentage": 74.99, "elapsed_time": "5 days, 5:57:09", "remaining_time": "1 day, 17:59:47", "throughput": 2727.62, "total_tokens": 1236782624} {"current_steps": 6851, "total_steps": 9134, "loss": 0.7762, "learning_rate": 7.319290659677283e-06, "epoch": 0.7499931579955664, "percentage": 75.01, "elapsed_time": "5 days, 5:58:15", "remaining_time": "1 day, 17:58:41", "throughput": 2727.64, "total_tokens": 1236971904} {"current_steps": 6852, "total_steps": 9134, "loss": 0.7099, "learning_rate": 7.313212607144704e-06, "epoch": 0.7501026300665042, "percentage": 75.02, "elapsed_time": "5 days, 5:59:21", "remaining_time": "1 day, 17:57:34", "throughput": 2727.61, "total_tokens": 1237136992} {"current_steps": 6853, "total_steps": 9134, "loss": 0.7497, "learning_rate": 7.307136646925261e-06, "epoch": 0.7502121021374422, "percentage": 75.03, "elapsed_time": "5 days, 6:00:26", "remaining_time": "1 day, 17:56:28", "throughput": 2727.61, "total_tokens": 1237317760} {"current_steps": 6854, "total_steps": 9134, "loss": 0.6882, "learning_rate": 7.30106277973773e-06, "epoch": 0.7503215742083801, "percentage": 75.04, "elapsed_time": "5 days, 6:01:34", "remaining_time": "1 day, 17:55:22", "throughput": 2727.61, "total_tokens": 1237500992} {"current_steps": 6855, "total_steps": 9134, "loss": 0.6981, "learning_rate": 7.294991006300631e-06, "epoch": 0.750431046279318, "percentage": 75.05, "elapsed_time": "5 days, 6:02:38", "remaining_time": "1 day, 17:54:15", "throughput": 2727.6, "total_tokens": 1237671008} {"current_steps": 6856, "total_steps": 9134, "loss": 0.7309, "learning_rate": 7.288921327332254e-06, "epoch": 0.7505405183502559, "percentage": 75.06, "elapsed_time": "5 days, 6:03:42", "remaining_time": "1 day, 17:53:08", "throughput": 2727.62, "total_tokens": 1237856032} {"current_steps": 6857, "total_steps": 9134, "loss": 0.6799, "learning_rate": 7.28285374355063e-06, "epoch": 0.7506499904211938, "percentage": 75.07, "elapsed_time": "5 days, 6:04:48", "remaining_time": "1 day, 17:52:02", "throughput": 2727.64, "total_tokens": 1238044864} {"current_steps": 6858, "total_steps": 9134, "loss": 0.9884, "learning_rate": 7.276788255673539e-06, "epoch": 0.7507594624921317, "percentage": 75.08, "elapsed_time": "5 days, 6:05:56", "remaining_time": "1 day, 17:50:56", "throughput": 2727.63, "total_tokens": 1238226528} {"current_steps": 6859, "total_steps": 9134, "loss": 0.7491, "learning_rate": 7.270724864418513e-06, "epoch": 0.7508689345630696, "percentage": 75.09, "elapsed_time": "5 days, 6:07:01", "remaining_time": "1 day, 17:49:50", "throughput": 2727.69, "total_tokens": 1238429024} {"current_steps": 6860, "total_steps": 9134, "loss": 1.0001, "learning_rate": 7.264663570502844e-06, "epoch": 0.7509784066340075, "percentage": 75.1, "elapsed_time": "5 days, 6:08:08", "remaining_time": "1 day, 17:48:44", "throughput": 2727.76, "total_tokens": 1238642720} {"current_steps": 6861, "total_steps": 9134, "loss": 1.0472, "learning_rate": 7.258604374643571e-06, "epoch": 0.7510878787049454, "percentage": 75.11, "elapsed_time": "5 days, 6:09:14", "remaining_time": "1 day, 17:47:38", "throughput": 2727.75, "total_tokens": 1238817664} {"current_steps": 6862, "total_steps": 9134, "loss": 0.8808, "learning_rate": 7.252547277557478e-06, "epoch": 0.7511973507758833, "percentage": 75.13, "elapsed_time": "5 days, 6:10:17", "remaining_time": "1 day, 17:46:30", "throughput": 2727.74, "total_tokens": 1238987904} {"current_steps": 6863, "total_steps": 9134, "loss": 0.6106, "learning_rate": 7.246492279961129e-06, "epoch": 0.7513068228468212, "percentage": 75.14, "elapsed_time": "5 days, 6:11:21", "remaining_time": "1 day, 17:45:23", "throughput": 2727.74, "total_tokens": 1239161280} {"current_steps": 6864, "total_steps": 9134, "loss": 0.7211, "learning_rate": 7.24043938257079e-06, "epoch": 0.7514162949177591, "percentage": 75.15, "elapsed_time": "5 days, 6:12:28", "remaining_time": "1 day, 17:44:18", "throughput": 2727.77, "total_tokens": 1239359520} {"current_steps": 6865, "total_steps": 9134, "loss": 0.7162, "learning_rate": 7.234388586102528e-06, "epoch": 0.751525766988697, "percentage": 75.16, "elapsed_time": "5 days, 6:13:29", "remaining_time": "1 day, 17:43:10", "throughput": 2727.74, "total_tokens": 1239512960} {"current_steps": 6866, "total_steps": 9134, "loss": 0.9926, "learning_rate": 7.228339891272135e-06, "epoch": 0.7516352390596349, "percentage": 75.17, "elapsed_time": "5 days, 6:14:38", "remaining_time": "1 day, 17:42:04", "throughput": 2727.77, "total_tokens": 1239712992} {"current_steps": 6867, "total_steps": 9134, "loss": 0.8644, "learning_rate": 7.222293298795158e-06, "epoch": 0.7517447111305728, "percentage": 75.18, "elapsed_time": "5 days, 6:15:38", "remaining_time": "1 day, 17:40:56", "throughput": 2727.75, "total_tokens": 1239866208} {"current_steps": 6868, "total_steps": 9134, "loss": 1.0343, "learning_rate": 7.216248809386899e-06, "epoch": 0.7518541832015108, "percentage": 75.19, "elapsed_time": "5 days, 6:16:46", "remaining_time": "1 day, 17:39:50", "throughput": 2727.77, "total_tokens": 1240059968} {"current_steps": 6869, "total_steps": 9134, "loss": 0.7215, "learning_rate": 7.210206423762403e-06, "epoch": 0.7519636552724486, "percentage": 75.2, "elapsed_time": "5 days, 6:17:52", "remaining_time": "1 day, 17:38:44", "throughput": 2727.81, "total_tokens": 1240262016} {"current_steps": 6870, "total_steps": 9134, "loss": 0.8203, "learning_rate": 7.2041661426364925e-06, "epoch": 0.7520731273433865, "percentage": 75.21, "elapsed_time": "5 days, 6:18:57", "remaining_time": "1 day, 17:37:38", "throughput": 2727.85, "total_tokens": 1240452640} {"current_steps": 6871, "total_steps": 9134, "loss": 0.8787, "learning_rate": 7.198127966723692e-06, "epoch": 0.7521825994143244, "percentage": 75.22, "elapsed_time": "5 days, 6:20:03", "remaining_time": "1 day, 17:36:31", "throughput": 2727.87, "total_tokens": 1240643040} {"current_steps": 6872, "total_steps": 9134, "loss": 0.7175, "learning_rate": 7.192091896738337e-06, "epoch": 0.7522920714852623, "percentage": 75.24, "elapsed_time": "5 days, 6:21:09", "remaining_time": "1 day, 17:35:25", "throughput": 2727.92, "total_tokens": 1240845760} {"current_steps": 6873, "total_steps": 9134, "loss": 0.9158, "learning_rate": 7.1860579333944525e-06, "epoch": 0.7524015435562003, "percentage": 75.25, "elapsed_time": "5 days, 6:22:13", "remaining_time": "1 day, 17:34:18", "throughput": 2727.92, "total_tokens": 1241020032} {"current_steps": 6874, "total_steps": 9134, "loss": 0.738, "learning_rate": 7.180026077405877e-06, "epoch": 0.7525110156271382, "percentage": 75.26, "elapsed_time": "5 days, 6:23:16", "remaining_time": "1 day, 17:33:11", "throughput": 2727.94, "total_tokens": 1241201920} {"current_steps": 6875, "total_steps": 9134, "loss": 0.9236, "learning_rate": 7.1739963294861325e-06, "epoch": 0.752620487698076, "percentage": 75.27, "elapsed_time": "5 days, 6:24:24", "remaining_time": "1 day, 17:32:05", "throughput": 2727.99, "total_tokens": 1241411584} {"current_steps": 6876, "total_steps": 9134, "loss": 0.8722, "learning_rate": 7.167968690348554e-06, "epoch": 0.7527299597690139, "percentage": 75.28, "elapsed_time": "5 days, 6:25:32", "remaining_time": "1 day, 17:31:00", "throughput": 2728.0, "total_tokens": 1241601536} {"current_steps": 6877, "total_steps": 9134, "loss": 0.8053, "learning_rate": 7.161943160706189e-06, "epoch": 0.7528394318399518, "percentage": 75.29, "elapsed_time": "5 days, 6:26:39", "remaining_time": "1 day, 17:29:54", "throughput": 2728.01, "total_tokens": 1241787232} {"current_steps": 6878, "total_steps": 9134, "loss": 0.9984, "learning_rate": 7.155919741271849e-06, "epoch": 0.7529489039108898, "percentage": 75.3, "elapsed_time": "5 days, 6:27:42", "remaining_time": "1 day, 17:28:47", "throughput": 2728.0, "total_tokens": 1241959040} {"current_steps": 6879, "total_steps": 9134, "loss": 0.6845, "learning_rate": 7.149898432758093e-06, "epoch": 0.7530583759818277, "percentage": 75.31, "elapsed_time": "5 days, 6:28:49", "remaining_time": "1 day, 17:27:41", "throughput": 2728.02, "total_tokens": 1242146304} {"current_steps": 6880, "total_steps": 9134, "loss": 0.7861, "learning_rate": 7.143879235877218e-06, "epoch": 0.7531678480527655, "percentage": 75.32, "elapsed_time": "5 days, 6:29:53", "remaining_time": "1 day, 17:26:34", "throughput": 2728.06, "total_tokens": 1242342976} {"current_steps": 6881, "total_steps": 9134, "loss": 0.7791, "learning_rate": 7.13786215134131e-06, "epoch": 0.7532773201237034, "percentage": 75.33, "elapsed_time": "5 days, 6:30:56", "remaining_time": "1 day, 17:25:27", "throughput": 2728.09, "total_tokens": 1242525536} {"current_steps": 6882, "total_steps": 9134, "loss": 1.0009, "learning_rate": 7.131847179862148e-06, "epoch": 0.7533867921946413, "percentage": 75.34, "elapsed_time": "5 days, 6:32:03", "remaining_time": "1 day, 17:24:21", "throughput": 2728.09, "total_tokens": 1242710784} {"current_steps": 6883, "total_steps": 9134, "loss": 0.8608, "learning_rate": 7.125834322151315e-06, "epoch": 0.7534962642655793, "percentage": 75.36, "elapsed_time": "5 days, 6:33:11", "remaining_time": "1 day, 17:23:15", "throughput": 2728.14, "total_tokens": 1242918208} {"current_steps": 6884, "total_steps": 9134, "loss": 0.7602, "learning_rate": 7.119823578920112e-06, "epoch": 0.7536057363365172, "percentage": 75.37, "elapsed_time": "5 days, 6:34:16", "remaining_time": "1 day, 17:22:08", "throughput": 2728.17, "total_tokens": 1243107936} {"current_steps": 6885, "total_steps": 9134, "loss": 0.7868, "learning_rate": 7.113814950879596e-06, "epoch": 0.7537152084074551, "percentage": 75.38, "elapsed_time": "5 days, 6:35:20", "remaining_time": "1 day, 17:21:02", "throughput": 2728.15, "total_tokens": 1243276384} {"current_steps": 6886, "total_steps": 9134, "loss": 0.7359, "learning_rate": 7.1078084387405815e-06, "epoch": 0.7538246804783929, "percentage": 75.39, "elapsed_time": "5 days, 6:36:21", "remaining_time": "1 day, 17:19:54", "throughput": 2728.15, "total_tokens": 1243439456} {"current_steps": 6887, "total_steps": 9134, "loss": 0.7925, "learning_rate": 7.101804043213625e-06, "epoch": 0.7539341525493308, "percentage": 75.4, "elapsed_time": "5 days, 6:37:29", "remaining_time": "1 day, 17:18:48", "throughput": 2728.19, "total_tokens": 1243644416} {"current_steps": 6888, "total_steps": 9134, "loss": 0.8946, "learning_rate": 7.0958017650090245e-06, "epoch": 0.7540436246202687, "percentage": 75.41, "elapsed_time": "5 days, 6:38:35", "remaining_time": "1 day, 17:17:42", "throughput": 2728.16, "total_tokens": 1243808160} {"current_steps": 6889, "total_steps": 9134, "loss": 0.8432, "learning_rate": 7.089801604836857e-06, "epoch": 0.7541530966912067, "percentage": 75.42, "elapsed_time": "5 days, 6:39:40", "remaining_time": "1 day, 17:16:35", "throughput": 2728.17, "total_tokens": 1243992288} {"current_steps": 6890, "total_steps": 9134, "loss": 0.709, "learning_rate": 7.083803563406924e-06, "epoch": 0.7542625687621446, "percentage": 75.43, "elapsed_time": "5 days, 6:40:48", "remaining_time": "1 day, 17:15:30", "throughput": 2728.25, "total_tokens": 1244214720} {"current_steps": 6891, "total_steps": 9134, "loss": 0.8934, "learning_rate": 7.077807641428777e-06, "epoch": 0.7543720408330825, "percentage": 75.44, "elapsed_time": "5 days, 6:41:49", "remaining_time": "1 day, 17:14:22", "throughput": 2728.24, "total_tokens": 1244378016} {"current_steps": 6892, "total_steps": 9134, "loss": 0.7872, "learning_rate": 7.071813839611724e-06, "epoch": 0.7544815129040203, "percentage": 75.45, "elapsed_time": "5 days, 6:42:56", "remaining_time": "1 day, 17:13:16", "throughput": 2728.25, "total_tokens": 1244565504} {"current_steps": 6893, "total_steps": 9134, "loss": 0.8506, "learning_rate": 7.0658221586648195e-06, "epoch": 0.7545909849749582, "percentage": 75.47, "elapsed_time": "5 days, 6:44:00", "remaining_time": "1 day, 17:12:09", "throughput": 2728.28, "total_tokens": 1244752320} {"current_steps": 6894, "total_steps": 9134, "loss": 0.7866, "learning_rate": 7.059832599296873e-06, "epoch": 0.7547004570458962, "percentage": 75.48, "elapsed_time": "5 days, 6:45:02", "remaining_time": "1 day, 17:11:02", "throughput": 2728.25, "total_tokens": 1244909120} {"current_steps": 6895, "total_steps": 9134, "loss": 0.6671, "learning_rate": 7.053845162216424e-06, "epoch": 0.7548099291168341, "percentage": 75.49, "elapsed_time": "5 days, 6:46:07", "remaining_time": "1 day, 17:09:55", "throughput": 2728.25, "total_tokens": 1245084736} {"current_steps": 6896, "total_steps": 9134, "loss": 0.8998, "learning_rate": 7.047859848131802e-06, "epoch": 0.754919401187772, "percentage": 75.5, "elapsed_time": "5 days, 6:47:14", "remaining_time": "1 day, 17:08:49", "throughput": 2728.26, "total_tokens": 1245269984} {"current_steps": 6897, "total_steps": 9134, "loss": 0.7954, "learning_rate": 7.041876657751023e-06, "epoch": 0.7550288732587098, "percentage": 75.51, "elapsed_time": "5 days, 6:48:15", "remaining_time": "1 day, 17:07:41", "throughput": 2728.2, "total_tokens": 1245409760} {"current_steps": 6898, "total_steps": 9134, "loss": 1.0313, "learning_rate": 7.035895591781916e-06, "epoch": 0.7551383453296477, "percentage": 75.52, "elapsed_time": "5 days, 6:49:22", "remaining_time": "1 day, 17:06:35", "throughput": 2728.22, "total_tokens": 1245605984} {"current_steps": 6899, "total_steps": 9134, "loss": 0.7462, "learning_rate": 7.0299166509320194e-06, "epoch": 0.7552478174005857, "percentage": 75.53, "elapsed_time": "5 days, 6:50:26", "remaining_time": "1 day, 17:05:28", "throughput": 2728.21, "total_tokens": 1245775328} {"current_steps": 6900, "total_steps": 9134, "loss": 0.7666, "learning_rate": 7.023939835908627e-06, "epoch": 0.7553572894715236, "percentage": 75.54, "elapsed_time": "5 days, 6:51:24", "remaining_time": "1 day, 17:04:19", "throughput": 2728.17, "total_tokens": 1245912192} {"current_steps": 6901, "total_steps": 9134, "loss": 0.8747, "learning_rate": 7.0179651474187895e-06, "epoch": 0.7554667615424615, "percentage": 75.55, "elapsed_time": "5 days, 6:52:32", "remaining_time": "1 day, 17:03:14", "throughput": 2728.2, "total_tokens": 1246109984} {"current_steps": 6902, "total_steps": 9134, "loss": 0.6244, "learning_rate": 7.011992586169291e-06, "epoch": 0.7555762336133994, "percentage": 75.56, "elapsed_time": "5 days, 6:53:35", "remaining_time": "1 day, 17:02:06", "throughput": 2728.19, "total_tokens": 1246277536} {"current_steps": 6903, "total_steps": 9134, "loss": 0.7359, "learning_rate": 7.006022152866698e-06, "epoch": 0.7556857056843372, "percentage": 75.57, "elapsed_time": "5 days, 6:54:40", "remaining_time": "1 day, 17:01:00", "throughput": 2728.2, "total_tokens": 1246459424} {"current_steps": 6904, "total_steps": 9134, "loss": 0.9037, "learning_rate": 7.000053848217272e-06, "epoch": 0.7557951777552752, "percentage": 75.59, "elapsed_time": "5 days, 6:55:44", "remaining_time": "1 day, 16:59:53", "throughput": 2728.24, "total_tokens": 1246654528} {"current_steps": 6905, "total_steps": 9134, "loss": 0.7057, "learning_rate": 6.99408767292708e-06, "epoch": 0.7559046498262131, "percentage": 75.6, "elapsed_time": "5 days, 6:56:51", "remaining_time": "1 day, 16:58:47", "throughput": 2728.23, "total_tokens": 1246832384} {"current_steps": 6906, "total_steps": 9134, "loss": 0.6909, "learning_rate": 6.988123627701879e-06, "epoch": 0.756014121897151, "percentage": 75.61, "elapsed_time": "5 days, 6:57:58", "remaining_time": "1 day, 16:57:41", "throughput": 2728.21, "total_tokens": 1247007104} {"current_steps": 6907, "total_steps": 9134, "loss": 0.708, "learning_rate": 6.982161713247226e-06, "epoch": 0.7561235939680889, "percentage": 75.62, "elapsed_time": "5 days, 6:58:58", "remaining_time": "1 day, 16:56:33", "throughput": 2728.18, "total_tokens": 1247153152} {"current_steps": 6908, "total_steps": 9134, "loss": 0.7185, "learning_rate": 6.9762019302684e-06, "epoch": 0.7562330660390268, "percentage": 75.63, "elapsed_time": "5 days, 6:59:59", "remaining_time": "1 day, 16:55:25", "throughput": 2728.15, "total_tokens": 1247310400} {"current_steps": 6909, "total_steps": 9134, "loss": 0.7195, "learning_rate": 6.970244279470431e-06, "epoch": 0.7563425381099647, "percentage": 75.64, "elapsed_time": "5 days, 7:01:05", "remaining_time": "1 day, 16:54:19", "throughput": 2728.16, "total_tokens": 1247493184} {"current_steps": 6910, "total_steps": 9134, "loss": 0.8429, "learning_rate": 6.964288761558094e-06, "epoch": 0.7564520101809026, "percentage": 75.65, "elapsed_time": "5 days, 7:02:10", "remaining_time": "1 day, 16:53:12", "throughput": 2728.15, "total_tokens": 1247666336} {"current_steps": 6911, "total_steps": 9134, "loss": 0.7443, "learning_rate": 6.958335377235911e-06, "epoch": 0.7565614822518405, "percentage": 75.66, "elapsed_time": "5 days, 7:03:14", "remaining_time": "1 day, 16:52:06", "throughput": 2728.1, "total_tokens": 1247817312} {"current_steps": 6912, "total_steps": 9134, "loss": 0.7569, "learning_rate": 6.952384127208181e-06, "epoch": 0.7566709543227784, "percentage": 75.67, "elapsed_time": "5 days, 7:04:20", "remaining_time": "1 day, 16:50:59", "throughput": 2728.16, "total_tokens": 1248025408} {"current_steps": 6913, "total_steps": 9134, "loss": 1.1645, "learning_rate": 6.94643501217889e-06, "epoch": 0.7567804263937163, "percentage": 75.68, "elapsed_time": "5 days, 7:05:27", "remaining_time": "1 day, 16:49:53", "throughput": 2728.2, "total_tokens": 1248225216} {"current_steps": 6914, "total_steps": 9134, "loss": 0.8654, "learning_rate": 6.940488032851839e-06, "epoch": 0.7568898984646542, "percentage": 75.7, "elapsed_time": "5 days, 7:06:30", "remaining_time": "1 day, 16:48:46", "throughput": 2728.18, "total_tokens": 1248390976} {"current_steps": 6915, "total_steps": 9134, "loss": 0.9939, "learning_rate": 6.934543189930515e-06, "epoch": 0.7569993705355921, "percentage": 75.71, "elapsed_time": "5 days, 7:07:34", "remaining_time": "1 day, 16:47:39", "throughput": 2728.17, "total_tokens": 1248560992} {"current_steps": 6916, "total_steps": 9134, "loss": 1.0641, "learning_rate": 6.928600484118206e-06, "epoch": 0.75710884260653, "percentage": 75.72, "elapsed_time": "5 days, 7:08:40", "remaining_time": "1 day, 16:46:33", "throughput": 2728.15, "total_tokens": 1248731232} {"current_steps": 6917, "total_steps": 9134, "loss": 0.7616, "learning_rate": 6.92265991611791e-06, "epoch": 0.7572183146774679, "percentage": 75.73, "elapsed_time": "5 days, 7:09:44", "remaining_time": "1 day, 16:45:26", "throughput": 2728.15, "total_tokens": 1248906400} {"current_steps": 6918, "total_steps": 9134, "loss": 0.826, "learning_rate": 6.916721486632391e-06, "epoch": 0.7573277867484058, "percentage": 75.74, "elapsed_time": "5 days, 7:10:46", "remaining_time": "1 day, 16:44:19", "throughput": 2728.15, "total_tokens": 1249075072} {"current_steps": 6919, "total_steps": 9134, "loss": 0.8093, "learning_rate": 6.9107851963641505e-06, "epoch": 0.7574372588193438, "percentage": 75.75, "elapsed_time": "5 days, 7:11:49", "remaining_time": "1 day, 16:43:11", "throughput": 2728.14, "total_tokens": 1249240384} {"current_steps": 6920, "total_steps": 9134, "loss": 0.6396, "learning_rate": 6.9048510460154315e-06, "epoch": 0.7575467308902816, "percentage": 75.76, "elapsed_time": "5 days, 7:12:54", "remaining_time": "1 day, 16:42:05", "throughput": 2728.15, "total_tokens": 1249422944} {"current_steps": 6921, "total_steps": 9134, "loss": 1.0675, "learning_rate": 6.8989190362882565e-06, "epoch": 0.7576562029612195, "percentage": 75.77, "elapsed_time": "5 days, 7:13:57", "remaining_time": "1 day, 16:40:58", "throughput": 2728.2, "total_tokens": 1249618496} {"current_steps": 6922, "total_steps": 9134, "loss": 0.603, "learning_rate": 6.892989167884342e-06, "epoch": 0.7577656750321574, "percentage": 75.78, "elapsed_time": "5 days, 7:15:05", "remaining_time": "1 day, 16:39:52", "throughput": 2728.2, "total_tokens": 1249805088} {"current_steps": 6923, "total_steps": 9134, "loss": 0.8421, "learning_rate": 6.887061441505202e-06, "epoch": 0.7578751471030953, "percentage": 75.79, "elapsed_time": "5 days, 7:16:10", "remaining_time": "1 day, 16:38:46", "throughput": 2728.25, "total_tokens": 1250003776} {"current_steps": 6924, "total_steps": 9134, "loss": 0.6441, "learning_rate": 6.881135857852067e-06, "epoch": 0.7579846191740333, "percentage": 75.8, "elapsed_time": "5 days, 7:17:13", "remaining_time": "1 day, 16:37:38", "throughput": 2728.25, "total_tokens": 1250176928} {"current_steps": 6925, "total_steps": 9134, "loss": 0.9146, "learning_rate": 6.87521241762592e-06, "epoch": 0.7580940912449712, "percentage": 75.82, "elapsed_time": "5 days, 7:18:22", "remaining_time": "1 day, 16:36:33", "throughput": 2728.26, "total_tokens": 1250367776} {"current_steps": 6926, "total_steps": 9134, "loss": 0.8882, "learning_rate": 6.869291121527499e-06, "epoch": 0.758203563315909, "percentage": 75.83, "elapsed_time": "5 days, 7:19:22", "remaining_time": "1 day, 16:35:25", "throughput": 2728.23, "total_tokens": 1250518976} {"current_steps": 6927, "total_steps": 9134, "loss": 0.9045, "learning_rate": 6.863371970257276e-06, "epoch": 0.7583130353868469, "percentage": 75.84, "elapsed_time": "5 days, 7:20:30", "remaining_time": "1 day, 16:34:19", "throughput": 2728.28, "total_tokens": 1250728640} {"current_steps": 6928, "total_steps": 9134, "loss": 0.6783, "learning_rate": 6.857454964515481e-06, "epoch": 0.7584225074577848, "percentage": 75.85, "elapsed_time": "5 days, 7:21:36", "remaining_time": "1 day, 16:33:13", "throughput": 2728.31, "total_tokens": 1250921952} {"current_steps": 6929, "total_steps": 9134, "loss": 0.9814, "learning_rate": 6.851540105002077e-06, "epoch": 0.7585319795287228, "percentage": 75.86, "elapsed_time": "5 days, 7:22:43", "remaining_time": "1 day, 16:32:07", "throughput": 2728.35, "total_tokens": 1251121088} {"current_steps": 6930, "total_steps": 9134, "loss": 0.745, "learning_rate": 6.845627392416779e-06, "epoch": 0.7586414515996607, "percentage": 75.87, "elapsed_time": "5 days, 7:23:45", "remaining_time": "1 day, 16:31:00", "throughput": 2728.35, "total_tokens": 1251289984} {"current_steps": 6931, "total_steps": 9134, "loss": 1.0792, "learning_rate": 6.839716827459064e-06, "epoch": 0.7587509236705985, "percentage": 75.88, "elapsed_time": "5 days, 7:24:52", "remaining_time": "1 day, 16:29:54", "throughput": 2728.34, "total_tokens": 1251471872} {"current_steps": 6932, "total_steps": 9134, "loss": 0.7691, "learning_rate": 6.83380841082813e-06, "epoch": 0.7588603957415364, "percentage": 75.89, "elapsed_time": "5 days, 7:25:58", "remaining_time": "1 day, 16:28:47", "throughput": 2728.34, "total_tokens": 1251646592} {"current_steps": 6933, "total_steps": 9134, "loss": 0.9978, "learning_rate": 6.827902143222933e-06, "epoch": 0.7589698678124743, "percentage": 75.9, "elapsed_time": "5 days, 7:27:06", "remaining_time": "1 day, 16:27:42", "throughput": 2728.38, "total_tokens": 1251850208} {"current_steps": 6934, "total_steps": 9134, "loss": 0.7411, "learning_rate": 6.821998025342172e-06, "epoch": 0.7590793398834123, "percentage": 75.91, "elapsed_time": "5 days, 7:28:07", "remaining_time": "1 day, 16:26:34", "throughput": 2728.37, "total_tokens": 1252013280} {"current_steps": 6935, "total_steps": 9134, "loss": 0.8251, "learning_rate": 6.816096057884297e-06, "epoch": 0.7591888119543502, "percentage": 75.93, "elapsed_time": "5 days, 7:29:12", "remaining_time": "1 day, 16:25:27", "throughput": 2728.38, "total_tokens": 1252196512} {"current_steps": 6936, "total_steps": 9134, "loss": 0.9841, "learning_rate": 6.810196241547495e-06, "epoch": 0.7592982840252881, "percentage": 75.94, "elapsed_time": "5 days, 7:30:14", "remaining_time": "1 day, 16:24:20", "throughput": 2728.31, "total_tokens": 1252335392} {"current_steps": 6937, "total_steps": 9134, "loss": 0.8199, "learning_rate": 6.804298577029697e-06, "epoch": 0.7594077560962259, "percentage": 75.95, "elapsed_time": "5 days, 7:31:22", "remaining_time": "1 day, 16:23:14", "throughput": 2728.33, "total_tokens": 1252529376} {"current_steps": 6938, "total_steps": 9134, "loss": 0.8666, "learning_rate": 6.798403065028611e-06, "epoch": 0.7595172281671638, "percentage": 75.96, "elapsed_time": "5 days, 7:32:26", "remaining_time": "1 day, 16:22:08", "throughput": 2728.39, "total_tokens": 1252733440} {"current_steps": 6939, "total_steps": 9134, "loss": 1.1484, "learning_rate": 6.792509706241629e-06, "epoch": 0.7596267002381017, "percentage": 75.97, "elapsed_time": "5 days, 7:33:32", "remaining_time": "1 day, 16:21:01", "throughput": 2728.45, "total_tokens": 1252940416} {"current_steps": 6940, "total_steps": 9134, "loss": 1.1212, "learning_rate": 6.786618501365949e-06, "epoch": 0.7597361723090397, "percentage": 75.98, "elapsed_time": "5 days, 7:34:38", "remaining_time": "1 day, 16:19:55", "throughput": 2728.48, "total_tokens": 1253130368} {"current_steps": 6941, "total_steps": 9134, "loss": 0.8732, "learning_rate": 6.780729451098483e-06, "epoch": 0.7598456443799776, "percentage": 75.99, "elapsed_time": "5 days, 7:35:45", "remaining_time": "1 day, 16:18:49", "throughput": 2728.53, "total_tokens": 1253337568} {"current_steps": 6942, "total_steps": 9134, "loss": 0.9424, "learning_rate": 6.7748425561358934e-06, "epoch": 0.7599551164509155, "percentage": 76.0, "elapsed_time": "5 days, 7:36:51", "remaining_time": "1 day, 16:17:43", "throughput": 2728.55, "total_tokens": 1253526624} {"current_steps": 6943, "total_steps": 9134, "loss": 0.9154, "learning_rate": 6.76895781717459e-06, "epoch": 0.7600645885218533, "percentage": 76.01, "elapsed_time": "5 days, 7:37:55", "remaining_time": "1 day, 16:16:36", "throughput": 2728.57, "total_tokens": 1253709632} {"current_steps": 6944, "total_steps": 9134, "loss": 0.8865, "learning_rate": 6.763075234910715e-06, "epoch": 0.7601740605927912, "percentage": 76.02, "elapsed_time": "5 days, 7:39:02", "remaining_time": "1 day, 16:15:30", "throughput": 2728.61, "total_tokens": 1253914144} {"current_steps": 6945, "total_steps": 9134, "loss": 0.9831, "learning_rate": 6.757194810040193e-06, "epoch": 0.7602835326637292, "percentage": 76.03, "elapsed_time": "5 days, 7:40:07", "remaining_time": "1 day, 16:14:24", "throughput": 2728.62, "total_tokens": 1254094464} {"current_steps": 6946, "total_steps": 9134, "loss": 0.8722, "learning_rate": 6.751316543258637e-06, "epoch": 0.7603930047346671, "percentage": 76.05, "elapsed_time": "5 days, 7:41:15", "remaining_time": "1 day, 16:13:18", "throughput": 2728.63, "total_tokens": 1254283744} {"current_steps": 6947, "total_steps": 9134, "loss": 0.9107, "learning_rate": 6.745440435261463e-06, "epoch": 0.760502476805605, "percentage": 76.06, "elapsed_time": "5 days, 7:42:23", "remaining_time": "1 day, 16:12:12", "throughput": 2728.7, "total_tokens": 1254500128} {"current_steps": 6948, "total_steps": 9134, "loss": 0.8474, "learning_rate": 6.739566486743773e-06, "epoch": 0.7606119488765428, "percentage": 76.07, "elapsed_time": "5 days, 7:43:28", "remaining_time": "1 day, 16:11:06", "throughput": 2728.71, "total_tokens": 1254681792} {"current_steps": 6949, "total_steps": 9134, "loss": 0.8152, "learning_rate": 6.733694698400467e-06, "epoch": 0.7607214209474807, "percentage": 76.08, "elapsed_time": "5 days, 7:44:32", "remaining_time": "1 day, 16:09:59", "throughput": 2728.7, "total_tokens": 1254854944} {"current_steps": 6950, "total_steps": 9134, "loss": 0.7308, "learning_rate": 6.727825070926158e-06, "epoch": 0.7608308930184187, "percentage": 76.09, "elapsed_time": "5 days, 7:45:39", "remaining_time": "1 day, 16:08:53", "throughput": 2728.7, "total_tokens": 1255035040} {"current_steps": 6951, "total_steps": 9134, "loss": 0.9711, "learning_rate": 6.721957605015214e-06, "epoch": 0.7609403650893566, "percentage": 76.1, "elapsed_time": "5 days, 7:46:44", "remaining_time": "1 day, 16:07:46", "throughput": 2728.69, "total_tokens": 1255208864} {"current_steps": 6952, "total_steps": 9134, "loss": 0.808, "learning_rate": 6.716092301361743e-06, "epoch": 0.7610498371602945, "percentage": 76.11, "elapsed_time": "5 days, 7:47:49", "remaining_time": "1 day, 16:06:40", "throughput": 2728.7, "total_tokens": 1255393664} {"current_steps": 6953, "total_steps": 9134, "loss": 0.969, "learning_rate": 6.710229160659593e-06, "epoch": 0.7611593092312324, "percentage": 76.12, "elapsed_time": "5 days, 7:48:57", "remaining_time": "1 day, 16:05:34", "throughput": 2728.73, "total_tokens": 1255591680} {"current_steps": 6954, "total_steps": 9134, "loss": 0.7616, "learning_rate": 6.704368183602386e-06, "epoch": 0.7612687813021702, "percentage": 76.13, "elapsed_time": "5 days, 7:50:03", "remaining_time": "1 day, 16:04:28", "throughput": 2728.72, "total_tokens": 1255765504} {"current_steps": 6955, "total_steps": 9134, "loss": 0.7269, "learning_rate": 6.698509370883429e-06, "epoch": 0.7613782533731082, "percentage": 76.14, "elapsed_time": "5 days, 7:51:08", "remaining_time": "1 day, 16:03:21", "throughput": 2728.77, "total_tokens": 1255965760} {"current_steps": 6956, "total_steps": 9134, "loss": 0.9119, "learning_rate": 6.692652723195836e-06, "epoch": 0.7614877254440461, "percentage": 76.16, "elapsed_time": "5 days, 7:52:16", "remaining_time": "1 day, 16:02:16", "throughput": 2728.78, "total_tokens": 1256157056} {"current_steps": 6957, "total_steps": 9134, "loss": 0.8523, "learning_rate": 6.686798241232428e-06, "epoch": 0.761597197514984, "percentage": 76.17, "elapsed_time": "5 days, 7:53:21", "remaining_time": "1 day, 16:01:09", "throughput": 2728.83, "total_tokens": 1256359328} {"current_steps": 6958, "total_steps": 9134, "loss": 0.665, "learning_rate": 6.680945925685778e-06, "epoch": 0.7617066695859219, "percentage": 76.18, "elapsed_time": "5 days, 7:54:26", "remaining_time": "1 day, 16:00:03", "throughput": 2728.85, "total_tokens": 1256545248} {"current_steps": 6959, "total_steps": 9134, "loss": 0.7031, "learning_rate": 6.675095777248208e-06, "epoch": 0.7618161416568598, "percentage": 76.19, "elapsed_time": "5 days, 7:55:25", "remaining_time": "1 day, 15:58:55", "throughput": 2728.81, "total_tokens": 1256688160} {"current_steps": 6960, "total_steps": 9134, "loss": 0.6921, "learning_rate": 6.669247796611774e-06, "epoch": 0.7619256137277977, "percentage": 76.2, "elapsed_time": "5 days, 7:56:24", "remaining_time": "1 day, 15:57:46", "throughput": 2728.75, "total_tokens": 1256820768} {"current_steps": 6961, "total_steps": 9134, "loss": 0.8674, "learning_rate": 6.663401984468281e-06, "epoch": 0.7620350857987356, "percentage": 76.21, "elapsed_time": "5 days, 7:57:29", "remaining_time": "1 day, 15:56:40", "throughput": 2728.79, "total_tokens": 1257016320} {"current_steps": 6962, "total_steps": 9134, "loss": 0.8157, "learning_rate": 6.657558341509276e-06, "epoch": 0.7621445578696735, "percentage": 76.22, "elapsed_time": "5 days, 7:58:35", "remaining_time": "1 day, 15:55:33", "throughput": 2728.8, "total_tokens": 1257197088} {"current_steps": 6963, "total_steps": 9134, "loss": 1.2146, "learning_rate": 6.651716868426061e-06, "epoch": 0.7622540299406114, "percentage": 76.23, "elapsed_time": "5 days, 7:59:40", "remaining_time": "1 day, 15:54:27", "throughput": 2728.83, "total_tokens": 1257392864} {"current_steps": 6964, "total_steps": 9134, "loss": 0.9292, "learning_rate": 6.645877565909664e-06, "epoch": 0.7623635020115493, "percentage": 76.24, "elapsed_time": "5 days, 8:00:48", "remaining_time": "1 day, 15:53:21", "throughput": 2728.83, "total_tokens": 1257574976} {"current_steps": 6965, "total_steps": 9134, "loss": 0.6703, "learning_rate": 6.6400404346508625e-06, "epoch": 0.7624729740824872, "percentage": 76.25, "elapsed_time": "5 days, 8:01:52", "remaining_time": "1 day, 15:52:14", "throughput": 2728.84, "total_tokens": 1257756416} {"current_steps": 6966, "total_steps": 9134, "loss": 0.8921, "learning_rate": 6.634205475340182e-06, "epoch": 0.7625824461534251, "percentage": 76.26, "elapsed_time": "5 days, 8:02:55", "remaining_time": "1 day, 15:51:07", "throughput": 2728.82, "total_tokens": 1257921056} {"current_steps": 6967, "total_steps": 9134, "loss": 0.8477, "learning_rate": 6.628372688667883e-06, "epoch": 0.762691918224363, "percentage": 76.28, "elapsed_time": "5 days, 8:04:00", "remaining_time": "1 day, 15:50:00", "throughput": 2728.82, "total_tokens": 1258098016} {"current_steps": 6968, "total_steps": 9134, "loss": 0.8869, "learning_rate": 6.622542075323973e-06, "epoch": 0.7628013902953009, "percentage": 76.29, "elapsed_time": "5 days, 8:05:07", "remaining_time": "1 day, 15:48:55", "throughput": 2728.85, "total_tokens": 1258296480} {"current_steps": 6969, "total_steps": 9134, "loss": 0.9329, "learning_rate": 6.6167136359982064e-06, "epoch": 0.7629108623662388, "percentage": 76.3, "elapsed_time": "5 days, 8:06:08", "remaining_time": "1 day, 15:47:47", "throughput": 2728.84, "total_tokens": 1258457312} {"current_steps": 6970, "total_steps": 9134, "loss": 0.8995, "learning_rate": 6.610887371380064e-06, "epoch": 0.7630203344371768, "percentage": 76.31, "elapsed_time": "5 days, 8:07:14", "remaining_time": "1 day, 15:46:41", "throughput": 2728.87, "total_tokens": 1258649504} {"current_steps": 6971, "total_steps": 9134, "loss": 0.8872, "learning_rate": 6.605063282158808e-06, "epoch": 0.7631298065081146, "percentage": 76.32, "elapsed_time": "5 days, 8:08:20", "remaining_time": "1 day, 15:45:34", "throughput": 2728.91, "total_tokens": 1258846624} {"current_steps": 6972, "total_steps": 9134, "loss": 0.8379, "learning_rate": 6.599241369023385e-06, "epoch": 0.7632392785790525, "percentage": 76.33, "elapsed_time": "5 days, 8:09:27", "remaining_time": "1 day, 15:44:29", "throughput": 2728.91, "total_tokens": 1259029632} {"current_steps": 6973, "total_steps": 9134, "loss": 0.9019, "learning_rate": 6.593421632662539e-06, "epoch": 0.7633487506499904, "percentage": 76.34, "elapsed_time": "5 days, 8:10:35", "remaining_time": "1 day, 15:43:23", "throughput": 2728.89, "total_tokens": 1259207712} {"current_steps": 6974, "total_steps": 9134, "loss": 0.7225, "learning_rate": 6.587604073764728e-06, "epoch": 0.7634582227209283, "percentage": 76.35, "elapsed_time": "5 days, 8:11:42", "remaining_time": "1 day, 15:42:17", "throughput": 2728.89, "total_tokens": 1259388928} {"current_steps": 6975, "total_steps": 9134, "loss": 0.9872, "learning_rate": 6.581788693018154e-06, "epoch": 0.7635676947918663, "percentage": 76.36, "elapsed_time": "5 days, 8:12:49", "remaining_time": "1 day, 15:41:11", "throughput": 2728.89, "total_tokens": 1259575072} {"current_steps": 6976, "total_steps": 9134, "loss": 0.7461, "learning_rate": 6.575975491110769e-06, "epoch": 0.7636771668628042, "percentage": 76.37, "elapsed_time": "5 days, 8:13:53", "remaining_time": "1 day, 15:40:04", "throughput": 2728.88, "total_tokens": 1259744416} {"current_steps": 6977, "total_steps": 9134, "loss": 0.7605, "learning_rate": 6.570164468730258e-06, "epoch": 0.763786638933742, "percentage": 76.38, "elapsed_time": "5 days, 8:14:59", "remaining_time": "1 day, 15:38:58", "throughput": 2728.9, "total_tokens": 1259931008} {"current_steps": 6978, "total_steps": 9134, "loss": 0.6357, "learning_rate": 6.56435562656407e-06, "epoch": 0.7638961110046799, "percentage": 76.4, "elapsed_time": "5 days, 8:16:02", "remaining_time": "1 day, 15:37:51", "throughput": 2728.87, "total_tokens": 1260091616} {"current_steps": 6979, "total_steps": 9134, "loss": 1.0362, "learning_rate": 6.558548965299355e-06, "epoch": 0.7640055830756178, "percentage": 76.41, "elapsed_time": "5 days, 8:17:10", "remaining_time": "1 day, 15:36:45", "throughput": 2728.89, "total_tokens": 1260286272} {"current_steps": 6980, "total_steps": 9134, "loss": 0.967, "learning_rate": 6.552744485623058e-06, "epoch": 0.7641150551465558, "percentage": 76.42, "elapsed_time": "5 days, 8:18:15", "remaining_time": "1 day, 15:35:39", "throughput": 2728.9, "total_tokens": 1260465248} {"current_steps": 6981, "total_steps": 9134, "loss": 0.6375, "learning_rate": 6.5469421882218075e-06, "epoch": 0.7642245272174937, "percentage": 76.43, "elapsed_time": "5 days, 8:19:20", "remaining_time": "1 day, 15:34:32", "throughput": 2728.95, "total_tokens": 1260670208} {"current_steps": 6982, "total_steps": 9134, "loss": 0.9057, "learning_rate": 6.541142073782028e-06, "epoch": 0.7643339992884315, "percentage": 76.44, "elapsed_time": "5 days, 8:20:21", "remaining_time": "1 day, 15:33:24", "throughput": 2728.9, "total_tokens": 1260809760} {"current_steps": 6983, "total_steps": 9134, "loss": 1.0672, "learning_rate": 6.535344142989852e-06, "epoch": 0.7644434713593694, "percentage": 76.45, "elapsed_time": "5 days, 8:21:25", "remaining_time": "1 day, 15:32:17", "throughput": 2728.91, "total_tokens": 1260990976} {"current_steps": 6984, "total_steps": 9134, "loss": 0.7156, "learning_rate": 6.529548396531168e-06, "epoch": 0.7645529434303073, "percentage": 76.46, "elapsed_time": "5 days, 8:22:26", "remaining_time": "1 day, 15:31:10", "throughput": 2728.9, "total_tokens": 1261149344} {"current_steps": 6985, "total_steps": 9134, "loss": 0.909, "learning_rate": 6.523754835091597e-06, "epoch": 0.7646624155012453, "percentage": 76.47, "elapsed_time": "5 days, 8:23:33", "remaining_time": "1 day, 15:30:04", "throughput": 2728.94, "total_tokens": 1261351840} {"current_steps": 6986, "total_steps": 9134, "loss": 0.7079, "learning_rate": 6.517963459356502e-06, "epoch": 0.7647718875721832, "percentage": 76.48, "elapsed_time": "5 days, 8:24:37", "remaining_time": "1 day, 15:28:57", "throughput": 2728.9, "total_tokens": 1261511552} {"current_steps": 6987, "total_steps": 9134, "loss": 0.9208, "learning_rate": 6.512174270011015e-06, "epoch": 0.7648813596431211, "percentage": 76.49, "elapsed_time": "5 days, 8:25:42", "remaining_time": "1 day, 15:27:50", "throughput": 2728.88, "total_tokens": 1261675296} {"current_steps": 6988, "total_steps": 9134, "loss": 1.0308, "learning_rate": 6.5063872677399525e-06, "epoch": 0.7649908317140589, "percentage": 76.51, "elapsed_time": "5 days, 8:26:47", "remaining_time": "1 day, 15:26:44", "throughput": 2728.88, "total_tokens": 1261855392} {"current_steps": 6989, "total_steps": 9134, "loss": 0.8272, "learning_rate": 6.500602453227936e-06, "epoch": 0.7651003037849968, "percentage": 76.52, "elapsed_time": "5 days, 8:27:46", "remaining_time": "1 day, 15:25:36", "throughput": 2728.87, "total_tokens": 1262009056} {"current_steps": 6990, "total_steps": 9134, "loss": 0.801, "learning_rate": 6.494819827159271e-06, "epoch": 0.7652097758559347, "percentage": 76.53, "elapsed_time": "5 days, 8:28:53", "remaining_time": "1 day, 15:24:30", "throughput": 2728.91, "total_tokens": 1262213568} {"current_steps": 6991, "total_steps": 9134, "loss": 0.6824, "learning_rate": 6.489039390218052e-06, "epoch": 0.7653192479268727, "percentage": 76.54, "elapsed_time": "5 days, 8:29:54", "remaining_time": "1 day, 15:23:22", "throughput": 2728.9, "total_tokens": 1262375520} {"current_steps": 6992, "total_steps": 9134, "loss": 0.7836, "learning_rate": 6.483261143088084e-06, "epoch": 0.7654287199978106, "percentage": 76.55, "elapsed_time": "5 days, 8:30:59", "remaining_time": "1 day, 15:22:15", "throughput": 2728.87, "total_tokens": 1262536352} {"current_steps": 6993, "total_steps": 9134, "loss": 1.2439, "learning_rate": 6.477485086452928e-06, "epoch": 0.7655381920687485, "percentage": 76.56, "elapsed_time": "5 days, 8:32:06", "remaining_time": "1 day, 15:21:09", "throughput": 2728.91, "total_tokens": 1262738624} {"current_steps": 6994, "total_steps": 9134, "loss": 0.7429, "learning_rate": 6.471711220995877e-06, "epoch": 0.7656476641396863, "percentage": 76.57, "elapsed_time": "5 days, 8:33:12", "remaining_time": "1 day, 15:20:03", "throughput": 2728.93, "total_tokens": 1262928800} {"current_steps": 6995, "total_steps": 9134, "loss": 0.7205, "learning_rate": 6.46593954739996e-06, "epoch": 0.7657571362106242, "percentage": 76.58, "elapsed_time": "5 days, 8:34:17", "remaining_time": "1 day, 15:18:57", "throughput": 2728.92, "total_tokens": 1263103520} {"current_steps": 6996, "total_steps": 9134, "loss": 1.137, "learning_rate": 6.460170066347979e-06, "epoch": 0.7658666082815622, "percentage": 76.59, "elapsed_time": "5 days, 8:35:25", "remaining_time": "1 day, 15:17:51", "throughput": 2728.99, "total_tokens": 1263319904} {"current_steps": 6997, "total_steps": 9134, "loss": 0.7584, "learning_rate": 6.4544027785224195e-06, "epoch": 0.7659760803525001, "percentage": 76.6, "elapsed_time": "5 days, 8:36:32", "remaining_time": "1 day, 15:16:45", "throughput": 2729.04, "total_tokens": 1263523520} {"current_steps": 6998, "total_steps": 9134, "loss": 0.7762, "learning_rate": 6.448637684605569e-06, "epoch": 0.766085552423438, "percentage": 76.61, "elapsed_time": "5 days, 8:37:40", "remaining_time": "1 day, 15:15:40", "throughput": 2729.1, "total_tokens": 1263737216} {"current_steps": 6999, "total_steps": 9134, "loss": 0.8547, "learning_rate": 6.442874785279415e-06, "epoch": 0.7661950244943758, "percentage": 76.63, "elapsed_time": "5 days, 8:38:45", "remaining_time": "1 day, 15:14:33", "throughput": 2729.1, "total_tokens": 1263916416} {"current_steps": 7000, "total_steps": 9134, "loss": 0.7911, "learning_rate": 6.437114081225698e-06, "epoch": 0.7663044965653137, "percentage": 76.64, "elapsed_time": "5 days, 8:39:53", "remaining_time": "1 day, 15:13:27", "throughput": 2729.14, "total_tokens": 1264121600} {"current_steps": 7001, "total_steps": 9134, "loss": 0.5821, "learning_rate": 6.431355573125899e-06, "epoch": 0.7664139686362517, "percentage": 76.65, "elapsed_time": "5 days, 8:40:57", "remaining_time": "1 day, 15:12:21", "throughput": 2729.15, "total_tokens": 1264298560} {"current_steps": 7002, "total_steps": 9134, "loss": 0.8606, "learning_rate": 6.4255992616612385e-06, "epoch": 0.7665234407071896, "percentage": 76.66, "elapsed_time": "5 days, 8:42:03", "remaining_time": "1 day, 15:11:14", "throughput": 2729.15, "total_tokens": 1264478432} {"current_steps": 7003, "total_steps": 9134, "loss": 0.8312, "learning_rate": 6.419845147512679e-06, "epoch": 0.7666329127781275, "percentage": 76.67, "elapsed_time": "5 days, 8:43:06", "remaining_time": "1 day, 15:10:07", "throughput": 2729.14, "total_tokens": 1264644640} {"current_steps": 7004, "total_steps": 9134, "loss": 0.8881, "learning_rate": 6.4140932313609096e-06, "epoch": 0.7667423848490654, "percentage": 76.68, "elapsed_time": "5 days, 8:44:07", "remaining_time": "1 day, 15:09:00", "throughput": 2729.15, "total_tokens": 1264820256} {"current_steps": 7005, "total_steps": 9134, "loss": 0.7918, "learning_rate": 6.408343513886389e-06, "epoch": 0.7668518569200032, "percentage": 76.69, "elapsed_time": "5 days, 8:45:14", "remaining_time": "1 day, 15:07:54", "throughput": 2729.16, "total_tokens": 1265003264} {"current_steps": 7006, "total_steps": 9134, "loss": 0.8011, "learning_rate": 6.402595995769289e-06, "epoch": 0.7669613289909412, "percentage": 76.7, "elapsed_time": "5 days, 8:46:19", "remaining_time": "1 day, 15:06:47", "throughput": 2729.19, "total_tokens": 1265193888} {"current_steps": 7007, "total_steps": 9134, "loss": 0.6789, "learning_rate": 6.396850677689531e-06, "epoch": 0.7670708010618791, "percentage": 76.71, "elapsed_time": "5 days, 8:47:20", "remaining_time": "1 day, 15:05:39", "throughput": 2729.19, "total_tokens": 1265360768} {"current_steps": 7008, "total_steps": 9134, "loss": 0.844, "learning_rate": 6.391107560326776e-06, "epoch": 0.767180273132817, "percentage": 76.72, "elapsed_time": "5 days, 8:48:25", "remaining_time": "1 day, 15:04:33", "throughput": 2729.19, "total_tokens": 1265537952} {"current_steps": 7009, "total_steps": 9134, "loss": 0.969, "learning_rate": 6.385366644360419e-06, "epoch": 0.7672897452037549, "percentage": 76.74, "elapsed_time": "5 days, 8:49:31", "remaining_time": "1 day, 15:03:26", "throughput": 2729.23, "total_tokens": 1265738880} {"current_steps": 7010, "total_steps": 9134, "loss": 0.7987, "learning_rate": 6.379627930469598e-06, "epoch": 0.7673992172746928, "percentage": 76.75, "elapsed_time": "5 days, 8:50:37", "remaining_time": "1 day, 15:02:20", "throughput": 2729.22, "total_tokens": 1265912704} {"current_steps": 7011, "total_steps": 9134, "loss": 0.7798, "learning_rate": 6.373891419333211e-06, "epoch": 0.7675086893456307, "percentage": 76.76, "elapsed_time": "5 days, 8:51:43", "remaining_time": "1 day, 15:01:14", "throughput": 2729.23, "total_tokens": 1266097952} {"current_steps": 7012, "total_steps": 9134, "loss": 0.6739, "learning_rate": 6.368157111629846e-06, "epoch": 0.7676181614165686, "percentage": 76.77, "elapsed_time": "5 days, 8:52:47", "remaining_time": "1 day, 15:00:07", "throughput": 2729.23, "total_tokens": 1266272896} {"current_steps": 7013, "total_steps": 9134, "loss": 0.6608, "learning_rate": 6.362425008037895e-06, "epoch": 0.7677276334875065, "percentage": 76.78, "elapsed_time": "5 days, 8:53:52", "remaining_time": "1 day, 14:59:01", "throughput": 2729.24, "total_tokens": 1266457024} {"current_steps": 7014, "total_steps": 9134, "loss": 0.9824, "learning_rate": 6.35669510923542e-06, "epoch": 0.7678371055584444, "percentage": 76.79, "elapsed_time": "5 days, 8:54:58", "remaining_time": "1 day, 14:57:55", "throughput": 2729.26, "total_tokens": 1266645632} {"current_steps": 7015, "total_steps": 9134, "loss": 0.819, "learning_rate": 6.35096741590028e-06, "epoch": 0.7679465776293823, "percentage": 76.8, "elapsed_time": "5 days, 8:56:00", "remaining_time": "1 day, 14:56:47", "throughput": 2729.2, "total_tokens": 1266784960} {"current_steps": 7016, "total_steps": 9134, "loss": 0.8471, "learning_rate": 6.345241928710044e-06, "epoch": 0.7680560497003202, "percentage": 76.81, "elapsed_time": "5 days, 8:57:04", "remaining_time": "1 day, 14:55:40", "throughput": 2729.18, "total_tokens": 1266954080} {"current_steps": 7017, "total_steps": 9134, "loss": 0.6178, "learning_rate": 6.339518648342019e-06, "epoch": 0.7681655217712581, "percentage": 76.82, "elapsed_time": "5 days, 8:58:11", "remaining_time": "1 day, 14:54:34", "throughput": 2729.17, "total_tokens": 1267128576} {"current_steps": 7018, "total_steps": 9134, "loss": 1.0199, "learning_rate": 6.33379757547328e-06, "epoch": 0.768274993842196, "percentage": 76.83, "elapsed_time": "5 days, 8:59:13", "remaining_time": "1 day, 14:53:27", "throughput": 2729.16, "total_tokens": 1267295456} {"current_steps": 7019, "total_steps": 9134, "loss": 1.1263, "learning_rate": 6.328078710780588e-06, "epoch": 0.7683844659131339, "percentage": 76.84, "elapsed_time": "5 days, 9:00:18", "remaining_time": "1 day, 14:52:20", "throughput": 2729.14, "total_tokens": 1267465024} {"current_steps": 7020, "total_steps": 9134, "loss": 0.7976, "learning_rate": 6.322362054940506e-06, "epoch": 0.7684939379840718, "percentage": 76.86, "elapsed_time": "5 days, 9:01:21", "remaining_time": "1 day, 14:51:13", "throughput": 2729.14, "total_tokens": 1267633472} {"current_steps": 7021, "total_steps": 9134, "loss": 0.7009, "learning_rate": 6.316647608629272e-06, "epoch": 0.7686034100550098, "percentage": 76.87, "elapsed_time": "5 days, 9:02:25", "remaining_time": "1 day, 14:50:06", "throughput": 2729.12, "total_tokens": 1267799232} {"current_steps": 7022, "total_steps": 9134, "loss": 0.596, "learning_rate": 6.310935372522925e-06, "epoch": 0.7687128821259476, "percentage": 76.88, "elapsed_time": "5 days, 9:03:26", "remaining_time": "1 day, 14:48:59", "throughput": 2729.12, "total_tokens": 1267963872} {"current_steps": 7023, "total_steps": 9134, "loss": 0.811, "learning_rate": 6.305225347297181e-06, "epoch": 0.7688223541968855, "percentage": 76.89, "elapsed_time": "5 days, 9:04:31", "remaining_time": "1 day, 14:47:52", "throughput": 2729.16, "total_tokens": 1268163456} {"current_steps": 7024, "total_steps": 9134, "loss": 0.8374, "learning_rate": 6.299517533627547e-06, "epoch": 0.7689318262678234, "percentage": 76.9, "elapsed_time": "5 days, 9:05:36", "remaining_time": "1 day, 14:46:46", "throughput": 2729.19, "total_tokens": 1268354752} {"current_steps": 7025, "total_steps": 9134, "loss": 1.1124, "learning_rate": 6.293811932189239e-06, "epoch": 0.7690412983387613, "percentage": 76.91, "elapsed_time": "5 days, 9:06:37", "remaining_time": "1 day, 14:45:38", "throughput": 2729.2, "total_tokens": 1268526112} {"current_steps": 7026, "total_steps": 9134, "loss": 0.707, "learning_rate": 6.28810854365722e-06, "epoch": 0.7691507704096993, "percentage": 76.92, "elapsed_time": "5 days, 9:07:40", "remaining_time": "1 day, 14:44:31", "throughput": 2729.21, "total_tokens": 1268702400} {"current_steps": 7027, "total_steps": 9134, "loss": 1.0515, "learning_rate": 6.282407368706189e-06, "epoch": 0.7692602424806372, "percentage": 76.93, "elapsed_time": "5 days, 9:08:47", "remaining_time": "1 day, 14:43:25", "throughput": 2729.22, "total_tokens": 1268887200} {"current_steps": 7028, "total_steps": 9134, "loss": 0.6614, "learning_rate": 6.276708408010576e-06, "epoch": 0.769369714551575, "percentage": 76.94, "elapsed_time": "5 days, 9:09:47", "remaining_time": "1 day, 14:42:17", "throughput": 2729.2, "total_tokens": 1269044000} {"current_steps": 7029, "total_steps": 9134, "loss": 0.9788, "learning_rate": 6.27101166224458e-06, "epoch": 0.7694791866225129, "percentage": 76.95, "elapsed_time": "5 days, 9:10:52", "remaining_time": "1 day, 14:41:10", "throughput": 2729.2, "total_tokens": 1269220512} {"current_steps": 7030, "total_steps": 9134, "loss": 0.7799, "learning_rate": 6.265317132082088e-06, "epoch": 0.7695886586934508, "percentage": 76.97, "elapsed_time": "5 days, 9:11:58", "remaining_time": "1 day, 14:40:04", "throughput": 2729.2, "total_tokens": 1269404192} {"current_steps": 7031, "total_steps": 9134, "loss": 0.8535, "learning_rate": 6.259624818196772e-06, "epoch": 0.7696981307643888, "percentage": 76.98, "elapsed_time": "5 days, 9:13:03", "remaining_time": "1 day, 14:38:58", "throughput": 2729.23, "total_tokens": 1269595040} {"current_steps": 7032, "total_steps": 9134, "loss": 0.5934, "learning_rate": 6.253934721262014e-06, "epoch": 0.7698076028353267, "percentage": 76.99, "elapsed_time": "5 days, 9:14:05", "remaining_time": "1 day, 14:37:50", "throughput": 2729.22, "total_tokens": 1269758336} {"current_steps": 7033, "total_steps": 9134, "loss": 0.9774, "learning_rate": 6.248246841950942e-06, "epoch": 0.7699170749062645, "percentage": 77.0, "elapsed_time": "5 days, 9:15:12", "remaining_time": "1 day, 14:36:44", "throughput": 2729.22, "total_tokens": 1269940000} {"current_steps": 7034, "total_steps": 9134, "loss": 0.7631, "learning_rate": 6.242561180936421e-06, "epoch": 0.7700265469772024, "percentage": 77.01, "elapsed_time": "5 days, 9:16:13", "remaining_time": "1 day, 14:35:37", "throughput": 2729.2, "total_tokens": 1270098144} {"current_steps": 7035, "total_steps": 9134, "loss": 0.8519, "learning_rate": 6.236877738891053e-06, "epoch": 0.7701360190481403, "percentage": 77.02, "elapsed_time": "5 days, 9:17:20", "remaining_time": "1 day, 14:34:31", "throughput": 2729.27, "total_tokens": 1270312288} {"current_steps": 7036, "total_steps": 9134, "loss": 0.9846, "learning_rate": 6.231196516487181e-06, "epoch": 0.7702454911190783, "percentage": 77.03, "elapsed_time": "5 days, 9:18:23", "remaining_time": "1 day, 14:33:24", "throughput": 2729.29, "total_tokens": 1270495520} {"current_steps": 7037, "total_steps": 9134, "loss": 0.8724, "learning_rate": 6.225517514396873e-06, "epoch": 0.7703549631900162, "percentage": 77.04, "elapsed_time": "5 days, 9:19:28", "remaining_time": "1 day, 14:32:17", "throughput": 2729.32, "total_tokens": 1270685248} {"current_steps": 7038, "total_steps": 9134, "loss": 0.5854, "learning_rate": 6.219840733291959e-06, "epoch": 0.7704644352609541, "percentage": 77.05, "elapsed_time": "5 days, 9:20:32", "remaining_time": "1 day, 14:31:10", "throughput": 2729.31, "total_tokens": 1270857952} {"current_steps": 7039, "total_steps": 9134, "loss": 0.8448, "learning_rate": 6.2141661738439884e-06, "epoch": 0.7705739073318919, "percentage": 77.06, "elapsed_time": "5 days, 9:21:35", "remaining_time": "1 day, 14:30:03", "throughput": 2729.31, "total_tokens": 1271030208} {"current_steps": 7040, "total_steps": 9134, "loss": 0.6917, "learning_rate": 6.208493836724244e-06, "epoch": 0.7706833794028298, "percentage": 77.07, "elapsed_time": "5 days, 9:22:41", "remaining_time": "1 day, 14:28:57", "throughput": 2729.36, "total_tokens": 1271230016} {"current_steps": 7041, "total_steps": 9134, "loss": 0.6913, "learning_rate": 6.202823722603757e-06, "epoch": 0.7707928514737677, "percentage": 77.09, "elapsed_time": "5 days, 9:23:49", "remaining_time": "1 day, 14:27:51", "throughput": 2729.38, "total_tokens": 1271426240} {"current_steps": 7042, "total_steps": 9134, "loss": 1.1706, "learning_rate": 6.197155832153287e-06, "epoch": 0.7709023235447057, "percentage": 77.1, "elapsed_time": "5 days, 9:24:56", "remaining_time": "1 day, 14:26:46", "throughput": 2729.4, "total_tokens": 1271620448} {"current_steps": 7043, "total_steps": 9134, "loss": 1.0093, "learning_rate": 6.191490166043337e-06, "epoch": 0.7710117956156436, "percentage": 77.11, "elapsed_time": "5 days, 9:26:02", "remaining_time": "1 day, 14:25:39", "throughput": 2729.45, "total_tokens": 1271820928} {"current_steps": 7044, "total_steps": 9134, "loss": 0.6871, "learning_rate": 6.185826724944146e-06, "epoch": 0.7711212676865815, "percentage": 77.12, "elapsed_time": "5 days, 9:27:00", "remaining_time": "1 day, 14:24:31", "throughput": 2729.43, "total_tokens": 1271972576} {"current_steps": 7045, "total_steps": 9134, "loss": 0.7507, "learning_rate": 6.180165509525682e-06, "epoch": 0.7712307397575193, "percentage": 77.13, "elapsed_time": "5 days, 9:28:02", "remaining_time": "1 day, 14:23:23", "throughput": 2729.42, "total_tokens": 1272135872} {"current_steps": 7046, "total_steps": 9134, "loss": 0.7419, "learning_rate": 6.174506520457665e-06, "epoch": 0.7713402118284572, "percentage": 77.14, "elapsed_time": "5 days, 9:29:06", "remaining_time": "1 day, 14:22:16", "throughput": 2729.42, "total_tokens": 1272308352} {"current_steps": 7047, "total_steps": 9134, "loss": 0.7314, "learning_rate": 6.168849758409539e-06, "epoch": 0.7714496838993952, "percentage": 77.15, "elapsed_time": "5 days, 9:30:08", "remaining_time": "1 day, 14:21:09", "throughput": 2729.38, "total_tokens": 1272460224} {"current_steps": 7048, "total_steps": 9134, "loss": 0.997, "learning_rate": 6.163195224050488e-06, "epoch": 0.7715591559703331, "percentage": 77.16, "elapsed_time": "5 days, 9:31:13", "remaining_time": "1 day, 14:20:03", "throughput": 2729.42, "total_tokens": 1272653984} {"current_steps": 7049, "total_steps": 9134, "loss": 0.8242, "learning_rate": 6.157542918049433e-06, "epoch": 0.771668628041271, "percentage": 77.17, "elapsed_time": "5 days, 9:32:13", "remaining_time": "1 day, 14:18:55", "throughput": 2729.4, "total_tokens": 1272813248} {"current_steps": 7050, "total_steps": 9134, "loss": 0.9673, "learning_rate": 6.151892841075027e-06, "epoch": 0.7717781001122088, "percentage": 77.18, "elapsed_time": "5 days, 9:33:20", "remaining_time": "1 day, 14:17:49", "throughput": 2729.47, "total_tokens": 1273024032} {"current_steps": 7051, "total_steps": 9134, "loss": 0.7719, "learning_rate": 6.146244993795669e-06, "epoch": 0.7718875721831467, "percentage": 77.2, "elapsed_time": "5 days, 9:34:24", "remaining_time": "1 day, 14:16:42", "throughput": 2729.46, "total_tokens": 1273196736} {"current_steps": 7052, "total_steps": 9134, "loss": 0.8508, "learning_rate": 6.14059937687948e-06, "epoch": 0.7719970442540847, "percentage": 77.21, "elapsed_time": "5 days, 9:35:26", "remaining_time": "1 day, 14:15:35", "throughput": 2729.48, "total_tokens": 1273373920} {"current_steps": 7053, "total_steps": 9134, "loss": 1.0682, "learning_rate": 6.1349559909943425e-06, "epoch": 0.7721065163250226, "percentage": 77.22, "elapsed_time": "5 days, 9:36:32", "remaining_time": "1 day, 14:14:28", "throughput": 2729.48, "total_tokens": 1273554240} {"current_steps": 7054, "total_steps": 9134, "loss": 0.7695, "learning_rate": 6.129314836807834e-06, "epoch": 0.7722159883959605, "percentage": 77.23, "elapsed_time": "5 days, 9:37:36", "remaining_time": "1 day, 14:13:22", "throughput": 2729.52, "total_tokens": 1273749344} {"current_steps": 7055, "total_steps": 9134, "loss": 0.7262, "learning_rate": 6.123675914987323e-06, "epoch": 0.7723254604668984, "percentage": 77.24, "elapsed_time": "5 days, 9:38:43", "remaining_time": "1 day, 14:12:16", "throughput": 2729.56, "total_tokens": 1273951840} {"current_steps": 7056, "total_steps": 9134, "loss": 0.9653, "learning_rate": 6.1180392261998484e-06, "epoch": 0.7724349325378362, "percentage": 77.25, "elapsed_time": "5 days, 9:39:47", "remaining_time": "1 day, 14:11:09", "throughput": 2729.56, "total_tokens": 1274122080} {"current_steps": 7057, "total_steps": 9134, "loss": 0.7795, "learning_rate": 6.112404771112246e-06, "epoch": 0.7725444046087742, "percentage": 77.26, "elapsed_time": "5 days, 9:40:51", "remaining_time": "1 day, 14:10:02", "throughput": 2729.59, "total_tokens": 1274315392} {"current_steps": 7058, "total_steps": 9134, "loss": 1.023, "learning_rate": 6.106772550391052e-06, "epoch": 0.7726538766797121, "percentage": 77.27, "elapsed_time": "5 days, 9:41:57", "remaining_time": "1 day, 14:08:56", "throughput": 2729.63, "total_tokens": 1274510944} {"current_steps": 7059, "total_steps": 9134, "loss": 0.7885, "learning_rate": 6.101142564702539e-06, "epoch": 0.77276334875065, "percentage": 77.28, "elapsed_time": "5 days, 9:43:04", "remaining_time": "1 day, 14:07:50", "throughput": 2729.65, "total_tokens": 1274704032} {"current_steps": 7060, "total_steps": 9134, "loss": 0.7571, "learning_rate": 6.095514814712747e-06, "epoch": 0.7728728208215879, "percentage": 77.29, "elapsed_time": "5 days, 9:44:12", "remaining_time": "1 day, 14:06:44", "throughput": 2729.7, "total_tokens": 1274912128} {"current_steps": 7061, "total_steps": 9134, "loss": 0.8818, "learning_rate": 6.089889301087398e-06, "epoch": 0.7729822928925258, "percentage": 77.3, "elapsed_time": "5 days, 9:45:16", "remaining_time": "1 day, 14:05:38", "throughput": 2729.69, "total_tokens": 1275083040} {"current_steps": 7062, "total_steps": 9134, "loss": 0.9021, "learning_rate": 6.084266024492011e-06, "epoch": 0.7730917649634637, "percentage": 77.32, "elapsed_time": "5 days, 9:46:21", "remaining_time": "1 day, 14:04:31", "throughput": 2729.68, "total_tokens": 1275254848} {"current_steps": 7063, "total_steps": 9134, "loss": 0.6819, "learning_rate": 6.078644985591778e-06, "epoch": 0.7732012370344016, "percentage": 77.33, "elapsed_time": "5 days, 9:47:23", "remaining_time": "1 day, 14:03:24", "throughput": 2729.66, "total_tokens": 1275415232} {"current_steps": 7064, "total_steps": 9134, "loss": 0.6285, "learning_rate": 6.0730261850516865e-06, "epoch": 0.7733107091053395, "percentage": 77.34, "elapsed_time": "5 days, 9:48:31", "remaining_time": "1 day, 14:02:18", "throughput": 2729.66, "total_tokens": 1275602720} {"current_steps": 7065, "total_steps": 9134, "loss": 0.8252, "learning_rate": 6.067409623536399e-06, "epoch": 0.7734201811762774, "percentage": 77.35, "elapsed_time": "5 days, 9:49:34", "remaining_time": "1 day, 14:01:11", "throughput": 2729.68, "total_tokens": 1275782816} {"current_steps": 7066, "total_steps": 9134, "loss": 0.7356, "learning_rate": 6.061795301710368e-06, "epoch": 0.7735296532472153, "percentage": 77.36, "elapsed_time": "5 days, 9:50:41", "remaining_time": "1 day, 14:00:05", "throughput": 2729.7, "total_tokens": 1275976800} {"current_steps": 7067, "total_steps": 9134, "loss": 1.1747, "learning_rate": 6.056183220237749e-06, "epoch": 0.7736391253181532, "percentage": 77.37, "elapsed_time": "5 days, 9:51:48", "remaining_time": "1 day, 13:58:59", "throughput": 2729.76, "total_tokens": 1276187360} {"current_steps": 7068, "total_steps": 9134, "loss": 0.9811, "learning_rate": 6.05057337978244e-06, "epoch": 0.7737485973890911, "percentage": 77.38, "elapsed_time": "5 days, 9:52:56", "remaining_time": "1 day, 13:57:54", "throughput": 2729.8, "total_tokens": 1276390752} {"current_steps": 7069, "total_steps": 9134, "loss": 0.7985, "learning_rate": 6.044965781008077e-06, "epoch": 0.773858069460029, "percentage": 77.39, "elapsed_time": "5 days, 9:54:02", "remaining_time": "1 day, 13:56:47", "throughput": 2729.84, "total_tokens": 1276588544} {"current_steps": 7070, "total_steps": 9134, "loss": 0.7445, "learning_rate": 6.039360424578017e-06, "epoch": 0.7739675415309669, "percentage": 77.4, "elapsed_time": "5 days, 9:55:07", "remaining_time": "1 day, 13:55:41", "throughput": 2729.82, "total_tokens": 1276759008} {"current_steps": 7071, "total_steps": 9134, "loss": 1.134, "learning_rate": 6.033757311155386e-06, "epoch": 0.7740770136019048, "percentage": 77.41, "elapsed_time": "5 days, 9:56:15", "remaining_time": "1 day, 13:54:35", "throughput": 2729.84, "total_tokens": 1276952992} {"current_steps": 7072, "total_steps": 9134, "loss": 0.7267, "learning_rate": 6.028156441402996e-06, "epoch": 0.7741864856728428, "percentage": 77.43, "elapsed_time": "5 days, 9:57:18", "remaining_time": "1 day, 13:53:28", "throughput": 2729.81, "total_tokens": 1277110016} {"current_steps": 7073, "total_steps": 9134, "loss": 0.7452, "learning_rate": 6.022557815983437e-06, "epoch": 0.7742959577437806, "percentage": 77.44, "elapsed_time": "5 days, 9:58:25", "remaining_time": "1 day, 13:52:22", "throughput": 2729.85, "total_tokens": 1277310048} {"current_steps": 7074, "total_steps": 9134, "loss": 0.7344, "learning_rate": 6.01696143555901e-06, "epoch": 0.7744054298147185, "percentage": 77.45, "elapsed_time": "5 days, 9:59:31", "remaining_time": "1 day, 13:51:16", "throughput": 2729.85, "total_tokens": 1277491936} {"current_steps": 7075, "total_steps": 9134, "loss": 0.8633, "learning_rate": 6.011367300791754e-06, "epoch": 0.7745149018856564, "percentage": 77.46, "elapsed_time": "5 days, 10:00:35", "remaining_time": "1 day, 13:50:09", "throughput": 2729.84, "total_tokens": 1277665088} {"current_steps": 7076, "total_steps": 9134, "loss": 1.0539, "learning_rate": 6.005775412343448e-06, "epoch": 0.7746243739565943, "percentage": 77.47, "elapsed_time": "5 days, 10:01:42", "remaining_time": "1 day, 13:49:03", "throughput": 2729.86, "total_tokens": 1277852800} {"current_steps": 7077, "total_steps": 9134, "loss": 0.8265, "learning_rate": 6.0001857708755996e-06, "epoch": 0.7747338460275323, "percentage": 77.48, "elapsed_time": "5 days, 10:02:49", "remaining_time": "1 day, 13:47:58", "throughput": 2729.88, "total_tokens": 1278046784} {"current_steps": 7078, "total_steps": 9134, "loss": 0.5865, "learning_rate": 5.994598377049446e-06, "epoch": 0.7748433180984702, "percentage": 77.49, "elapsed_time": "5 days, 10:03:56", "remaining_time": "1 day, 13:46:52", "throughput": 2729.9, "total_tokens": 1278240768} {"current_steps": 7079, "total_steps": 9134, "loss": 0.7526, "learning_rate": 5.989013231525978e-06, "epoch": 0.774952790169408, "percentage": 77.5, "elapsed_time": "5 days, 10:05:00", "remaining_time": "1 day, 13:45:45", "throughput": 2729.92, "total_tokens": 1278422880} {"current_steps": 7080, "total_steps": 9134, "loss": 0.7515, "learning_rate": 5.983430334965903e-06, "epoch": 0.7750622622403459, "percentage": 77.51, "elapsed_time": "5 days, 10:06:05", "remaining_time": "1 day, 13:44:39", "throughput": 2729.98, "total_tokens": 1278627392} {"current_steps": 7081, "total_steps": 9134, "loss": 0.804, "learning_rate": 5.977849688029666e-06, "epoch": 0.7751717343112838, "percentage": 77.52, "elapsed_time": "5 days, 10:07:10", "remaining_time": "1 day, 13:43:32", "throughput": 2729.98, "total_tokens": 1278802336} {"current_steps": 7082, "total_steps": 9134, "loss": 0.9395, "learning_rate": 5.972271291377446e-06, "epoch": 0.7752812063822218, "percentage": 77.53, "elapsed_time": "5 days, 10:08:13", "remaining_time": "1 day, 13:42:25", "throughput": 2729.98, "total_tokens": 1278980192} {"current_steps": 7083, "total_steps": 9134, "loss": 1.0355, "learning_rate": 5.96669514566916e-06, "epoch": 0.7753906784531597, "percentage": 77.55, "elapsed_time": "5 days, 10:09:18", "remaining_time": "1 day, 13:41:18", "throughput": 2729.99, "total_tokens": 1279157376} {"current_steps": 7084, "total_steps": 9134, "loss": 0.9748, "learning_rate": 5.96112125156445e-06, "epoch": 0.7755001505240975, "percentage": 77.56, "elapsed_time": "5 days, 10:10:23", "remaining_time": "1 day, 13:40:12", "throughput": 2730.06, "total_tokens": 1279368832} {"current_steps": 7085, "total_steps": 9134, "loss": 0.8729, "learning_rate": 5.9555496097226934e-06, "epoch": 0.7756096225950354, "percentage": 77.57, "elapsed_time": "5 days, 10:11:30", "remaining_time": "1 day, 13:39:06", "throughput": 2730.01, "total_tokens": 1279528768} {"current_steps": 7086, "total_steps": 9134, "loss": 0.871, "learning_rate": 5.949980220803025e-06, "epoch": 0.7757190946659733, "percentage": 77.58, "elapsed_time": "5 days, 10:12:35", "remaining_time": "1 day, 13:37:59", "throughput": 2730.04, "total_tokens": 1279718944} {"current_steps": 7087, "total_steps": 9134, "loss": 1.0069, "learning_rate": 5.944413085464265e-06, "epoch": 0.7758285667369113, "percentage": 77.59, "elapsed_time": "5 days, 10:13:37", "remaining_time": "1 day, 13:36:52", "throughput": 2730.06, "total_tokens": 1279898368} {"current_steps": 7088, "total_steps": 9134, "loss": 0.894, "learning_rate": 5.938848204365016e-06, "epoch": 0.7759380388078492, "percentage": 77.6, "elapsed_time": "5 days, 10:14:45", "remaining_time": "1 day, 13:35:47", "throughput": 2730.12, "total_tokens": 1280114528} {"current_steps": 7089, "total_steps": 9134, "loss": 0.7342, "learning_rate": 5.933285578163586e-06, "epoch": 0.7760475108787871, "percentage": 77.61, "elapsed_time": "5 days, 10:15:46", "remaining_time": "1 day, 13:34:39", "throughput": 2730.11, "total_tokens": 1280276480} {"current_steps": 7090, "total_steps": 9134, "loss": 0.7912, "learning_rate": 5.927725207518023e-06, "epoch": 0.7761569829497249, "percentage": 77.62, "elapsed_time": "5 days, 10:16:51", "remaining_time": "1 day, 13:33:33", "throughput": 2730.1, "total_tokens": 1280450528} {"current_steps": 7091, "total_steps": 9134, "loss": 0.7341, "learning_rate": 5.922167093086107e-06, "epoch": 0.7762664550206628, "percentage": 77.63, "elapsed_time": "5 days, 10:17:59", "remaining_time": "1 day, 13:32:27", "throughput": 2730.14, "total_tokens": 1280652576} {"current_steps": 7092, "total_steps": 9134, "loss": 0.6909, "learning_rate": 5.916611235525346e-06, "epoch": 0.7763759270916007, "percentage": 77.64, "elapsed_time": "5 days, 10:19:06", "remaining_time": "1 day, 13:31:21", "throughput": 2730.19, "total_tokens": 1280861120} {"current_steps": 7093, "total_steps": 9134, "loss": 0.7855, "learning_rate": 5.9110576354930085e-06, "epoch": 0.7764853991625387, "percentage": 77.65, "elapsed_time": "5 days, 10:20:12", "remaining_time": "1 day, 13:30:15", "throughput": 2730.24, "total_tokens": 1281064512} {"current_steps": 7094, "total_steps": 9134, "loss": 0.8154, "learning_rate": 5.9055062936460484e-06, "epoch": 0.7765948712334766, "percentage": 77.67, "elapsed_time": "5 days, 10:21:20", "remaining_time": "1 day, 13:29:09", "throughput": 2730.27, "total_tokens": 1281263872} {"current_steps": 7095, "total_steps": 9134, "loss": 0.9646, "learning_rate": 5.899957210641205e-06, "epoch": 0.7767043433044145, "percentage": 77.68, "elapsed_time": "5 days, 10:22:24", "remaining_time": "1 day, 13:28:02", "throughput": 2730.28, "total_tokens": 1281441280} {"current_steps": 7096, "total_steps": 9134, "loss": 0.757, "learning_rate": 5.894410387134896e-06, "epoch": 0.7768138153753523, "percentage": 77.69, "elapsed_time": "5 days, 10:23:28", "remaining_time": "1 day, 13:26:55", "throughput": 2730.24, "total_tokens": 1281597184} {"current_steps": 7097, "total_steps": 9134, "loss": 0.7303, "learning_rate": 5.888865823783329e-06, "epoch": 0.7769232874462902, "percentage": 77.7, "elapsed_time": "5 days, 10:24:32", "remaining_time": "1 day, 13:25:49", "throughput": 2730.24, "total_tokens": 1281771456} {"current_steps": 7098, "total_steps": 9134, "loss": 0.9309, "learning_rate": 5.883323521242387e-06, "epoch": 0.7770327595172282, "percentage": 77.71, "elapsed_time": "5 days, 10:25:37", "remaining_time": "1 day, 13:24:42", "throughput": 2730.22, "total_tokens": 1281940800} {"current_steps": 7099, "total_steps": 9134, "loss": 0.8703, "learning_rate": 5.877783480167734e-06, "epoch": 0.7771422315881661, "percentage": 77.72, "elapsed_time": "5 days, 10:26:37", "remaining_time": "1 day, 13:23:34", "throughput": 2730.2, "total_tokens": 1282097152} {"current_steps": 7100, "total_steps": 9134, "loss": 0.869, "learning_rate": 5.872245701214741e-06, "epoch": 0.777251703659104, "percentage": 77.73, "elapsed_time": "5 days, 10:27:39", "remaining_time": "1 day, 13:22:27", "throughput": 2730.22, "total_tokens": 1282274560} {"current_steps": 7101, "total_steps": 9134, "loss": 0.7411, "learning_rate": 5.8667101850385045e-06, "epoch": 0.7773611757300418, "percentage": 77.74, "elapsed_time": "5 days, 10:28:43", "remaining_time": "1 day, 13:21:20", "throughput": 2730.24, "total_tokens": 1282458912} {"current_steps": 7102, "total_steps": 9134, "loss": 0.7192, "learning_rate": 5.861176932293894e-06, "epoch": 0.7774706478009797, "percentage": 77.75, "elapsed_time": "5 days, 10:29:50", "remaining_time": "1 day, 13:20:14", "throughput": 2730.25, "total_tokens": 1282643040} {"current_steps": 7103, "total_steps": 9134, "loss": 0.9403, "learning_rate": 5.855645943635449e-06, "epoch": 0.7775801198719177, "percentage": 77.76, "elapsed_time": "5 days, 10:30:57", "remaining_time": "1 day, 13:19:08", "throughput": 2730.25, "total_tokens": 1282827392} {"current_steps": 7104, "total_steps": 9134, "loss": 0.7367, "learning_rate": 5.850117219717507e-06, "epoch": 0.7776895919428556, "percentage": 77.78, "elapsed_time": "5 days, 10:31:59", "remaining_time": "1 day, 13:18:01", "throughput": 2730.22, "total_tokens": 1282984640} {"current_steps": 7105, "total_steps": 9134, "loss": 0.9722, "learning_rate": 5.8445907611940745e-06, "epoch": 0.7777990640137935, "percentage": 77.79, "elapsed_time": "5 days, 10:33:04", "remaining_time": "1 day, 13:16:55", "throughput": 2730.2, "total_tokens": 1283152864} {"current_steps": 7106, "total_steps": 9134, "loss": 0.7742, "learning_rate": 5.839066568718946e-06, "epoch": 0.7779085360847314, "percentage": 77.8, "elapsed_time": "5 days, 10:34:09", "remaining_time": "1 day, 13:15:48", "throughput": 2730.21, "total_tokens": 1283334080} {"current_steps": 7107, "total_steps": 9134, "loss": 0.8517, "learning_rate": 5.83354464294561e-06, "epoch": 0.7780180081556692, "percentage": 77.81, "elapsed_time": "5 days, 10:35:13", "remaining_time": "1 day, 13:14:41", "throughput": 2730.25, "total_tokens": 1283527616} {"current_steps": 7108, "total_steps": 9134, "loss": 1.0476, "learning_rate": 5.8280249845273025e-06, "epoch": 0.7781274802266072, "percentage": 77.82, "elapsed_time": "5 days, 10:36:20", "remaining_time": "1 day, 13:13:35", "throughput": 2730.28, "total_tokens": 1283724288} {"current_steps": 7109, "total_steps": 9134, "loss": 0.7596, "learning_rate": 5.822507594116988e-06, "epoch": 0.7782369522975451, "percentage": 77.83, "elapsed_time": "5 days, 10:37:25", "remaining_time": "1 day, 13:12:29", "throughput": 2730.31, "total_tokens": 1283916704} {"current_steps": 7110, "total_steps": 9134, "loss": 0.659, "learning_rate": 5.816992472367366e-06, "epoch": 0.778346424368483, "percentage": 77.84, "elapsed_time": "5 days, 10:38:27", "remaining_time": "1 day, 13:11:22", "throughput": 2730.34, "total_tokens": 1284100832} {"current_steps": 7111, "total_steps": 9134, "loss": 0.8332, "learning_rate": 5.811479619930862e-06, "epoch": 0.7784558964394209, "percentage": 77.85, "elapsed_time": "5 days, 10:39:32", "remaining_time": "1 day, 13:10:15", "throughput": 2730.37, "total_tokens": 1284288320} {"current_steps": 7112, "total_steps": 9134, "loss": 1.1182, "learning_rate": 5.80596903745963e-06, "epoch": 0.7785653685103588, "percentage": 77.86, "elapsed_time": "5 days, 10:40:35", "remaining_time": "1 day, 13:09:08", "throughput": 2730.39, "total_tokens": 1284474464} {"current_steps": 7113, "total_steps": 9134, "loss": 0.8664, "learning_rate": 5.800460725605575e-06, "epoch": 0.7786748405812967, "percentage": 77.87, "elapsed_time": "5 days, 10:41:39", "remaining_time": "1 day, 13:08:02", "throughput": 2730.41, "total_tokens": 1284657920} {"current_steps": 7114, "total_steps": 9134, "loss": 0.8599, "learning_rate": 5.794954685020312e-06, "epoch": 0.7787843126522346, "percentage": 77.88, "elapsed_time": "5 days, 10:42:40", "remaining_time": "1 day, 13:06:54", "throughput": 2730.4, "total_tokens": 1284817184} {"current_steps": 7115, "total_steps": 9134, "loss": 0.8686, "learning_rate": 5.7894509163551995e-06, "epoch": 0.7788937847231725, "percentage": 77.9, "elapsed_time": "5 days, 10:43:44", "remaining_time": "1 day, 13:05:47", "throughput": 2730.37, "total_tokens": 1284976896} {"current_steps": 7116, "total_steps": 9134, "loss": 0.9102, "learning_rate": 5.783949420261315e-06, "epoch": 0.7790032567941104, "percentage": 77.91, "elapsed_time": "5 days, 10:44:50", "remaining_time": "1 day, 13:04:41", "throughput": 2730.39, "total_tokens": 1285169088} {"current_steps": 7117, "total_steps": 9134, "loss": 0.9065, "learning_rate": 5.778450197389481e-06, "epoch": 0.7791127288650483, "percentage": 77.92, "elapsed_time": "5 days, 10:45:54", "remaining_time": "1 day, 13:03:34", "throughput": 2730.42, "total_tokens": 1285357248} {"current_steps": 7118, "total_steps": 9134, "loss": 0.6077, "learning_rate": 5.772953248390242e-06, "epoch": 0.7792222009359862, "percentage": 77.93, "elapsed_time": "5 days, 10:46:57", "remaining_time": "1 day, 13:02:27", "throughput": 2730.43, "total_tokens": 1285534432} {"current_steps": 7119, "total_steps": 9134, "loss": 0.8168, "learning_rate": 5.767458573913881e-06, "epoch": 0.7793316730069241, "percentage": 77.94, "elapsed_time": "5 days, 10:48:05", "remaining_time": "1 day, 13:01:21", "throughput": 2730.48, "total_tokens": 1285741856} {"current_steps": 7120, "total_steps": 9134, "loss": 0.8357, "learning_rate": 5.761966174610395e-06, "epoch": 0.779441145077862, "percentage": 77.95, "elapsed_time": "5 days, 10:49:11", "remaining_time": "1 day, 13:00:15", "throughput": 2730.52, "total_tokens": 1285939872} {"current_steps": 7121, "total_steps": 9134, "loss": 0.6239, "learning_rate": 5.756476051129542e-06, "epoch": 0.7795506171487999, "percentage": 77.96, "elapsed_time": "5 days, 10:50:17", "remaining_time": "1 day, 12:59:09", "throughput": 2730.5, "total_tokens": 1286115936} {"current_steps": 7122, "total_steps": 9134, "loss": 1.2033, "learning_rate": 5.750988204120783e-06, "epoch": 0.7796600892197378, "percentage": 77.97, "elapsed_time": "5 days, 10:51:23", "remaining_time": "1 day, 12:58:03", "throughput": 2730.57, "total_tokens": 1286327840} {"current_steps": 7123, "total_steps": 9134, "loss": 0.796, "learning_rate": 5.7455026342333215e-06, "epoch": 0.7797695612906758, "percentage": 77.98, "elapsed_time": "5 days, 10:52:27", "remaining_time": "1 day, 12:56:56", "throughput": 2730.58, "total_tokens": 1286504576} {"current_steps": 7124, "total_steps": 9134, "loss": 0.69, "learning_rate": 5.74001934211609e-06, "epoch": 0.7798790333616136, "percentage": 77.99, "elapsed_time": "5 days, 10:53:34", "remaining_time": "1 day, 12:55:50", "throughput": 2730.58, "total_tokens": 1286691616} {"current_steps": 7125, "total_steps": 9134, "loss": 0.6984, "learning_rate": 5.734538328417754e-06, "epoch": 0.7799885054325515, "percentage": 78.01, "elapsed_time": "5 days, 10:54:37", "remaining_time": "1 day, 12:54:43", "throughput": 2730.61, "total_tokens": 1286876192} {"current_steps": 7126, "total_steps": 9134, "loss": 0.824, "learning_rate": 5.729059593786701e-06, "epoch": 0.7800979775034894, "percentage": 78.02, "elapsed_time": "5 days, 10:55:42", "remaining_time": "1 day, 12:53:37", "throughput": 2730.67, "total_tokens": 1287077792} {"current_steps": 7127, "total_steps": 9134, "loss": 1.001, "learning_rate": 5.7235831388710524e-06, "epoch": 0.7802074495744273, "percentage": 78.03, "elapsed_time": "5 days, 10:56:48", "remaining_time": "1 day, 12:52:31", "throughput": 2730.68, "total_tokens": 1287267520} {"current_steps": 7128, "total_steps": 9134, "loss": 0.6067, "learning_rate": 5.718108964318683e-06, "epoch": 0.7803169216453653, "percentage": 78.04, "elapsed_time": "5 days, 10:57:56", "remaining_time": "1 day, 12:51:25", "throughput": 2730.7, "total_tokens": 1287458592} {"current_steps": 7129, "total_steps": 9134, "loss": 0.888, "learning_rate": 5.7126370707771495e-06, "epoch": 0.7804263937163032, "percentage": 78.05, "elapsed_time": "5 days, 10:59:01", "remaining_time": "1 day, 12:50:18", "throughput": 2730.68, "total_tokens": 1287629056} {"current_steps": 7130, "total_steps": 9134, "loss": 0.8089, "learning_rate": 5.707167458893786e-06, "epoch": 0.780535865787241, "percentage": 78.06, "elapsed_time": "5 days, 11:00:00", "remaining_time": "1 day, 12:49:10", "throughput": 2730.64, "total_tokens": 1287772640} {"current_steps": 7131, "total_steps": 9134, "loss": 0.7197, "learning_rate": 5.701700129315629e-06, "epoch": 0.7806453378581789, "percentage": 78.07, "elapsed_time": "5 days, 11:01:05", "remaining_time": "1 day, 12:48:04", "throughput": 2730.66, "total_tokens": 1287960576} {"current_steps": 7132, "total_steps": 9134, "loss": 0.7743, "learning_rate": 5.696235082689455e-06, "epoch": 0.7807548099291168, "percentage": 78.08, "elapsed_time": "5 days, 11:02:10", "remaining_time": "1 day, 12:46:57", "throughput": 2730.65, "total_tokens": 1288129472} {"current_steps": 7133, "total_steps": 9134, "loss": 1.0666, "learning_rate": 5.690772319661769e-06, "epoch": 0.7808642820000548, "percentage": 78.09, "elapsed_time": "5 days, 11:03:12", "remaining_time": "1 day, 12:45:50", "throughput": 2730.66, "total_tokens": 1288305312} {"current_steps": 7134, "total_steps": 9134, "loss": 0.8718, "learning_rate": 5.685311840878796e-06, "epoch": 0.7809737540709927, "percentage": 78.1, "elapsed_time": "5 days, 11:04:18", "remaining_time": "1 day, 12:44:44", "throughput": 2730.72, "total_tokens": 1288510720} {"current_steps": 7135, "total_steps": 9134, "loss": 0.7753, "learning_rate": 5.679853646986524e-06, "epoch": 0.7810832261419305, "percentage": 78.11, "elapsed_time": "5 days, 11:05:22", "remaining_time": "1 day, 12:43:37", "throughput": 2730.71, "total_tokens": 1288684096} {"current_steps": 7136, "total_steps": 9134, "loss": 0.9181, "learning_rate": 5.674397738630619e-06, "epoch": 0.7811926982128684, "percentage": 78.13, "elapsed_time": "5 days, 11:06:29", "remaining_time": "1 day, 12:42:31", "throughput": 2730.71, "total_tokens": 1288864864} {"current_steps": 7137, "total_steps": 9134, "loss": 1.0108, "learning_rate": 5.668944116456529e-06, "epoch": 0.7813021702838063, "percentage": 78.14, "elapsed_time": "5 days, 11:07:35", "remaining_time": "1 day, 12:41:25", "throughput": 2730.74, "total_tokens": 1289059968} {"current_steps": 7138, "total_steps": 9134, "loss": 1.027, "learning_rate": 5.663492781109381e-06, "epoch": 0.7814116423547443, "percentage": 78.15, "elapsed_time": "5 days, 11:08:42", "remaining_time": "1 day, 12:40:19", "throughput": 2730.81, "total_tokens": 1289279264} {"current_steps": 7139, "total_steps": 9134, "loss": 0.7495, "learning_rate": 5.658043733234081e-06, "epoch": 0.7815211144256822, "percentage": 78.16, "elapsed_time": "5 days, 11:09:49", "remaining_time": "1 day, 12:39:13", "throughput": 2730.83, "total_tokens": 1289470336} {"current_steps": 7140, "total_steps": 9134, "loss": 1.0545, "learning_rate": 5.65259697347523e-06, "epoch": 0.7816305864966201, "percentage": 78.17, "elapsed_time": "5 days, 11:10:55", "remaining_time": "1 day, 12:38:07", "throughput": 2730.85, "total_tokens": 1289658048} {"current_steps": 7141, "total_steps": 9134, "loss": 0.7799, "learning_rate": 5.647152502477171e-06, "epoch": 0.7817400585675579, "percentage": 78.18, "elapsed_time": "5 days, 11:12:00", "remaining_time": "1 day, 12:37:01", "throughput": 2730.86, "total_tokens": 1289839488} {"current_steps": 7142, "total_steps": 9134, "loss": 0.8366, "learning_rate": 5.641710320883975e-06, "epoch": 0.7818495306384958, "percentage": 78.19, "elapsed_time": "5 days, 11:13:05", "remaining_time": "1 day, 12:35:54", "throughput": 2730.85, "total_tokens": 1290011744} {"current_steps": 7143, "total_steps": 9134, "loss": 0.8165, "learning_rate": 5.636270429339436e-06, "epoch": 0.7819590027094337, "percentage": 78.2, "elapsed_time": "5 days, 11:14:05", "remaining_time": "1 day, 12:34:46", "throughput": 2730.79, "total_tokens": 1290148832} {"current_steps": 7144, "total_steps": 9134, "loss": 0.7619, "learning_rate": 5.630832828487101e-06, "epoch": 0.7820684747803717, "percentage": 78.21, "elapsed_time": "5 days, 11:15:10", "remaining_time": "1 day, 12:33:40", "throughput": 2730.8, "total_tokens": 1290331168} {"current_steps": 7145, "total_steps": 9134, "loss": 0.9793, "learning_rate": 5.625397518970199e-06, "epoch": 0.7821779468513096, "percentage": 78.22, "elapsed_time": "5 days, 11:16:18", "remaining_time": "1 day, 12:32:34", "throughput": 2730.89, "total_tokens": 1290560544} {"current_steps": 7146, "total_steps": 9134, "loss": 0.8817, "learning_rate": 5.619964501431743e-06, "epoch": 0.7822874189222475, "percentage": 78.24, "elapsed_time": "5 days, 11:17:23", "remaining_time": "1 day, 12:31:28", "throughput": 2730.96, "total_tokens": 1290773344} {"current_steps": 7147, "total_steps": 9134, "loss": 0.7341, "learning_rate": 5.614533776514436e-06, "epoch": 0.7823968909931853, "percentage": 78.25, "elapsed_time": "5 days, 11:18:31", "remaining_time": "1 day, 12:30:22", "throughput": 2730.93, "total_tokens": 1290940224} {"current_steps": 7148, "total_steps": 9134, "loss": 1.0079, "learning_rate": 5.609105344860724e-06, "epoch": 0.7825063630641232, "percentage": 78.26, "elapsed_time": "5 days, 11:19:39", "remaining_time": "1 day, 12:29:17", "throughput": 2731.0, "total_tokens": 1291160416} {"current_steps": 7149, "total_steps": 9134, "loss": 0.8004, "learning_rate": 5.603679207112781e-06, "epoch": 0.7826158351350612, "percentage": 78.27, "elapsed_time": "5 days, 11:20:44", "remaining_time": "1 day, 12:28:10", "throughput": 2730.99, "total_tokens": 1291334016} {"current_steps": 7150, "total_steps": 9134, "loss": 0.8687, "learning_rate": 5.598255363912508e-06, "epoch": 0.7827253072059991, "percentage": 78.28, "elapsed_time": "5 days, 11:21:51", "remaining_time": "1 day, 12:27:04", "throughput": 2731.04, "total_tokens": 1291542560} {"current_steps": 7151, "total_steps": 9134, "loss": 0.8457, "learning_rate": 5.592833815901538e-06, "epoch": 0.782834779276937, "percentage": 78.29, "elapsed_time": "5 days, 11:22:59", "remaining_time": "1 day, 12:25:58", "throughput": 2731.06, "total_tokens": 1291735648} {"current_steps": 7152, "total_steps": 9134, "loss": 0.8753, "learning_rate": 5.5874145637212245e-06, "epoch": 0.7829442513478748, "percentage": 78.3, "elapsed_time": "5 days, 11:24:06", "remaining_time": "1 day, 12:24:53", "throughput": 2731.13, "total_tokens": 1291952480} {"current_steps": 7153, "total_steps": 9134, "loss": 0.7886, "learning_rate": 5.581997608012651e-06, "epoch": 0.7830537234188127, "percentage": 78.31, "elapsed_time": "5 days, 11:25:12", "remaining_time": "1 day, 12:23:47", "throughput": 2731.17, "total_tokens": 1292151616} {"current_steps": 7154, "total_steps": 9134, "loss": 0.9653, "learning_rate": 5.576582949416648e-06, "epoch": 0.7831631954897507, "percentage": 78.32, "elapsed_time": "5 days, 11:26:18", "remaining_time": "1 day, 12:22:40", "throughput": 2731.2, "total_tokens": 1292345824} {"current_steps": 7155, "total_steps": 9134, "loss": 0.8671, "learning_rate": 5.571170588573751e-06, "epoch": 0.7832726675606886, "percentage": 78.33, "elapsed_time": "5 days, 11:27:22", "remaining_time": "1 day, 12:21:33", "throughput": 2731.2, "total_tokens": 1292519872} {"current_steps": 7156, "total_steps": 9134, "loss": 0.9059, "learning_rate": 5.56576052612423e-06, "epoch": 0.7833821396316265, "percentage": 78.34, "elapsed_time": "5 days, 11:28:29", "remaining_time": "1 day, 12:20:28", "throughput": 2731.24, "total_tokens": 1292719680} {"current_steps": 7157, "total_steps": 9134, "loss": 0.9734, "learning_rate": 5.560352762708088e-06, "epoch": 0.7834916117025644, "percentage": 78.36, "elapsed_time": "5 days, 11:29:36", "remaining_time": "1 day, 12:19:22", "throughput": 2731.26, "total_tokens": 1292913440} {"current_steps": 7158, "total_steps": 9134, "loss": 0.8488, "learning_rate": 5.554947298965052e-06, "epoch": 0.7836010837735022, "percentage": 78.37, "elapsed_time": "5 days, 11:30:34", "remaining_time": "1 day, 12:18:13", "throughput": 2731.2, "total_tokens": 1293044480} {"current_steps": 7159, "total_steps": 9134, "loss": 0.8337, "learning_rate": 5.5495441355345766e-06, "epoch": 0.7837105558444402, "percentage": 78.38, "elapsed_time": "5 days, 11:31:40", "remaining_time": "1 day, 12:17:07", "throughput": 2731.2, "total_tokens": 1293223232} {"current_steps": 7160, "total_steps": 9134, "loss": 0.7503, "learning_rate": 5.54414327305584e-06, "epoch": 0.7838200279153781, "percentage": 78.39, "elapsed_time": "5 days, 11:32:43", "remaining_time": "1 day, 12:16:00", "throughput": 2731.16, "total_tokens": 1293377568} {"current_steps": 7161, "total_steps": 9134, "loss": 0.605, "learning_rate": 5.538744712167776e-06, "epoch": 0.783929499986316, "percentage": 78.4, "elapsed_time": "5 days, 11:33:49", "remaining_time": "1 day, 12:14:54", "throughput": 2731.15, "total_tokens": 1293554528} {"current_steps": 7162, "total_steps": 9134, "loss": 0.8616, "learning_rate": 5.533348453508996e-06, "epoch": 0.7840389720572539, "percentage": 78.41, "elapsed_time": "5 days, 11:34:54", "remaining_time": "1 day, 12:13:47", "throughput": 2731.15, "total_tokens": 1293730816} {"current_steps": 7163, "total_steps": 9134, "loss": 0.9879, "learning_rate": 5.527954497717886e-06, "epoch": 0.7841484441281918, "percentage": 78.42, "elapsed_time": "5 days, 11:36:01", "remaining_time": "1 day, 12:12:42", "throughput": 2731.17, "total_tokens": 1293921216} {"current_steps": 7164, "total_steps": 9134, "loss": 0.9222, "learning_rate": 5.522562845432533e-06, "epoch": 0.7842579161991297, "percentage": 78.43, "elapsed_time": "5 days, 11:37:02", "remaining_time": "1 day, 12:11:34", "throughput": 2731.15, "total_tokens": 1294078016} {"current_steps": 7165, "total_steps": 9134, "loss": 0.9044, "learning_rate": 5.517173497290762e-06, "epoch": 0.7843673882700676, "percentage": 78.44, "elapsed_time": "5 days, 11:38:08", "remaining_time": "1 day, 12:10:28", "throughput": 2731.19, "total_tokens": 1294277376} {"current_steps": 7166, "total_steps": 9134, "loss": 0.8362, "learning_rate": 5.511786453930124e-06, "epoch": 0.7844768603410055, "percentage": 78.45, "elapsed_time": "5 days, 11:39:14", "remaining_time": "1 day, 12:09:22", "throughput": 2731.25, "total_tokens": 1294487712} {"current_steps": 7167, "total_steps": 9134, "loss": 0.9422, "learning_rate": 5.5064017159878826e-06, "epoch": 0.7845863324119434, "percentage": 78.47, "elapsed_time": "5 days, 11:40:21", "remaining_time": "1 day, 12:08:16", "throughput": 2731.29, "total_tokens": 1294690432} {"current_steps": 7168, "total_steps": 9134, "loss": 0.9463, "learning_rate": 5.501019284101067e-06, "epoch": 0.7846958044828813, "percentage": 78.48, "elapsed_time": "5 days, 11:41:24", "remaining_time": "1 day, 12:07:09", "throughput": 2731.25, "total_tokens": 1294843648} {"current_steps": 7169, "total_steps": 9134, "loss": 0.8343, "learning_rate": 5.495639158906382e-06, "epoch": 0.7848052765538192, "percentage": 78.49, "elapsed_time": "5 days, 11:42:25", "remaining_time": "1 day, 12:06:01", "throughput": 2731.21, "total_tokens": 1294992832} {"current_steps": 7170, "total_steps": 9134, "loss": 1.1909, "learning_rate": 5.490261341040312e-06, "epoch": 0.7849147486247571, "percentage": 78.5, "elapsed_time": "5 days, 11:43:27", "remaining_time": "1 day, 12:04:54", "throughput": 2731.23, "total_tokens": 1295171584} {"current_steps": 7171, "total_steps": 9134, "loss": 0.8948, "learning_rate": 5.4848858311390165e-06, "epoch": 0.785024220695695, "percentage": 78.51, "elapsed_time": "5 days, 11:44:32", "remaining_time": "1 day, 12:03:48", "throughput": 2731.25, "total_tokens": 1295358400} {"current_steps": 7172, "total_steps": 9134, "loss": 0.9567, "learning_rate": 5.479512629838426e-06, "epoch": 0.7851336927666329, "percentage": 78.52, "elapsed_time": "5 days, 11:45:35", "remaining_time": "1 day, 12:02:40", "throughput": 2731.21, "total_tokens": 1295507360} {"current_steps": 7173, "total_steps": 9134, "loss": 0.9231, "learning_rate": 5.4741417377741745e-06, "epoch": 0.7852431648375708, "percentage": 78.53, "elapsed_time": "5 days, 11:46:42", "remaining_time": "1 day, 12:01:35", "throughput": 2731.22, "total_tokens": 1295699104} {"current_steps": 7174, "total_steps": 9134, "loss": 0.6667, "learning_rate": 5.468773155581627e-06, "epoch": 0.7853526369085088, "percentage": 78.54, "elapsed_time": "5 days, 11:47:48", "remaining_time": "1 day, 12:00:28", "throughput": 2731.22, "total_tokens": 1295878752} {"current_steps": 7175, "total_steps": 9134, "loss": 0.8825, "learning_rate": 5.46340688389588e-06, "epoch": 0.7854621089794466, "percentage": 78.55, "elapsed_time": "5 days, 11:48:55", "remaining_time": "1 day, 11:59:23", "throughput": 2731.3, "total_tokens": 1296097376} {"current_steps": 7176, "total_steps": 9134, "loss": 0.8169, "learning_rate": 5.458042923351744e-06, "epoch": 0.7855715810503845, "percentage": 78.56, "elapsed_time": "5 days, 11:50:03", "remaining_time": "1 day, 11:58:17", "throughput": 2731.33, "total_tokens": 1296296736} {"current_steps": 7177, "total_steps": 9134, "loss": 0.7495, "learning_rate": 5.452681274583784e-06, "epoch": 0.7856810531213224, "percentage": 78.57, "elapsed_time": "5 days, 11:51:09", "remaining_time": "1 day, 11:57:11", "throughput": 2731.33, "total_tokens": 1296479520} {"current_steps": 7178, "total_steps": 9134, "loss": 0.5854, "learning_rate": 5.447321938226249e-06, "epoch": 0.7857905251922603, "percentage": 78.59, "elapsed_time": "5 days, 11:52:13", "remaining_time": "1 day, 11:56:04", "throughput": 2731.34, "total_tokens": 1296658496} {"current_steps": 7179, "total_steps": 9134, "loss": 0.8077, "learning_rate": 5.441964914913164e-06, "epoch": 0.7858999972631983, "percentage": 78.6, "elapsed_time": "5 days, 11:53:15", "remaining_time": "1 day, 11:54:57", "throughput": 2731.34, "total_tokens": 1296829408} {"current_steps": 7180, "total_steps": 9134, "loss": 0.6957, "learning_rate": 5.436610205278228e-06, "epoch": 0.7860094693341362, "percentage": 78.61, "elapsed_time": "5 days, 11:54:23", "remaining_time": "1 day, 11:53:51", "throughput": 2731.39, "total_tokens": 1297037504} {"current_steps": 7181, "total_steps": 9134, "loss": 0.7868, "learning_rate": 5.4312578099549125e-06, "epoch": 0.786118941405074, "percentage": 78.62, "elapsed_time": "5 days, 11:55:29", "remaining_time": "1 day, 11:52:45", "throughput": 2731.39, "total_tokens": 1297217824} {"current_steps": 7182, "total_steps": 9134, "loss": 0.7377, "learning_rate": 5.425907729576388e-06, "epoch": 0.7862284134760119, "percentage": 78.63, "elapsed_time": "5 days, 11:56:36", "remaining_time": "1 day, 11:51:39", "throughput": 2731.41, "total_tokens": 1297409792} {"current_steps": 7183, "total_steps": 9134, "loss": 1.0815, "learning_rate": 5.42055996477556e-06, "epoch": 0.7863378855469498, "percentage": 78.64, "elapsed_time": "5 days, 11:57:43", "remaining_time": "1 day, 11:50:33", "throughput": 2731.46, "total_tokens": 1297616096} {"current_steps": 7184, "total_steps": 9134, "loss": 0.7193, "learning_rate": 5.415214516185061e-06, "epoch": 0.7864473576178878, "percentage": 78.65, "elapsed_time": "5 days, 11:58:50", "remaining_time": "1 day, 11:49:27", "throughput": 2731.51, "total_tokens": 1297822848} {"current_steps": 7185, "total_steps": 9134, "loss": 0.7032, "learning_rate": 5.409871384437234e-06, "epoch": 0.7865568296888257, "percentage": 78.66, "elapsed_time": "5 days, 11:59:53", "remaining_time": "1 day, 11:48:20", "throughput": 2731.53, "total_tokens": 1298005184} {"current_steps": 7186, "total_steps": 9134, "loss": 0.6884, "learning_rate": 5.404530570164187e-06, "epoch": 0.7866663017597635, "percentage": 78.67, "elapsed_time": "5 days, 12:01:00", "remaining_time": "1 day, 11:47:14", "throughput": 2731.53, "total_tokens": 1298186624} {"current_steps": 7187, "total_steps": 9134, "loss": 0.7827, "learning_rate": 5.399192073997703e-06, "epoch": 0.7867757738307014, "percentage": 78.68, "elapsed_time": "5 days, 12:02:01", "remaining_time": "1 day, 11:46:07", "throughput": 2731.49, "total_tokens": 1298337376} {"current_steps": 7188, "total_steps": 9134, "loss": 0.6941, "learning_rate": 5.39385589656933e-06, "epoch": 0.7868852459016393, "percentage": 78.69, "elapsed_time": "5 days, 12:03:08", "remaining_time": "1 day, 11:45:01", "throughput": 2731.5, "total_tokens": 1298523520} {"current_steps": 7189, "total_steps": 9134, "loss": 0.7276, "learning_rate": 5.3885220385103245e-06, "epoch": 0.7869947179725773, "percentage": 78.71, "elapsed_time": "5 days, 12:04:16", "remaining_time": "1 day, 11:43:55", "throughput": 2731.54, "total_tokens": 1298726464} {"current_steps": 7190, "total_steps": 9134, "loss": 0.9199, "learning_rate": 5.383190500451671e-06, "epoch": 0.7871041900435152, "percentage": 78.72, "elapsed_time": "5 days, 12:05:23", "remaining_time": "1 day, 11:42:50", "throughput": 2731.55, "total_tokens": 1298916192} {"current_steps": 7191, "total_steps": 9134, "loss": 0.6858, "learning_rate": 5.3778612830240795e-06, "epoch": 0.7872136621144531, "percentage": 78.73, "elapsed_time": "5 days, 12:06:23", "remaining_time": "1 day, 11:41:42", "throughput": 2731.5, "total_tokens": 1299055296} {"current_steps": 7192, "total_steps": 9134, "loss": 0.8372, "learning_rate": 5.372534386857988e-06, "epoch": 0.7873231341853909, "percentage": 78.74, "elapsed_time": "5 days, 12:07:27", "remaining_time": "1 day, 11:40:35", "throughput": 2731.47, "total_tokens": 1299217920} {"current_steps": 7193, "total_steps": 9134, "loss": 0.7408, "learning_rate": 5.367209812583557e-06, "epoch": 0.7874326062563288, "percentage": 78.75, "elapsed_time": "5 days, 12:08:35", "remaining_time": "1 day, 11:39:29", "throughput": 2731.46, "total_tokens": 1299400032} {"current_steps": 7194, "total_steps": 9134, "loss": 0.9779, "learning_rate": 5.361887560830675e-06, "epoch": 0.7875420783272667, "percentage": 78.76, "elapsed_time": "5 days, 12:09:38", "remaining_time": "1 day, 11:38:22", "throughput": 2731.49, "total_tokens": 1299587296} {"current_steps": 7195, "total_steps": 9134, "loss": 0.782, "learning_rate": 5.356567632228943e-06, "epoch": 0.7876515503982047, "percentage": 78.77, "elapsed_time": "5 days, 12:10:43", "remaining_time": "1 day, 11:37:16", "throughput": 2731.48, "total_tokens": 1299755520} {"current_steps": 7196, "total_steps": 9134, "loss": 1.1653, "learning_rate": 5.351250027407717e-06, "epoch": 0.7877610224691426, "percentage": 78.78, "elapsed_time": "5 days, 12:11:45", "remaining_time": "1 day, 11:36:09", "throughput": 2731.46, "total_tokens": 1299918144} {"current_steps": 7197, "total_steps": 9134, "loss": 0.8483, "learning_rate": 5.345934746996051e-06, "epoch": 0.7878704945400805, "percentage": 78.79, "elapsed_time": "5 days, 12:12:46", "remaining_time": "1 day, 11:35:01", "throughput": 2731.48, "total_tokens": 1300093088} {"current_steps": 7198, "total_steps": 9134, "loss": 0.7346, "learning_rate": 5.340621791622733e-06, "epoch": 0.7879799666110183, "percentage": 78.8, "elapsed_time": "5 days, 12:13:52", "remaining_time": "1 day, 11:33:55", "throughput": 2731.47, "total_tokens": 1300265792} {"current_steps": 7199, "total_steps": 9134, "loss": 0.6802, "learning_rate": 5.335311161916273e-06, "epoch": 0.7880894386819562, "percentage": 78.82, "elapsed_time": "5 days, 12:14:56", "remaining_time": "1 day, 11:32:48", "throughput": 2731.49, "total_tokens": 1300451712} {"current_steps": 7200, "total_steps": 9134, "loss": 0.6344, "learning_rate": 5.330002858504904e-06, "epoch": 0.7881989107528942, "percentage": 78.83, "elapsed_time": "5 days, 12:16:04", "remaining_time": "1 day, 11:31:43", "throughput": 2731.5, "total_tokens": 1300640768} {"current_steps": 7201, "total_steps": 9134, "loss": 1.0618, "learning_rate": 5.324696882016606e-06, "epoch": 0.7883083828238321, "percentage": 78.84, "elapsed_time": "5 days, 12:17:06", "remaining_time": "1 day, 11:30:35", "throughput": 2731.5, "total_tokens": 1300811680} {"current_steps": 7202, "total_steps": 9134, "loss": 0.768, "learning_rate": 5.319393233079042e-06, "epoch": 0.78841785489477, "percentage": 78.85, "elapsed_time": "5 days, 12:18:11", "remaining_time": "1 day, 11:29:29", "throughput": 2731.49, "total_tokens": 1300986848} {"current_steps": 7203, "total_steps": 9134, "loss": 0.8251, "learning_rate": 5.314091912319649e-06, "epoch": 0.7885273269657078, "percentage": 78.86, "elapsed_time": "5 days, 12:19:17", "remaining_time": "1 day, 11:28:23", "throughput": 2731.47, "total_tokens": 1301154400} {"current_steps": 7204, "total_steps": 9134, "loss": 0.9199, "learning_rate": 5.3087929203655375e-06, "epoch": 0.7886367990366457, "percentage": 78.87, "elapsed_time": "5 days, 12:20:21", "remaining_time": "1 day, 11:27:16", "throughput": 2731.49, "total_tokens": 1301341216} {"current_steps": 7205, "total_steps": 9134, "loss": 0.5308, "learning_rate": 5.303496257843585e-06, "epoch": 0.7887462711075837, "percentage": 78.88, "elapsed_time": "5 days, 12:21:25", "remaining_time": "1 day, 11:26:09", "throughput": 2731.49, "total_tokens": 1301513472} {"current_steps": 7206, "total_steps": 9134, "loss": 0.812, "learning_rate": 5.2982019253803725e-06, "epoch": 0.7888557431785216, "percentage": 78.89, "elapsed_time": "5 days, 12:22:31", "remaining_time": "1 day, 11:25:03", "throughput": 2731.5, "total_tokens": 1301702752} {"current_steps": 7207, "total_steps": 9134, "loss": 0.8791, "learning_rate": 5.29290992360221e-06, "epoch": 0.7889652152494595, "percentage": 78.9, "elapsed_time": "5 days, 12:23:37", "remaining_time": "1 day, 11:23:57", "throughput": 2731.56, "total_tokens": 1301909504} {"current_steps": 7208, "total_steps": 9134, "loss": 0.792, "learning_rate": 5.2876202531351285e-06, "epoch": 0.7890746873203974, "percentage": 78.91, "elapsed_time": "5 days, 12:24:43", "remaining_time": "1 day, 11:22:51", "throughput": 2731.56, "total_tokens": 1302091840} {"current_steps": 7209, "total_steps": 9134, "loss": 0.8927, "learning_rate": 5.2823329146048815e-06, "epoch": 0.7891841593913352, "percentage": 78.92, "elapsed_time": "5 days, 12:25:50", "remaining_time": "1 day, 11:21:45", "throughput": 2731.55, "total_tokens": 1302268128} {"current_steps": 7210, "total_steps": 9134, "loss": 0.8556, "learning_rate": 5.27704790863697e-06, "epoch": 0.7892936314622732, "percentage": 78.94, "elapsed_time": "5 days, 12:26:47", "remaining_time": "1 day, 11:20:36", "throughput": 2731.51, "total_tokens": 1302402528} {"current_steps": 7211, "total_steps": 9134, "loss": 0.9642, "learning_rate": 5.271765235856574e-06, "epoch": 0.7894031035332111, "percentage": 78.95, "elapsed_time": "5 days, 12:27:48", "remaining_time": "1 day, 11:19:29", "throughput": 2731.5, "total_tokens": 1302564480} {"current_steps": 7212, "total_steps": 9134, "loss": 0.7, "learning_rate": 5.266484896888649e-06, "epoch": 0.789512575604149, "percentage": 78.96, "elapsed_time": "5 days, 12:28:50", "remaining_time": "1 day, 11:18:21", "throughput": 2731.5, "total_tokens": 1302734720} {"current_steps": 7213, "total_steps": 9134, "loss": 0.6713, "learning_rate": 5.261206892357825e-06, "epoch": 0.7896220476750869, "percentage": 78.97, "elapsed_time": "5 days, 12:29:55", "remaining_time": "1 day, 11:17:15", "throughput": 2731.55, "total_tokens": 1302937664} {"current_steps": 7214, "total_steps": 9134, "loss": 0.7201, "learning_rate": 5.255931222888497e-06, "epoch": 0.7897315197460248, "percentage": 78.98, "elapsed_time": "5 days, 12:31:02", "remaining_time": "1 day, 11:16:09", "throughput": 2731.55, "total_tokens": 1303122016} {"current_steps": 7215, "total_steps": 9134, "loss": 1.0483, "learning_rate": 5.25065788910476e-06, "epoch": 0.7898409918169627, "percentage": 78.99, "elapsed_time": "5 days, 12:32:08", "remaining_time": "1 day, 11:15:03", "throughput": 2731.6, "total_tokens": 1303321152} {"current_steps": 7216, "total_steps": 9134, "loss": 0.9278, "learning_rate": 5.245386891630441e-06, "epoch": 0.7899504638879006, "percentage": 79.0, "elapsed_time": "5 days, 12:33:15", "remaining_time": "1 day, 11:13:57", "throughput": 2731.6, "total_tokens": 1303507520} {"current_steps": 7217, "total_steps": 9134, "loss": 1.0411, "learning_rate": 5.240118231089089e-06, "epoch": 0.7900599359588385, "percentage": 79.01, "elapsed_time": "5 days, 12:34:22", "remaining_time": "1 day, 11:12:51", "throughput": 2731.57, "total_tokens": 1303677312} {"current_steps": 7218, "total_steps": 9134, "loss": 0.8597, "learning_rate": 5.234851908103969e-06, "epoch": 0.7901694080297764, "percentage": 79.02, "elapsed_time": "5 days, 12:35:26", "remaining_time": "1 day, 11:11:45", "throughput": 2731.59, "total_tokens": 1303861888} {"current_steps": 7219, "total_steps": 9134, "loss": 0.689, "learning_rate": 5.229587923298099e-06, "epoch": 0.7902788801007143, "percentage": 79.03, "elapsed_time": "5 days, 12:36:30", "remaining_time": "1 day, 11:10:38", "throughput": 2731.6, "total_tokens": 1304040192} {"current_steps": 7220, "total_steps": 9134, "loss": 0.8445, "learning_rate": 5.224326277294167e-06, "epoch": 0.7903883521716522, "percentage": 79.05, "elapsed_time": "5 days, 12:37:34", "remaining_time": "1 day, 11:09:31", "throughput": 2731.63, "total_tokens": 1304228128} {"current_steps": 7221, "total_steps": 9134, "loss": 0.9796, "learning_rate": 5.219066970714639e-06, "epoch": 0.7904978242425901, "percentage": 79.06, "elapsed_time": "5 days, 12:38:38", "remaining_time": "1 day, 11:08:25", "throughput": 2731.64, "total_tokens": 1304409568} {"current_steps": 7222, "total_steps": 9134, "loss": 0.7517, "learning_rate": 5.2138100041816736e-06, "epoch": 0.790607296313528, "percentage": 79.07, "elapsed_time": "5 days, 12:39:43", "remaining_time": "1 day, 11:07:18", "throughput": 2731.66, "total_tokens": 1304597728} {"current_steps": 7223, "total_steps": 9134, "loss": 0.8287, "learning_rate": 5.208555378317159e-06, "epoch": 0.7907167683844659, "percentage": 79.08, "elapsed_time": "5 days, 12:40:48", "remaining_time": "1 day, 11:06:12", "throughput": 2731.65, "total_tokens": 1304768416} {"current_steps": 7224, "total_steps": 9134, "loss": 0.7679, "learning_rate": 5.203303093742712e-06, "epoch": 0.7908262404554038, "percentage": 79.09, "elapsed_time": "5 days, 12:41:55", "remaining_time": "1 day, 11:05:06", "throughput": 2731.65, "total_tokens": 1304953888} {"current_steps": 7225, "total_steps": 9134, "loss": 0.879, "learning_rate": 5.1980531510796595e-06, "epoch": 0.7909357125263418, "percentage": 79.1, "elapsed_time": "5 days, 12:42:58", "remaining_time": "1 day, 11:03:59", "throughput": 2731.68, "total_tokens": 1305138240} {"current_steps": 7226, "total_steps": 9134, "loss": 0.9277, "learning_rate": 5.192805550949068e-06, "epoch": 0.7910451845972796, "percentage": 79.11, "elapsed_time": "5 days, 12:44:00", "remaining_time": "1 day, 11:02:52", "throughput": 2731.69, "total_tokens": 1305310496} {"current_steps": 7227, "total_steps": 9134, "loss": 1.0396, "learning_rate": 5.187560293971705e-06, "epoch": 0.7911546566682175, "percentage": 79.12, "elapsed_time": "5 days, 12:45:04", "remaining_time": "1 day, 11:01:45", "throughput": 2731.7, "total_tokens": 1305491264} {"current_steps": 7228, "total_steps": 9134, "loss": 0.6558, "learning_rate": 5.182317380768092e-06, "epoch": 0.7912641287391554, "percentage": 79.13, "elapsed_time": "5 days, 12:46:06", "remaining_time": "1 day, 11:00:38", "throughput": 2731.7, "total_tokens": 1305661056} {"current_steps": 7229, "total_steps": 9134, "loss": 0.7057, "learning_rate": 5.177076811958451e-06, "epoch": 0.7913736008100933, "percentage": 79.14, "elapsed_time": "5 days, 12:47:02", "remaining_time": "1 day, 10:59:29", "throughput": 2731.66, "total_tokens": 1305797920} {"current_steps": 7230, "total_steps": 9134, "loss": 0.788, "learning_rate": 5.171838588162725e-06, "epoch": 0.7914830728810313, "percentage": 79.15, "elapsed_time": "5 days, 12:48:03", "remaining_time": "1 day, 10:58:22", "throughput": 2731.61, "total_tokens": 1305939264} {"current_steps": 7231, "total_steps": 9134, "loss": 0.6852, "learning_rate": 5.16660271000059e-06, "epoch": 0.7915925449519692, "percentage": 79.17, "elapsed_time": "5 days, 12:49:08", "remaining_time": "1 day, 10:57:15", "throughput": 2731.63, "total_tokens": 1306124512} {"current_steps": 7232, "total_steps": 9134, "loss": 0.804, "learning_rate": 5.161369178091438e-06, "epoch": 0.791702017022907, "percentage": 79.18, "elapsed_time": "5 days, 12:50:12", "remaining_time": "1 day, 10:56:08", "throughput": 2731.64, "total_tokens": 1306303936} {"current_steps": 7233, "total_steps": 9134, "loss": 0.9677, "learning_rate": 5.1561379930543885e-06, "epoch": 0.7918114890938449, "percentage": 79.19, "elapsed_time": "5 days, 12:51:18", "remaining_time": "1 day, 10:55:02", "throughput": 2731.67, "total_tokens": 1306499936} {"current_steps": 7234, "total_steps": 9134, "loss": 0.8378, "learning_rate": 5.1509091555082794e-06, "epoch": 0.7919209611647828, "percentage": 79.2, "elapsed_time": "5 days, 12:52:25", "remaining_time": "1 day, 10:53:56", "throughput": 2731.72, "total_tokens": 1306706688} {"current_steps": 7235, "total_steps": 9134, "loss": 1.0767, "learning_rate": 5.145682666071663e-06, "epoch": 0.7920304332357208, "percentage": 79.21, "elapsed_time": "5 days, 12:53:32", "remaining_time": "1 day, 10:52:50", "throughput": 2731.77, "total_tokens": 1306913888} {"current_steps": 7236, "total_steps": 9134, "loss": 0.7659, "learning_rate": 5.140458525362848e-06, "epoch": 0.7921399053066587, "percentage": 79.22, "elapsed_time": "5 days, 12:54:29", "remaining_time": "1 day, 10:51:42", "throughput": 2731.72, "total_tokens": 1307046944} {"current_steps": 7237, "total_steps": 9134, "loss": 0.7439, "learning_rate": 5.135236733999813e-06, "epoch": 0.7922493773775965, "percentage": 79.23, "elapsed_time": "5 days, 12:55:35", "remaining_time": "1 day, 10:50:36", "throughput": 2731.76, "total_tokens": 1307246528} {"current_steps": 7238, "total_steps": 9134, "loss": 0.9518, "learning_rate": 5.1300172926003e-06, "epoch": 0.7923588494485344, "percentage": 79.24, "elapsed_time": "5 days, 12:56:41", "remaining_time": "1 day, 10:49:30", "throughput": 2731.79, "total_tokens": 1307440064} {"current_steps": 7239, "total_steps": 9134, "loss": 0.9752, "learning_rate": 5.1248002017817596e-06, "epoch": 0.7924683215194723, "percentage": 79.25, "elapsed_time": "5 days, 12:57:46", "remaining_time": "1 day, 10:48:23", "throughput": 2731.81, "total_tokens": 1307623744} {"current_steps": 7240, "total_steps": 9134, "loss": 0.7972, "learning_rate": 5.119585462161358e-06, "epoch": 0.7925777935904103, "percentage": 79.26, "elapsed_time": "5 days, 12:58:54", "remaining_time": "1 day, 10:47:17", "throughput": 2731.84, "total_tokens": 1307824448} {"current_steps": 7241, "total_steps": 9134, "loss": 1.0068, "learning_rate": 5.114373074355994e-06, "epoch": 0.7926872656613482, "percentage": 79.28, "elapsed_time": "5 days, 13:00:01", "remaining_time": "1 day, 10:46:12", "throughput": 2731.89, "total_tokens": 1308033888} {"current_steps": 7242, "total_steps": 9134, "loss": 0.9101, "learning_rate": 5.10916303898227e-06, "epoch": 0.7927967377322861, "percentage": 79.29, "elapsed_time": "5 days, 13:01:09", "remaining_time": "1 day, 10:45:06", "throughput": 2731.87, "total_tokens": 1308208832} {"current_steps": 7243, "total_steps": 9134, "loss": 0.9809, "learning_rate": 5.1039553566565505e-06, "epoch": 0.7929062098032239, "percentage": 79.3, "elapsed_time": "5 days, 13:02:14", "remaining_time": "1 day, 10:44:00", "throughput": 2731.91, "total_tokens": 1308407072} {"current_steps": 7244, "total_steps": 9134, "loss": 0.6347, "learning_rate": 5.098750027994862e-06, "epoch": 0.7930156818741618, "percentage": 79.31, "elapsed_time": "5 days, 13:03:20", "remaining_time": "1 day, 10:42:53", "throughput": 2731.9, "total_tokens": 1308583808} {"current_steps": 7245, "total_steps": 9134, "loss": 0.6307, "learning_rate": 5.0935470536130155e-06, "epoch": 0.7931251539450997, "percentage": 79.32, "elapsed_time": "5 days, 13:04:27", "remaining_time": "1 day, 10:41:47", "throughput": 2731.89, "total_tokens": 1308761440} {"current_steps": 7246, "total_steps": 9134, "loss": 0.8108, "learning_rate": 5.088346434126481e-06, "epoch": 0.7932346260160377, "percentage": 79.33, "elapsed_time": "5 days, 13:05:31", "remaining_time": "1 day, 10:40:41", "throughput": 2731.86, "total_tokens": 1308919808} {"current_steps": 7247, "total_steps": 9134, "loss": 0.7119, "learning_rate": 5.083148170150509e-06, "epoch": 0.7933440980869756, "percentage": 79.34, "elapsed_time": "5 days, 13:06:34", "remaining_time": "1 day, 10:39:34", "throughput": 2731.87, "total_tokens": 1309096320} {"current_steps": 7248, "total_steps": 9134, "loss": 0.8216, "learning_rate": 5.0779522623000345e-06, "epoch": 0.7934535701579135, "percentage": 79.35, "elapsed_time": "5 days, 13:07:38", "remaining_time": "1 day, 10:38:27", "throughput": 2731.86, "total_tokens": 1309264768} {"current_steps": 7249, "total_steps": 9134, "loss": 1.054, "learning_rate": 5.072758711189721e-06, "epoch": 0.7935630422288513, "percentage": 79.36, "elapsed_time": "5 days, 13:08:44", "remaining_time": "1 day, 10:37:21", "throughput": 2731.89, "total_tokens": 1309460768} {"current_steps": 7250, "total_steps": 9134, "loss": 0.7784, "learning_rate": 5.067567517433958e-06, "epoch": 0.7936725142997892, "percentage": 79.37, "elapsed_time": "5 days, 13:09:49", "remaining_time": "1 day, 10:36:15", "throughput": 2731.92, "total_tokens": 1309654752} {"current_steps": 7251, "total_steps": 9134, "loss": 0.8269, "learning_rate": 5.062378681646845e-06, "epoch": 0.7937819863707272, "percentage": 79.38, "elapsed_time": "5 days, 13:10:55", "remaining_time": "1 day, 10:35:08", "throughput": 2731.93, "total_tokens": 1309837536} {"current_steps": 7252, "total_steps": 9134, "loss": 0.8039, "learning_rate": 5.057192204442235e-06, "epoch": 0.7938914584416651, "percentage": 79.4, "elapsed_time": "5 days, 13:12:00", "remaining_time": "1 day, 10:34:02", "throughput": 2731.95, "total_tokens": 1310024576} {"current_steps": 7253, "total_steps": 9134, "loss": 0.7508, "learning_rate": 5.052008086433649e-06, "epoch": 0.794000930512603, "percentage": 79.41, "elapsed_time": "5 days, 13:13:02", "remaining_time": "1 day, 10:32:55", "throughput": 2731.89, "total_tokens": 1310167264} {"current_steps": 7254, "total_steps": 9134, "loss": 0.8507, "learning_rate": 5.046826328234386e-06, "epoch": 0.7941104025835408, "percentage": 79.42, "elapsed_time": "5 days, 13:14:06", "remaining_time": "1 day, 10:31:48", "throughput": 2731.86, "total_tokens": 1310328320} {"current_steps": 7255, "total_steps": 9134, "loss": 0.8398, "learning_rate": 5.041646930457411e-06, "epoch": 0.7942198746544787, "percentage": 79.43, "elapsed_time": "5 days, 13:15:08", "remaining_time": "1 day, 10:30:41", "throughput": 2731.86, "total_tokens": 1310496992} {"current_steps": 7256, "total_steps": 9134, "loss": 0.5934, "learning_rate": 5.0364698937154565e-06, "epoch": 0.7943293467254167, "percentage": 79.44, "elapsed_time": "5 days, 13:16:13", "remaining_time": "1 day, 10:29:35", "throughput": 2731.85, "total_tokens": 1310669920} {"current_steps": 7257, "total_steps": 9134, "loss": 0.9749, "learning_rate": 5.031295218620952e-06, "epoch": 0.7944388187963546, "percentage": 79.45, "elapsed_time": "5 days, 13:17:20", "remaining_time": "1 day, 10:28:29", "throughput": 2731.91, "total_tokens": 1310882944} {"current_steps": 7258, "total_steps": 9134, "loss": 0.7317, "learning_rate": 5.026122905786046e-06, "epoch": 0.7945482908672925, "percentage": 79.46, "elapsed_time": "5 days, 13:18:19", "remaining_time": "1 day, 10:27:21", "throughput": 2731.86, "total_tokens": 1311019360} {"current_steps": 7259, "total_steps": 9134, "loss": 0.8124, "learning_rate": 5.020952955822619e-06, "epoch": 0.7946577629382304, "percentage": 79.47, "elapsed_time": "5 days, 13:19:25", "remaining_time": "1 day, 10:26:15", "throughput": 2731.85, "total_tokens": 1311194752} {"current_steps": 7260, "total_steps": 9134, "loss": 0.9262, "learning_rate": 5.015785369342255e-06, "epoch": 0.7947672350091682, "percentage": 79.48, "elapsed_time": "5 days, 13:20:28", "remaining_time": "1 day, 10:25:08", "throughput": 2731.85, "total_tokens": 1311364992} {"current_steps": 7261, "total_steps": 9134, "loss": 0.8334, "learning_rate": 5.010620146956293e-06, "epoch": 0.7948767070801062, "percentage": 79.49, "elapsed_time": "5 days, 13:21:32", "remaining_time": "1 day, 10:24:01", "throughput": 2731.82, "total_tokens": 1311524928} {"current_steps": 7262, "total_steps": 9134, "loss": 0.9194, "learning_rate": 5.0054572892757416e-06, "epoch": 0.7949861791510441, "percentage": 79.51, "elapsed_time": "5 days, 13:22:39", "remaining_time": "1 day, 10:22:55", "throughput": 2731.84, "total_tokens": 1311721600} {"current_steps": 7263, "total_steps": 9134, "loss": 0.8079, "learning_rate": 5.000296796911377e-06, "epoch": 0.795095651221982, "percentage": 79.52, "elapsed_time": "5 days, 13:23:45", "remaining_time": "1 day, 10:21:49", "throughput": 2731.85, "total_tokens": 1311903040} {"current_steps": 7264, "total_steps": 9134, "loss": 0.7586, "learning_rate": 4.995138670473667e-06, "epoch": 0.7952051232929199, "percentage": 79.53, "elapsed_time": "5 days, 13:24:48", "remaining_time": "1 day, 10:20:42", "throughput": 2731.9, "total_tokens": 1312098592} {"current_steps": 7265, "total_steps": 9134, "loss": 0.947, "learning_rate": 4.98998291057281e-06, "epoch": 0.7953145953638578, "percentage": 79.54, "elapsed_time": "5 days, 13:25:56", "remaining_time": "1 day, 10:19:36", "throughput": 2731.96, "total_tokens": 1312314080} {"current_steps": 7266, "total_steps": 9134, "loss": 0.8285, "learning_rate": 4.984829517818723e-06, "epoch": 0.7954240674347957, "percentage": 79.55, "elapsed_time": "5 days, 13:27:02", "remaining_time": "1 day, 10:18:30", "throughput": 2731.99, "total_tokens": 1312511200} {"current_steps": 7267, "total_steps": 9134, "loss": 0.9699, "learning_rate": 4.979678492821041e-06, "epoch": 0.7955335395057336, "percentage": 79.56, "elapsed_time": "5 days, 13:28:06", "remaining_time": "1 day, 10:17:24", "throughput": 2732.0, "total_tokens": 1312689056} {"current_steps": 7268, "total_steps": 9134, "loss": 0.9445, "learning_rate": 4.974529836189113e-06, "epoch": 0.7956430115766715, "percentage": 79.57, "elapsed_time": "5 days, 13:29:13", "remaining_time": "1 day, 10:16:18", "throughput": 2732.03, "total_tokens": 1312887968} {"current_steps": 7269, "total_steps": 9134, "loss": 0.841, "learning_rate": 4.969383548532031e-06, "epoch": 0.7957524836476094, "percentage": 79.58, "elapsed_time": "5 days, 13:30:17", "remaining_time": "1 day, 10:15:11", "throughput": 2732.04, "total_tokens": 1313066048} {"current_steps": 7270, "total_steps": 9134, "loss": 0.692, "learning_rate": 4.9642396304585834e-06, "epoch": 0.7958619557185473, "percentage": 79.59, "elapsed_time": "5 days, 13:31:17", "remaining_time": "1 day, 10:14:03", "throughput": 2732.01, "total_tokens": 1313217920} {"current_steps": 7271, "total_steps": 9134, "loss": 0.8613, "learning_rate": 4.959098082577284e-06, "epoch": 0.7959714277894852, "percentage": 79.6, "elapsed_time": "5 days, 13:32:21", "remaining_time": "1 day, 10:12:57", "throughput": 2732.0, "total_tokens": 1313387264} {"current_steps": 7272, "total_steps": 9134, "loss": 0.8678, "learning_rate": 4.953958905496372e-06, "epoch": 0.7960808998604231, "percentage": 79.61, "elapsed_time": "5 days, 13:33:28", "remaining_time": "1 day, 10:11:51", "throughput": 2732.02, "total_tokens": 1313579008} {"current_steps": 7273, "total_steps": 9134, "loss": 0.7518, "learning_rate": 4.948822099823797e-06, "epoch": 0.796190371931361, "percentage": 79.63, "elapsed_time": "5 days, 13:34:33", "remaining_time": "1 day, 10:10:44", "throughput": 2732.03, "total_tokens": 1313761792} {"current_steps": 7274, "total_steps": 9134, "loss": 0.7532, "learning_rate": 4.943687666167238e-06, "epoch": 0.7962998440022989, "percentage": 79.64, "elapsed_time": "5 days, 13:35:38", "remaining_time": "1 day, 10:09:38", "throughput": 2732.04, "total_tokens": 1313943904} {"current_steps": 7275, "total_steps": 9134, "loss": 0.9277, "learning_rate": 4.938555605134082e-06, "epoch": 0.7964093160732368, "percentage": 79.65, "elapsed_time": "5 days, 13:36:40", "remaining_time": "1 day, 10:08:31", "throughput": 2732.02, "total_tokens": 1314101824} {"current_steps": 7276, "total_steps": 9134, "loss": 0.8782, "learning_rate": 4.9334259173314575e-06, "epoch": 0.7965187881441748, "percentage": 79.66, "elapsed_time": "5 days, 13:37:44", "remaining_time": "1 day, 10:07:24", "throughput": 2732.0, "total_tokens": 1314267584} {"current_steps": 7277, "total_steps": 9134, "loss": 0.8843, "learning_rate": 4.928298603366174e-06, "epoch": 0.7966282602151126, "percentage": 79.67, "elapsed_time": "5 days, 13:38:51", "remaining_time": "1 day, 10:06:18", "throughput": 2732.02, "total_tokens": 1314460672} {"current_steps": 7278, "total_steps": 9134, "loss": 0.6677, "learning_rate": 4.92317366384481e-06, "epoch": 0.7967377322860505, "percentage": 79.68, "elapsed_time": "5 days, 13:39:54", "remaining_time": "1 day, 10:05:11", "throughput": 2732.04, "total_tokens": 1314642112} {"current_steps": 7279, "total_steps": 9134, "loss": 0.7358, "learning_rate": 4.918051099373605e-06, "epoch": 0.7968472043569884, "percentage": 79.69, "elapsed_time": "5 days, 13:41:02", "remaining_time": "1 day, 10:04:06", "throughput": 2732.1, "total_tokens": 1314856256} {"current_steps": 7280, "total_steps": 9134, "loss": 0.6461, "learning_rate": 4.912930910558572e-06, "epoch": 0.7969566764279263, "percentage": 79.7, "elapsed_time": "5 days, 13:42:06", "remaining_time": "1 day, 10:02:59", "throughput": 2732.08, "total_tokens": 1315023136} {"current_steps": 7281, "total_steps": 9134, "loss": 0.7788, "learning_rate": 4.907813098005415e-06, "epoch": 0.7970661484988643, "percentage": 79.71, "elapsed_time": "5 days, 13:43:13", "remaining_time": "1 day, 10:01:53", "throughput": 2732.11, "total_tokens": 1315220704} {"current_steps": 7282, "total_steps": 9134, "loss": 0.9316, "learning_rate": 4.90269766231955e-06, "epoch": 0.7971756205698022, "percentage": 79.72, "elapsed_time": "5 days, 13:44:18", "remaining_time": "1 day, 10:00:47", "throughput": 2732.14, "total_tokens": 1315414240} {"current_steps": 7283, "total_steps": 9134, "loss": 0.7114, "learning_rate": 4.897584604106145e-06, "epoch": 0.79728509264074, "percentage": 79.74, "elapsed_time": "5 days, 13:45:18", "remaining_time": "1 day, 9:59:39", "throughput": 2732.1, "total_tokens": 1315555136} {"current_steps": 7284, "total_steps": 9134, "loss": 1.1238, "learning_rate": 4.89247392397004e-06, "epoch": 0.7973945647116779, "percentage": 79.75, "elapsed_time": "5 days, 13:46:24", "remaining_time": "1 day, 9:58:33", "throughput": 2732.14, "total_tokens": 1315754496} {"current_steps": 7285, "total_steps": 9134, "loss": 0.8349, "learning_rate": 4.8873656225158405e-06, "epoch": 0.7975040367826158, "percentage": 79.76, "elapsed_time": "5 days, 13:47:25", "remaining_time": "1 day, 9:57:26", "throughput": 2732.14, "total_tokens": 1315921824} {"current_steps": 7286, "total_steps": 9134, "loss": 0.8369, "learning_rate": 4.88225970034783e-06, "epoch": 0.7976135088535538, "percentage": 79.77, "elapsed_time": "5 days, 13:48:27", "remaining_time": "1 day, 9:56:18", "throughput": 2732.12, "total_tokens": 1316085344} {"current_steps": 7287, "total_steps": 9134, "loss": 1.3288, "learning_rate": 4.8771561580700505e-06, "epoch": 0.7977229809244917, "percentage": 79.78, "elapsed_time": "5 days, 13:49:32", "remaining_time": "1 day, 9:55:12", "throughput": 2732.16, "total_tokens": 1316281120} {"current_steps": 7288, "total_steps": 9134, "loss": 0.7825, "learning_rate": 4.872054996286216e-06, "epoch": 0.7978324529954295, "percentage": 79.79, "elapsed_time": "5 days, 13:50:40", "remaining_time": "1 day, 9:54:06", "throughput": 2732.13, "total_tokens": 1316450464} {"current_steps": 7289, "total_steps": 9134, "loss": 0.6704, "learning_rate": 4.866956215599802e-06, "epoch": 0.7979419250663674, "percentage": 79.8, "elapsed_time": "5 days, 13:51:43", "remaining_time": "1 day, 9:53:00", "throughput": 2732.11, "total_tokens": 1316614432} {"current_steps": 7290, "total_steps": 9134, "loss": 0.8262, "learning_rate": 4.861859816613981e-06, "epoch": 0.7980513971373053, "percentage": 79.81, "elapsed_time": "5 days, 13:52:45", "remaining_time": "1 day, 9:51:52", "throughput": 2732.09, "total_tokens": 1316775488} {"current_steps": 7291, "total_steps": 9134, "loss": 1.0612, "learning_rate": 4.856765799931648e-06, "epoch": 0.7981608692082433, "percentage": 79.82, "elapsed_time": "5 days, 13:53:52", "remaining_time": "1 day, 9:50:46", "throughput": 2732.13, "total_tokens": 1316976640} {"current_steps": 7292, "total_steps": 9134, "loss": 0.7451, "learning_rate": 4.851674166155412e-06, "epoch": 0.7982703412791812, "percentage": 79.83, "elapsed_time": "5 days, 13:54:57", "remaining_time": "1 day, 9:49:40", "throughput": 2732.15, "total_tokens": 1317163680} {"current_steps": 7293, "total_steps": 9134, "loss": 0.7143, "learning_rate": 4.846584915887597e-06, "epoch": 0.7983798133501191, "percentage": 79.84, "elapsed_time": "5 days, 13:56:04", "remaining_time": "1 day, 9:48:34", "throughput": 2732.17, "total_tokens": 1317356320} {"current_steps": 7294, "total_steps": 9134, "loss": 0.8668, "learning_rate": 4.8414980497302755e-06, "epoch": 0.7984892854210569, "percentage": 79.86, "elapsed_time": "5 days, 13:57:05", "remaining_time": "1 day, 9:47:27", "throughput": 2732.17, "total_tokens": 1317524320} {"current_steps": 7295, "total_steps": 9134, "loss": 0.799, "learning_rate": 4.836413568285183e-06, "epoch": 0.7985987574919948, "percentage": 79.87, "elapsed_time": "5 days, 13:58:07", "remaining_time": "1 day, 9:46:20", "throughput": 2732.15, "total_tokens": 1317682464} {"current_steps": 7296, "total_steps": 9134, "loss": 0.8909, "learning_rate": 4.831331472153828e-06, "epoch": 0.7987082295629327, "percentage": 79.88, "elapsed_time": "5 days, 13:59:11", "remaining_time": "1 day, 9:45:13", "throughput": 2732.14, "total_tokens": 1317851136} {"current_steps": 7297, "total_steps": 9134, "loss": 0.724, "learning_rate": 4.8262517619374e-06, "epoch": 0.7988177016338707, "percentage": 79.89, "elapsed_time": "5 days, 14:00:17", "remaining_time": "1 day, 9:44:07", "throughput": 2732.18, "total_tokens": 1318050720} {"current_steps": 7298, "total_steps": 9134, "loss": 0.9177, "learning_rate": 4.821174438236825e-06, "epoch": 0.7989271737048086, "percentage": 79.9, "elapsed_time": "5 days, 14:01:23", "remaining_time": "1 day, 9:43:01", "throughput": 2732.18, "total_tokens": 1318231936} {"current_steps": 7299, "total_steps": 9134, "loss": 0.8303, "learning_rate": 4.816099501652741e-06, "epoch": 0.7990366457757465, "percentage": 79.91, "elapsed_time": "5 days, 14:02:25", "remaining_time": "1 day, 9:41:53", "throughput": 2732.19, "total_tokens": 1318403968} {"current_steps": 7300, "total_steps": 9134, "loss": 0.8109, "learning_rate": 4.8110269527854965e-06, "epoch": 0.7991461178466843, "percentage": 79.92, "elapsed_time": "5 days, 14:03:25", "remaining_time": "1 day, 9:40:46", "throughput": 2732.15, "total_tokens": 1318550016} {"current_steps": 7301, "total_steps": 9134, "loss": 0.7822, "learning_rate": 4.805956792235172e-06, "epoch": 0.7992555899176222, "percentage": 79.93, "elapsed_time": "5 days, 14:04:28", "remaining_time": "1 day, 9:39:39", "throughput": 2732.15, "total_tokens": 1318721600} {"current_steps": 7302, "total_steps": 9134, "loss": 1.0638, "learning_rate": 4.800889020601548e-06, "epoch": 0.7993650619885602, "percentage": 79.94, "elapsed_time": "5 days, 14:05:31", "remaining_time": "1 day, 9:38:32", "throughput": 2732.09, "total_tokens": 1318866304} {"current_steps": 7303, "total_steps": 9134, "loss": 0.9173, "learning_rate": 4.795823638484142e-06, "epoch": 0.7994745340594981, "percentage": 79.95, "elapsed_time": "5 days, 14:06:37", "remaining_time": "1 day, 9:37:26", "throughput": 2732.11, "total_tokens": 1319056480} {"current_steps": 7304, "total_steps": 9134, "loss": 0.8702, "learning_rate": 4.790760646482178e-06, "epoch": 0.799584006130436, "percentage": 79.96, "elapsed_time": "5 days, 14:07:39", "remaining_time": "1 day, 9:36:19", "throughput": 2732.09, "total_tokens": 1319217312} {"current_steps": 7305, "total_steps": 9134, "loss": 0.7576, "learning_rate": 4.785700045194596e-06, "epoch": 0.7996934782013738, "percentage": 79.98, "elapsed_time": "5 days, 14:08:42", "remaining_time": "1 day, 9:35:12", "throughput": 2732.1, "total_tokens": 1319394048} {"current_steps": 7306, "total_steps": 9134, "loss": 0.9075, "learning_rate": 4.7806418352200565e-06, "epoch": 0.7998029502723117, "percentage": 79.99, "elapsed_time": "5 days, 14:09:48", "remaining_time": "1 day, 9:34:06", "throughput": 2732.16, "total_tokens": 1319601024} {"current_steps": 7307, "total_steps": 9134, "loss": 0.8667, "learning_rate": 4.775586017156936e-06, "epoch": 0.7999124223432497, "percentage": 80.0, "elapsed_time": "5 days, 14:10:50", "remaining_time": "1 day, 9:32:59", "throughput": 2732.19, "total_tokens": 1319786944} {"current_steps": 7308, "total_steps": 9134, "loss": 0.8673, "learning_rate": 4.770532591603324e-06, "epoch": 0.8000218944141876, "percentage": 80.01, "elapsed_time": "5 days, 14:11:55", "remaining_time": "1 day, 9:31:52", "throughput": 2732.2, "total_tokens": 1319966592} {"current_steps": 7309, "total_steps": 9134, "loss": 0.8826, "learning_rate": 4.765481559157034e-06, "epoch": 0.8001313664851255, "percentage": 80.02, "elapsed_time": "5 days, 14:12:58", "remaining_time": "1 day, 9:30:45", "throughput": 2732.22, "total_tokens": 1320149152} {"current_steps": 7310, "total_steps": 9134, "loss": 0.7683, "learning_rate": 4.760432920415589e-06, "epoch": 0.8002408385560634, "percentage": 80.03, "elapsed_time": "5 days, 14:14:04", "remaining_time": "1 day, 9:29:39", "throughput": 2732.27, "total_tokens": 1320353440} {"current_steps": 7311, "total_steps": 9134, "loss": 0.7083, "learning_rate": 4.755386675976245e-06, "epoch": 0.8003503106270012, "percentage": 80.04, "elapsed_time": "5 days, 14:15:08", "remaining_time": "1 day, 9:28:33", "throughput": 2732.28, "total_tokens": 1320536224} {"current_steps": 7312, "total_steps": 9134, "loss": 0.8471, "learning_rate": 4.750342826435955e-06, "epoch": 0.8004597826979392, "percentage": 80.05, "elapsed_time": "5 days, 14:16:13", "remaining_time": "1 day, 9:27:26", "throughput": 2732.34, "total_tokens": 1320739392} {"current_steps": 7313, "total_steps": 9134, "loss": 1.229, "learning_rate": 4.745301372391397e-06, "epoch": 0.8005692547688771, "percentage": 80.06, "elapsed_time": "5 days, 14:17:19", "remaining_time": "1 day, 9:26:20", "throughput": 2732.35, "total_tokens": 1320927328} {"current_steps": 7314, "total_steps": 9134, "loss": 0.827, "learning_rate": 4.740262314438968e-06, "epoch": 0.800678726839815, "percentage": 80.07, "elapsed_time": "5 days, 14:18:25", "remaining_time": "1 day, 9:25:14", "throughput": 2732.39, "total_tokens": 1321123104} {"current_steps": 7315, "total_steps": 9134, "loss": 0.8672, "learning_rate": 4.7352256531747766e-06, "epoch": 0.8007881989107529, "percentage": 80.09, "elapsed_time": "5 days, 14:19:27", "remaining_time": "1 day, 9:24:07", "throughput": 2732.37, "total_tokens": 1321284832} {"current_steps": 7316, "total_steps": 9134, "loss": 0.6346, "learning_rate": 4.730191389194652e-06, "epoch": 0.8008976709816908, "percentage": 80.1, "elapsed_time": "5 days, 14:20:32", "remaining_time": "1 day, 9:23:00", "throughput": 2732.38, "total_tokens": 1321465824} {"current_steps": 7317, "total_steps": 9134, "loss": 0.7188, "learning_rate": 4.725159523094127e-06, "epoch": 0.8010071430526287, "percentage": 80.11, "elapsed_time": "5 days, 14:21:33", "remaining_time": "1 day, 9:21:53", "throughput": 2732.37, "total_tokens": 1321632256} {"current_steps": 7318, "total_steps": 9134, "loss": 0.7554, "learning_rate": 4.720130055468488e-06, "epoch": 0.8011166151235666, "percentage": 80.12, "elapsed_time": "5 days, 14:22:40", "remaining_time": "1 day, 9:20:47", "throughput": 2732.42, "total_tokens": 1321836096} {"current_steps": 7319, "total_steps": 9134, "loss": 0.7997, "learning_rate": 4.7151029869126784e-06, "epoch": 0.8012260871945045, "percentage": 80.13, "elapsed_time": "5 days, 14:23:44", "remaining_time": "1 day, 9:19:41", "throughput": 2732.45, "total_tokens": 1322027392} {"current_steps": 7320, "total_steps": 9134, "loss": 0.924, "learning_rate": 4.710078318021424e-06, "epoch": 0.8013355592654424, "percentage": 80.14, "elapsed_time": "5 days, 14:24:50", "remaining_time": "1 day, 9:18:35", "throughput": 2732.46, "total_tokens": 1322213536} {"current_steps": 7321, "total_steps": 9134, "loss": 0.7621, "learning_rate": 4.705056049389101e-06, "epoch": 0.8014450313363803, "percentage": 80.15, "elapsed_time": "5 days, 14:25:52", "remaining_time": "1 day, 9:17:27", "throughput": 2732.45, "total_tokens": 1322377056} {"current_steps": 7322, "total_steps": 9134, "loss": 0.6781, "learning_rate": 4.700036181609857e-06, "epoch": 0.8015545034073182, "percentage": 80.16, "elapsed_time": "5 days, 14:26:54", "remaining_time": "1 day, 9:16:20", "throughput": 2732.47, "total_tokens": 1322556704} {"current_steps": 7323, "total_steps": 9134, "loss": 0.6953, "learning_rate": 4.695018715277527e-06, "epoch": 0.8016639754782561, "percentage": 80.17, "elapsed_time": "5 days, 14:27:58", "remaining_time": "1 day, 9:15:14", "throughput": 2732.47, "total_tokens": 1322729856} {"current_steps": 7324, "total_steps": 9134, "loss": 1.0356, "learning_rate": 4.690003650985658e-06, "epoch": 0.801773447549194, "percentage": 80.18, "elapsed_time": "5 days, 14:29:04", "remaining_time": "1 day, 9:14:07", "throughput": 2732.52, "total_tokens": 1322934368} {"current_steps": 7325, "total_steps": 9134, "loss": 0.8542, "learning_rate": 4.684990989327548e-06, "epoch": 0.8018829196201319, "percentage": 80.19, "elapsed_time": "5 days, 14:30:11", "remaining_time": "1 day, 9:13:02", "throughput": 2732.49, "total_tokens": 1323103712} {"current_steps": 7326, "total_steps": 9134, "loss": 0.8998, "learning_rate": 4.679980730896153e-06, "epoch": 0.8019923916910698, "percentage": 80.21, "elapsed_time": "5 days, 14:31:18", "remaining_time": "1 day, 9:11:56", "throughput": 2732.51, "total_tokens": 1323295232} {"current_steps": 7327, "total_steps": 9134, "loss": 0.9954, "learning_rate": 4.674972876284203e-06, "epoch": 0.8021018637620078, "percentage": 80.22, "elapsed_time": "5 days, 14:32:20", "remaining_time": "1 day, 9:10:49", "throughput": 2732.51, "total_tokens": 1323467712} {"current_steps": 7328, "total_steps": 9134, "loss": 0.8045, "learning_rate": 4.6699674260840955e-06, "epoch": 0.8022113358329456, "percentage": 80.23, "elapsed_time": "5 days, 14:33:25", "remaining_time": "1 day, 9:09:42", "throughput": 2732.52, "total_tokens": 1323649600} {"current_steps": 7329, "total_steps": 9134, "loss": 0.6878, "learning_rate": 4.664964380887985e-06, "epoch": 0.8023208079038835, "percentage": 80.24, "elapsed_time": "5 days, 14:34:30", "remaining_time": "1 day, 9:08:36", "throughput": 2732.55, "total_tokens": 1323840448} {"current_steps": 7330, "total_steps": 9134, "loss": 0.8504, "learning_rate": 4.6599637412877125e-06, "epoch": 0.8024302799748214, "percentage": 80.25, "elapsed_time": "5 days, 14:35:36", "remaining_time": "1 day, 9:07:30", "throughput": 2732.57, "total_tokens": 1324028160} {"current_steps": 7331, "total_steps": 9134, "loss": 0.8893, "learning_rate": 4.654965507874845e-06, "epoch": 0.8025397520457593, "percentage": 80.26, "elapsed_time": "5 days, 14:36:42", "remaining_time": "1 day, 9:06:24", "throughput": 2732.56, "total_tokens": 1324204672} {"current_steps": 7332, "total_steps": 9134, "loss": 0.8834, "learning_rate": 4.649969681240668e-06, "epoch": 0.8026492241166973, "percentage": 80.27, "elapsed_time": "5 days, 14:37:43", "remaining_time": "1 day, 9:05:16", "throughput": 2732.56, "total_tokens": 1324373120} {"current_steps": 7333, "total_steps": 9134, "loss": 1.0278, "learning_rate": 4.644976261976172e-06, "epoch": 0.8027586961876352, "percentage": 80.28, "elapsed_time": "5 days, 14:38:48", "remaining_time": "1 day, 9:04:10", "throughput": 2732.57, "total_tokens": 1324556352} {"current_steps": 7334, "total_steps": 9134, "loss": 0.6972, "learning_rate": 4.639985250672074e-06, "epoch": 0.802868168258573, "percentage": 80.29, "elapsed_time": "5 days, 14:39:52", "remaining_time": "1 day, 9:03:03", "throughput": 2732.61, "total_tokens": 1324750784} {"current_steps": 7335, "total_steps": 9134, "loss": 0.8335, "learning_rate": 4.634996647918791e-06, "epoch": 0.8029776403295109, "percentage": 80.3, "elapsed_time": "5 days, 14:40:57", "remaining_time": "1 day, 9:01:57", "throughput": 2732.59, "total_tokens": 1324914976} {"current_steps": 7336, "total_steps": 9134, "loss": 0.7898, "learning_rate": 4.63001045430648e-06, "epoch": 0.8030871124004488, "percentage": 80.32, "elapsed_time": "5 days, 14:41:59", "remaining_time": "1 day, 9:00:50", "throughput": 2732.57, "total_tokens": 1325077376} {"current_steps": 7337, "total_steps": 9134, "loss": 0.9254, "learning_rate": 4.625026670424992e-06, "epoch": 0.8031965844713868, "percentage": 80.33, "elapsed_time": "5 days, 14:43:01", "remaining_time": "1 day, 8:59:43", "throughput": 2732.54, "total_tokens": 1325234176} {"current_steps": 7338, "total_steps": 9134, "loss": 0.9004, "learning_rate": 4.620045296863898e-06, "epoch": 0.8033060565423247, "percentage": 80.34, "elapsed_time": "5 days, 14:44:02", "remaining_time": "1 day, 8:58:35", "throughput": 2732.54, "total_tokens": 1325400160} {"current_steps": 7339, "total_steps": 9134, "loss": 0.8151, "learning_rate": 4.615066334212487e-06, "epoch": 0.8034155286132625, "percentage": 80.35, "elapsed_time": "5 days, 14:45:07", "remaining_time": "1 day, 8:57:29", "throughput": 2732.56, "total_tokens": 1325586976} {"current_steps": 7340, "total_steps": 9134, "loss": 0.8776, "learning_rate": 4.61008978305976e-06, "epoch": 0.8035250006842004, "percentage": 80.36, "elapsed_time": "5 days, 14:46:09", "remaining_time": "1 day, 8:56:22", "throughput": 2732.56, "total_tokens": 1325754080} {"current_steps": 7341, "total_steps": 9134, "loss": 1.0879, "learning_rate": 4.605115643994429e-06, "epoch": 0.8036344727551383, "percentage": 80.37, "elapsed_time": "5 days, 14:47:16", "remaining_time": "1 day, 8:55:16", "throughput": 2732.61, "total_tokens": 1325964416} {"current_steps": 7342, "total_steps": 9134, "loss": 0.8148, "learning_rate": 4.6001439176049325e-06, "epoch": 0.8037439448260763, "percentage": 80.38, "elapsed_time": "5 days, 14:48:20", "remaining_time": "1 day, 8:54:09", "throughput": 2732.61, "total_tokens": 1326135104} {"current_steps": 7343, "total_steps": 9134, "loss": 0.8462, "learning_rate": 4.595174604479405e-06, "epoch": 0.8038534168970142, "percentage": 80.39, "elapsed_time": "5 days, 14:49:26", "remaining_time": "1 day, 8:53:03", "throughput": 2732.6, "total_tokens": 1326312064} {"current_steps": 7344, "total_steps": 9134, "loss": 0.8595, "learning_rate": 4.590207705205718e-06, "epoch": 0.8039628889679521, "percentage": 80.4, "elapsed_time": "5 days, 14:50:33", "remaining_time": "1 day, 8:51:57", "throughput": 2732.61, "total_tokens": 1326497984} {"current_steps": 7345, "total_steps": 9134, "loss": 0.8105, "learning_rate": 4.585243220371446e-06, "epoch": 0.8040723610388899, "percentage": 80.41, "elapsed_time": "5 days, 14:51:37", "remaining_time": "1 day, 8:50:51", "throughput": 2732.61, "total_tokens": 1326673824} {"current_steps": 7346, "total_steps": 9134, "loss": 0.9916, "learning_rate": 4.580281150563873e-06, "epoch": 0.8041818331098278, "percentage": 80.42, "elapsed_time": "5 days, 14:52:45", "remaining_time": "1 day, 8:49:45", "throughput": 2732.67, "total_tokens": 1326889088} {"current_steps": 7347, "total_steps": 9134, "loss": 0.815, "learning_rate": 4.575321496370005e-06, "epoch": 0.8042913051807657, "percentage": 80.44, "elapsed_time": "5 days, 14:53:51", "remaining_time": "1 day, 8:48:39", "throughput": 2732.67, "total_tokens": 1327073216} {"current_steps": 7348, "total_steps": 9134, "loss": 0.6458, "learning_rate": 4.570364258376558e-06, "epoch": 0.8044007772517037, "percentage": 80.45, "elapsed_time": "5 days, 14:54:56", "remaining_time": "1 day, 8:47:33", "throughput": 2732.66, "total_tokens": 1327245248} {"current_steps": 7349, "total_steps": 9134, "loss": 0.9682, "learning_rate": 4.565409437169965e-06, "epoch": 0.8045102493226416, "percentage": 80.46, "elapsed_time": "5 days, 14:56:00", "remaining_time": "1 day, 8:46:26", "throughput": 2732.68, "total_tokens": 1327428256} {"current_steps": 7350, "total_steps": 9134, "loss": 0.8056, "learning_rate": 4.560457033336365e-06, "epoch": 0.8046197213935795, "percentage": 80.47, "elapsed_time": "5 days, 14:57:07", "remaining_time": "1 day, 8:45:20", "throughput": 2732.71, "total_tokens": 1327626720} {"current_steps": 7351, "total_steps": 9134, "loss": 0.7252, "learning_rate": 4.555507047461638e-06, "epoch": 0.8047291934645173, "percentage": 80.48, "elapsed_time": "5 days, 14:58:09", "remaining_time": "1 day, 8:44:13", "throughput": 2732.69, "total_tokens": 1327783072} {"current_steps": 7352, "total_steps": 9134, "loss": 0.8611, "learning_rate": 4.550559480131328e-06, "epoch": 0.8048386655354552, "percentage": 80.49, "elapsed_time": "5 days, 14:59:13", "remaining_time": "1 day, 8:43:06", "throughput": 2732.68, "total_tokens": 1327957120} {"current_steps": 7353, "total_steps": 9134, "loss": 0.953, "learning_rate": 4.5456143319307475e-06, "epoch": 0.8049481376063932, "percentage": 80.5, "elapsed_time": "5 days, 15:00:18", "remaining_time": "1 day, 8:42:00", "throughput": 2732.67, "total_tokens": 1328127360} {"current_steps": 7354, "total_steps": 9134, "loss": 0.8742, "learning_rate": 4.5406716034448905e-06, "epoch": 0.8050576096773311, "percentage": 80.51, "elapsed_time": "5 days, 15:01:22", "remaining_time": "1 day, 8:40:53", "throughput": 2732.67, "total_tokens": 1328302080} {"current_steps": 7355, "total_steps": 9134, "loss": 0.7185, "learning_rate": 4.535731295258469e-06, "epoch": 0.805167081748269, "percentage": 80.52, "elapsed_time": "5 days, 15:02:22", "remaining_time": "1 day, 8:39:46", "throughput": 2732.65, "total_tokens": 1328458208} {"current_steps": 7356, "total_steps": 9134, "loss": 0.8009, "learning_rate": 4.530793407955913e-06, "epoch": 0.8052765538192068, "percentage": 80.53, "elapsed_time": "5 days, 15:03:28", "remaining_time": "1 day, 8:38:40", "throughput": 2732.63, "total_tokens": 1328626208} {"current_steps": 7357, "total_steps": 9134, "loss": 0.9275, "learning_rate": 4.525857942121364e-06, "epoch": 0.8053860258901447, "percentage": 80.55, "elapsed_time": "5 days, 15:04:32", "remaining_time": "1 day, 8:37:33", "throughput": 2732.65, "total_tokens": 1328810336} {"current_steps": 7358, "total_steps": 9134, "loss": 0.9113, "learning_rate": 4.520924898338691e-06, "epoch": 0.8054954979610827, "percentage": 80.56, "elapsed_time": "5 days, 15:05:36", "remaining_time": "1 day, 8:36:26", "throughput": 2732.67, "total_tokens": 1328994240} {"current_steps": 7359, "total_steps": 9134, "loss": 0.9001, "learning_rate": 4.51599427719144e-06, "epoch": 0.8056049700320206, "percentage": 80.57, "elapsed_time": "5 days, 15:06:39", "remaining_time": "1 day, 8:35:20", "throughput": 2732.64, "total_tokens": 1329153280} {"current_steps": 7360, "total_steps": 9134, "loss": 0.7351, "learning_rate": 4.511066079262921e-06, "epoch": 0.8057144421029585, "percentage": 80.58, "elapsed_time": "5 days, 15:07:40", "remaining_time": "1 day, 8:34:12", "throughput": 2732.63, "total_tokens": 1329318368} {"current_steps": 7361, "total_steps": 9134, "loss": 1.0326, "learning_rate": 4.506140305136103e-06, "epoch": 0.8058239141738964, "percentage": 80.59, "elapsed_time": "5 days, 15:08:47", "remaining_time": "1 day, 8:33:07", "throughput": 2732.68, "total_tokens": 1329524448} {"current_steps": 7362, "total_steps": 9134, "loss": 0.7761, "learning_rate": 4.501216955393722e-06, "epoch": 0.8059333862448342, "percentage": 80.6, "elapsed_time": "5 days, 15:09:54", "remaining_time": "1 day, 8:32:01", "throughput": 2732.69, "total_tokens": 1329713504} {"current_steps": 7363, "total_steps": 9134, "loss": 0.7, "learning_rate": 4.496296030618177e-06, "epoch": 0.8060428583157722, "percentage": 80.61, "elapsed_time": "5 days, 15:11:00", "remaining_time": "1 day, 8:30:54", "throughput": 2732.7, "total_tokens": 1329896736} {"current_steps": 7364, "total_steps": 9134, "loss": 0.7794, "learning_rate": 4.491377531391619e-06, "epoch": 0.8061523303867101, "percentage": 80.62, "elapsed_time": "5 days, 15:12:03", "remaining_time": "1 day, 8:29:48", "throughput": 2732.72, "total_tokens": 1330080864} {"current_steps": 7365, "total_steps": 9134, "loss": 1.1626, "learning_rate": 4.486461458295896e-06, "epoch": 0.806261802457648, "percentage": 80.63, "elapsed_time": "5 days, 15:13:09", "remaining_time": "1 day, 8:28:42", "throughput": 2732.74, "total_tokens": 1330271264} {"current_steps": 7366, "total_steps": 9134, "loss": 0.7979, "learning_rate": 4.4815478119125595e-06, "epoch": 0.8063712745285859, "percentage": 80.64, "elapsed_time": "5 days, 15:14:13", "remaining_time": "1 day, 8:27:35", "throughput": 2732.73, "total_tokens": 1330438816} {"current_steps": 7367, "total_steps": 9134, "loss": 0.7302, "learning_rate": 4.4766365928229054e-06, "epoch": 0.8064807465995238, "percentage": 80.65, "elapsed_time": "5 days, 15:15:15", "remaining_time": "1 day, 8:26:28", "throughput": 2732.72, "total_tokens": 1330600544} {"current_steps": 7368, "total_steps": 9134, "loss": 0.7553, "learning_rate": 4.471727801607895e-06, "epoch": 0.8065902186704617, "percentage": 80.67, "elapsed_time": "5 days, 15:16:18", "remaining_time": "1 day, 8:25:21", "throughput": 2732.73, "total_tokens": 1330782208} {"current_steps": 7369, "total_steps": 9134, "loss": 0.6178, "learning_rate": 4.466821438848254e-06, "epoch": 0.8066996907413996, "percentage": 80.68, "elapsed_time": "5 days, 15:17:24", "remaining_time": "1 day, 8:24:15", "throughput": 2732.67, "total_tokens": 1330932512} {"current_steps": 7370, "total_steps": 9134, "loss": 0.5548, "learning_rate": 4.461917505124375e-06, "epoch": 0.8068091628123375, "percentage": 80.69, "elapsed_time": "5 days, 15:18:26", "remaining_time": "1 day, 8:23:08", "throughput": 2732.69, "total_tokens": 1331111936} {"current_steps": 7371, "total_steps": 9134, "loss": 0.7824, "learning_rate": 4.457016001016395e-06, "epoch": 0.8069186348832754, "percentage": 80.7, "elapsed_time": "5 days, 15:19:30", "remaining_time": "1 day, 8:22:01", "throughput": 2732.67, "total_tokens": 1331275680} {"current_steps": 7372, "total_steps": 9134, "loss": 0.7388, "learning_rate": 4.452116927104152e-06, "epoch": 0.8070281069542133, "percentage": 80.71, "elapsed_time": "5 days, 15:20:31", "remaining_time": "1 day, 8:20:54", "throughput": 2732.68, "total_tokens": 1331448832} {"current_steps": 7373, "total_steps": 9134, "loss": 0.8116, "learning_rate": 4.447220283967196e-06, "epoch": 0.8071375790251512, "percentage": 80.72, "elapsed_time": "5 days, 15:21:38", "remaining_time": "1 day, 8:19:48", "throughput": 2732.7, "total_tokens": 1331641024} {"current_steps": 7374, "total_steps": 9134, "loss": 0.8541, "learning_rate": 4.442326072184791e-06, "epoch": 0.8072470510960891, "percentage": 80.73, "elapsed_time": "5 days, 15:22:43", "remaining_time": "1 day, 8:18:42", "throughput": 2732.75, "total_tokens": 1331842176} {"current_steps": 7375, "total_steps": 9134, "loss": 0.6279, "learning_rate": 4.4374342923359125e-06, "epoch": 0.807356523167027, "percentage": 80.74, "elapsed_time": "5 days, 15:23:50", "remaining_time": "1 day, 8:17:36", "throughput": 2732.82, "total_tokens": 1332058560} {"current_steps": 7376, "total_steps": 9134, "loss": 0.8353, "learning_rate": 4.4325449449992455e-06, "epoch": 0.8074659952379649, "percentage": 80.75, "elapsed_time": "5 days, 15:24:58", "remaining_time": "1 day, 8:16:30", "throughput": 2732.87, "total_tokens": 1332270464} {"current_steps": 7377, "total_steps": 9134, "loss": 0.7302, "learning_rate": 4.42765803075319e-06, "epoch": 0.8075754673089028, "percentage": 80.76, "elapsed_time": "5 days, 15:26:05", "remaining_time": "1 day, 8:15:24", "throughput": 2732.9, "total_tokens": 1332467360} {"current_steps": 7378, "total_steps": 9134, "loss": 0.7016, "learning_rate": 4.4227735501758654e-06, "epoch": 0.8076849393798408, "percentage": 80.78, "elapsed_time": "5 days, 15:27:12", "remaining_time": "1 day, 8:14:18", "throughput": 2732.95, "total_tokens": 1332676576} {"current_steps": 7379, "total_steps": 9134, "loss": 0.7291, "learning_rate": 4.417891503845095e-06, "epoch": 0.8077944114507786, "percentage": 80.79, "elapsed_time": "5 days, 15:28:19", "remaining_time": "1 day, 8:13:12", "throughput": 2732.97, "total_tokens": 1332868768} {"current_steps": 7380, "total_steps": 9134, "loss": 1.055, "learning_rate": 4.413011892338412e-06, "epoch": 0.8079038835217165, "percentage": 80.8, "elapsed_time": "5 days, 15:29:26", "remaining_time": "1 day, 8:12:07", "throughput": 2733.03, "total_tokens": 1333081120} {"current_steps": 7381, "total_steps": 9134, "loss": 0.8997, "learning_rate": 4.408134716233067e-06, "epoch": 0.8080133555926544, "percentage": 80.81, "elapsed_time": "5 days, 15:30:32", "remaining_time": "1 day, 8:11:01", "throughput": 2733.05, "total_tokens": 1333270400} {"current_steps": 7382, "total_steps": 9134, "loss": 0.7662, "learning_rate": 4.403259976106019e-06, "epoch": 0.8081228276635923, "percentage": 80.82, "elapsed_time": "5 days, 15:31:37", "remaining_time": "1 day, 8:09:54", "throughput": 2733.07, "total_tokens": 1333459008} {"current_steps": 7383, "total_steps": 9134, "loss": 0.8401, "learning_rate": 4.398387672533944e-06, "epoch": 0.8082322997345303, "percentage": 80.83, "elapsed_time": "5 days, 15:32:45", "remaining_time": "1 day, 8:08:48", "throughput": 2733.13, "total_tokens": 1333674272} {"current_steps": 7384, "total_steps": 9134, "loss": 0.8886, "learning_rate": 4.393517806093219e-06, "epoch": 0.8083417718054682, "percentage": 80.84, "elapsed_time": "5 days, 15:33:52", "remaining_time": "1 day, 8:07:43", "throughput": 2733.18, "total_tokens": 1333882144} {"current_steps": 7385, "total_steps": 9134, "loss": 0.9777, "learning_rate": 4.388650377359943e-06, "epoch": 0.808451243876406, "percentage": 80.85, "elapsed_time": "5 days, 15:34:58", "remaining_time": "1 day, 8:06:37", "throughput": 2733.22, "total_tokens": 1334082624} {"current_steps": 7386, "total_steps": 9134, "loss": 1.0062, "learning_rate": 4.383785386909931e-06, "epoch": 0.8085607159473439, "percentage": 80.86, "elapsed_time": "5 days, 15:36:04", "remaining_time": "1 day, 8:05:30", "throughput": 2733.2, "total_tokens": 1334251072} {"current_steps": 7387, "total_steps": 9134, "loss": 0.9016, "learning_rate": 4.378922835318694e-06, "epoch": 0.8086701880182818, "percentage": 80.87, "elapsed_time": "5 days, 15:37:04", "remaining_time": "1 day, 8:04:23", "throughput": 2733.14, "total_tokens": 1334385024} {"current_steps": 7388, "total_steps": 9134, "loss": 0.8015, "learning_rate": 4.374062723161468e-06, "epoch": 0.8087796600892198, "percentage": 80.88, "elapsed_time": "5 days, 15:38:09", "remaining_time": "1 day, 8:03:17", "throughput": 2733.14, "total_tokens": 1334564672} {"current_steps": 7389, "total_steps": 9134, "loss": 0.9851, "learning_rate": 4.369205051013189e-06, "epoch": 0.8088891321601577, "percentage": 80.9, "elapsed_time": "5 days, 15:39:09", "remaining_time": "1 day, 8:02:09", "throughput": 2733.1, "total_tokens": 1334707360} {"current_steps": 7390, "total_steps": 9134, "loss": 0.5972, "learning_rate": 4.364349819448507e-06, "epoch": 0.8089986042310956, "percentage": 80.91, "elapsed_time": "5 days, 15:40:14", "remaining_time": "1 day, 8:01:03", "throughput": 2733.08, "total_tokens": 1334874016} {"current_steps": 7391, "total_steps": 9134, "loss": 1.1233, "learning_rate": 4.359497029041807e-06, "epoch": 0.8091080763020334, "percentage": 80.92, "elapsed_time": "5 days, 15:41:18", "remaining_time": "1 day, 7:59:56", "throughput": 2733.12, "total_tokens": 1335070688} {"current_steps": 7392, "total_steps": 9134, "loss": 0.5571, "learning_rate": 4.354646680367136e-06, "epoch": 0.8092175483729713, "percentage": 80.93, "elapsed_time": "5 days, 15:42:23", "remaining_time": "1 day, 7:58:50", "throughput": 2733.11, "total_tokens": 1335242272} {"current_steps": 7393, "total_steps": 9134, "loss": 0.784, "learning_rate": 4.34979877399831e-06, "epoch": 0.8093270204439093, "percentage": 80.94, "elapsed_time": "5 days, 15:43:25", "remaining_time": "1 day, 7:57:43", "throughput": 2733.11, "total_tokens": 1335412288} {"current_steps": 7394, "total_steps": 9134, "loss": 0.9471, "learning_rate": 4.3449533105087984e-06, "epoch": 0.8094364925148472, "percentage": 80.95, "elapsed_time": "5 days, 15:44:30", "remaining_time": "1 day, 7:56:36", "throughput": 2733.15, "total_tokens": 1335611424} {"current_steps": 7395, "total_steps": 9134, "loss": 0.7161, "learning_rate": 4.3401102904718296e-06, "epoch": 0.8095459645857851, "percentage": 80.96, "elapsed_time": "5 days, 15:45:32", "remaining_time": "1 day, 7:55:29", "throughput": 2733.14, "total_tokens": 1335776288} {"current_steps": 7396, "total_steps": 9134, "loss": 0.6695, "learning_rate": 4.335269714460322e-06, "epoch": 0.8096554366567229, "percentage": 80.97, "elapsed_time": "5 days, 15:46:36", "remaining_time": "1 day, 7:54:23", "throughput": 2733.13, "total_tokens": 1335943616} {"current_steps": 7397, "total_steps": 9134, "loss": 0.9346, "learning_rate": 4.3304315830468985e-06, "epoch": 0.8097649087276608, "percentage": 80.98, "elapsed_time": "5 days, 15:47:41", "remaining_time": "1 day, 7:53:16", "throughput": 2733.15, "total_tokens": 1336130880} {"current_steps": 7398, "total_steps": 9134, "loss": 0.7704, "learning_rate": 4.325595896803908e-06, "epoch": 0.8098743807985987, "percentage": 80.99, "elapsed_time": "5 days, 15:48:49", "remaining_time": "1 day, 7:52:11", "throughput": 2733.21, "total_tokens": 1336346144} {"current_steps": 7399, "total_steps": 9134, "loss": 0.8845, "learning_rate": 4.320762656303392e-06, "epoch": 0.8099838528695367, "percentage": 81.01, "elapsed_time": "5 days, 15:49:54", "remaining_time": "1 day, 7:51:04", "throughput": 2733.21, "total_tokens": 1336521984} {"current_steps": 7400, "total_steps": 9134, "loss": 0.8613, "learning_rate": 4.315931862117137e-06, "epoch": 0.8100933249404746, "percentage": 81.02, "elapsed_time": "5 days, 15:50:56", "remaining_time": "1 day, 7:49:57", "throughput": 2733.19, "total_tokens": 1336681920} {"current_steps": 7401, "total_steps": 9134, "loss": 0.753, "learning_rate": 4.311103514816589e-06, "epoch": 0.8102027970114125, "percentage": 81.03, "elapsed_time": "5 days, 15:51:55", "remaining_time": "1 day, 7:48:49", "throughput": 2733.13, "total_tokens": 1336815872} {"current_steps": 7402, "total_steps": 9134, "loss": 0.7864, "learning_rate": 4.306277614972956e-06, "epoch": 0.8103122690823503, "percentage": 81.04, "elapsed_time": "5 days, 15:53:02", "remaining_time": "1 day, 7:47:44", "throughput": 2733.13, "total_tokens": 1337000896} {"current_steps": 7403, "total_steps": 9134, "loss": 0.848, "learning_rate": 4.3014541631571095e-06, "epoch": 0.8104217411532882, "percentage": 81.05, "elapsed_time": "5 days, 15:54:08", "remaining_time": "1 day, 7:46:38", "throughput": 2733.14, "total_tokens": 1337183680} {"current_steps": 7404, "total_steps": 9134, "loss": 0.9624, "learning_rate": 4.29663315993967e-06, "epoch": 0.8105312132242262, "percentage": 81.06, "elapsed_time": "5 days, 15:55:15", "remaining_time": "1 day, 7:45:32", "throughput": 2733.16, "total_tokens": 1337376768} {"current_steps": 7405, "total_steps": 9134, "loss": 0.9327, "learning_rate": 4.291814605890954e-06, "epoch": 0.8106406852951641, "percentage": 81.07, "elapsed_time": "5 days, 15:56:16", "remaining_time": "1 day, 7:44:24", "throughput": 2733.16, "total_tokens": 1337541632} {"current_steps": 7406, "total_steps": 9134, "loss": 0.6438, "learning_rate": 4.28699850158098e-06, "epoch": 0.810750157366102, "percentage": 81.08, "elapsed_time": "5 days, 15:57:19", "remaining_time": "1 day, 7:43:18", "throughput": 2733.11, "total_tokens": 1337694624} {"current_steps": 7407, "total_steps": 9134, "loss": 1.0823, "learning_rate": 4.2821848475794875e-06, "epoch": 0.8108596294370399, "percentage": 81.09, "elapsed_time": "5 days, 15:58:23", "remaining_time": "1 day, 7:42:11", "throughput": 2733.13, "total_tokens": 1337878080} {"current_steps": 7408, "total_steps": 9134, "loss": 0.8478, "learning_rate": 4.277373644455915e-06, "epoch": 0.8109691015079777, "percentage": 81.1, "elapsed_time": "5 days, 15:59:28", "remaining_time": "1 day, 7:41:05", "throughput": 2733.14, "total_tokens": 1338059744} {"current_steps": 7409, "total_steps": 9134, "loss": 0.9285, "learning_rate": 4.272564892779438e-06, "epoch": 0.8110785735789157, "percentage": 81.11, "elapsed_time": "5 days, 16:00:32", "remaining_time": "1 day, 7:39:58", "throughput": 2733.16, "total_tokens": 1338242304} {"current_steps": 7410, "total_steps": 9134, "loss": 0.919, "learning_rate": 4.267758593118898e-06, "epoch": 0.8111880456498536, "percentage": 81.13, "elapsed_time": "5 days, 16:01:35", "remaining_time": "1 day, 7:38:51", "throughput": 2733.18, "total_tokens": 1338426656} {"current_steps": 7411, "total_steps": 9134, "loss": 0.7394, "learning_rate": 4.262954746042888e-06, "epoch": 0.8112975177207915, "percentage": 81.14, "elapsed_time": "5 days, 16:02:40", "remaining_time": "1 day, 7:37:45", "throughput": 2733.16, "total_tokens": 1338594656} {"current_steps": 7412, "total_steps": 9134, "loss": 0.821, "learning_rate": 4.258153352119693e-06, "epoch": 0.8114069897917294, "percentage": 81.15, "elapsed_time": "5 days, 16:03:41", "remaining_time": "1 day, 7:36:38", "throughput": 2733.15, "total_tokens": 1338753024} {"current_steps": 7413, "total_steps": 9134, "loss": 0.7586, "learning_rate": 4.253354411917302e-06, "epoch": 0.8115164618626672, "percentage": 81.16, "elapsed_time": "5 days, 16:04:46", "remaining_time": "1 day, 7:35:31", "throughput": 2733.14, "total_tokens": 1338927744} {"current_steps": 7414, "total_steps": 9134, "loss": 0.6698, "learning_rate": 4.2485579260034215e-06, "epoch": 0.8116259339336052, "percentage": 81.17, "elapsed_time": "5 days, 16:05:53", "remaining_time": "1 day, 7:34:25", "throughput": 2733.09, "total_tokens": 1339084992} {"current_steps": 7415, "total_steps": 9134, "loss": 0.8649, "learning_rate": 4.243763894945471e-06, "epoch": 0.8117354060045431, "percentage": 81.18, "elapsed_time": "5 days, 16:06:56", "remaining_time": "1 day, 7:33:19", "throughput": 2733.09, "total_tokens": 1339261280} {"current_steps": 7416, "total_steps": 9134, "loss": 0.893, "learning_rate": 4.238972319310572e-06, "epoch": 0.811844878075481, "percentage": 81.19, "elapsed_time": "5 days, 16:07:55", "remaining_time": "1 day, 7:32:11", "throughput": 2733.05, "total_tokens": 1339400384} {"current_steps": 7417, "total_steps": 9134, "loss": 1.0016, "learning_rate": 4.234183199665559e-06, "epoch": 0.8119543501464189, "percentage": 81.2, "elapsed_time": "5 days, 16:08:57", "remaining_time": "1 day, 7:31:04", "throughput": 2733.06, "total_tokens": 1339573088} {"current_steps": 7418, "total_steps": 9134, "loss": 0.7836, "learning_rate": 4.229396536576968e-06, "epoch": 0.8120638222173568, "percentage": 81.21, "elapsed_time": "5 days, 16:10:03", "remaining_time": "1 day, 7:29:58", "throughput": 2733.12, "total_tokens": 1339782976} {"current_steps": 7419, "total_steps": 9134, "loss": 0.6798, "learning_rate": 4.224612330611069e-06, "epoch": 0.8121732942882947, "percentage": 81.22, "elapsed_time": "5 days, 16:11:04", "remaining_time": "1 day, 7:28:51", "throughput": 2733.07, "total_tokens": 1339929248} {"current_steps": 7420, "total_steps": 9134, "loss": 0.8248, "learning_rate": 4.219830582333814e-06, "epoch": 0.8122827663592326, "percentage": 81.23, "elapsed_time": "5 days, 16:12:07", "remaining_time": "1 day, 7:27:44", "throughput": 2733.08, "total_tokens": 1340105536} {"current_steps": 7421, "total_steps": 9134, "loss": 0.8452, "learning_rate": 4.215051292310876e-06, "epoch": 0.8123922384301705, "percentage": 81.25, "elapsed_time": "5 days, 16:13:09", "remaining_time": "1 day, 7:26:37", "throughput": 2733.08, "total_tokens": 1340273536} {"current_steps": 7422, "total_steps": 9134, "loss": 0.6397, "learning_rate": 4.210274461107638e-06, "epoch": 0.8125017105011084, "percentage": 81.26, "elapsed_time": "5 days, 16:14:12", "remaining_time": "1 day, 7:25:30", "throughput": 2733.1, "total_tokens": 1340458560} {"current_steps": 7423, "total_steps": 9134, "loss": 0.9328, "learning_rate": 4.205500089289185e-06, "epoch": 0.8126111825720463, "percentage": 81.27, "elapsed_time": "5 days, 16:15:19", "remaining_time": "1 day, 7:24:24", "throughput": 2733.12, "total_tokens": 1340648512} {"current_steps": 7424, "total_steps": 9134, "loss": 0.7542, "learning_rate": 4.200728177420321e-06, "epoch": 0.8127206546429843, "percentage": 81.28, "elapsed_time": "5 days, 16:16:26", "remaining_time": "1 day, 7:23:18", "throughput": 2733.12, "total_tokens": 1340833312} {"current_steps": 7425, "total_steps": 9134, "loss": 1.1945, "learning_rate": 4.1959587260655465e-06, "epoch": 0.8128301267139221, "percentage": 81.29, "elapsed_time": "5 days, 16:17:29", "remaining_time": "1 day, 7:22:12", "throughput": 2733.13, "total_tokens": 1341012512} {"current_steps": 7426, "total_steps": 9134, "loss": 0.7304, "learning_rate": 4.191191735789096e-06, "epoch": 0.81293959878486, "percentage": 81.3, "elapsed_time": "5 days, 16:18:34", "remaining_time": "1 day, 7:21:05", "throughput": 2733.19, "total_tokens": 1341217696} {"current_steps": 7427, "total_steps": 9134, "loss": 0.847, "learning_rate": 4.186427207154869e-06, "epoch": 0.8130490708557979, "percentage": 81.31, "elapsed_time": "5 days, 16:19:41", "remaining_time": "1 day, 7:19:59", "throughput": 2733.18, "total_tokens": 1341394208} {"current_steps": 7428, "total_steps": 9134, "loss": 0.8174, "learning_rate": 4.181665140726523e-06, "epoch": 0.8131585429267358, "percentage": 81.32, "elapsed_time": "5 days, 16:20:45", "remaining_time": "1 day, 7:18:53", "throughput": 2733.16, "total_tokens": 1341558176} {"current_steps": 7429, "total_steps": 9134, "loss": 0.8906, "learning_rate": 4.176905537067394e-06, "epoch": 0.8132680149976738, "percentage": 81.33, "elapsed_time": "5 days, 16:21:49", "remaining_time": "1 day, 7:17:46", "throughput": 2733.13, "total_tokens": 1341716992} {"current_steps": 7430, "total_steps": 9134, "loss": 0.8367, "learning_rate": 4.1721483967405305e-06, "epoch": 0.8133774870686116, "percentage": 81.34, "elapsed_time": "5 days, 16:22:53", "remaining_time": "1 day, 7:16:40", "throughput": 2733.13, "total_tokens": 1341893280} {"current_steps": 7431, "total_steps": 9134, "loss": 0.8482, "learning_rate": 4.167393720308699e-06, "epoch": 0.8134869591395495, "percentage": 81.36, "elapsed_time": "5 days, 16:23:57", "remaining_time": "1 day, 7:15:33", "throughput": 2733.13, "total_tokens": 1342072032} {"current_steps": 7432, "total_steps": 9134, "loss": 0.7623, "learning_rate": 4.162641508334355e-06, "epoch": 0.8135964312104874, "percentage": 81.37, "elapsed_time": "5 days, 16:25:02", "remaining_time": "1 day, 7:14:27", "throughput": 2733.19, "total_tokens": 1342274080} {"current_steps": 7433, "total_steps": 9134, "loss": 0.9178, "learning_rate": 4.157891761379701e-06, "epoch": 0.8137059032814253, "percentage": 81.38, "elapsed_time": "5 days, 16:26:07", "remaining_time": "1 day, 7:13:20", "throughput": 2733.18, "total_tokens": 1342449920} {"current_steps": 7434, "total_steps": 9134, "loss": 0.9183, "learning_rate": 4.153144480006593e-06, "epoch": 0.8138153753523633, "percentage": 81.39, "elapsed_time": "5 days, 16:27:13", "remaining_time": "1 day, 7:12:14", "throughput": 2733.19, "total_tokens": 1342636736} {"current_steps": 7435, "total_steps": 9134, "loss": 0.9112, "learning_rate": 4.148399664776656e-06, "epoch": 0.8139248474233012, "percentage": 81.4, "elapsed_time": "5 days, 16:28:18", "remaining_time": "1 day, 7:11:08", "throughput": 2733.18, "total_tokens": 1342808544} {"current_steps": 7436, "total_steps": 9134, "loss": 0.7983, "learning_rate": 4.143657316251165e-06, "epoch": 0.814034319494239, "percentage": 81.41, "elapsed_time": "5 days, 16:29:25", "remaining_time": "1 day, 7:10:02", "throughput": 2733.2, "total_tokens": 1342996704} {"current_steps": 7437, "total_steps": 9134, "loss": 0.8805, "learning_rate": 4.1389174349911495e-06, "epoch": 0.8141437915651769, "percentage": 81.42, "elapsed_time": "5 days, 16:30:27", "remaining_time": "1 day, 7:08:55", "throughput": 2733.2, "total_tokens": 1343168736} {"current_steps": 7438, "total_steps": 9134, "loss": 0.6404, "learning_rate": 4.1341800215573185e-06, "epoch": 0.8142532636361148, "percentage": 81.43, "elapsed_time": "5 days, 16:31:33", "remaining_time": "1 day, 7:07:49", "throughput": 2733.21, "total_tokens": 1343357344} {"current_steps": 7439, "total_steps": 9134, "loss": 0.9419, "learning_rate": 4.129445076510105e-06, "epoch": 0.8143627357070528, "percentage": 81.44, "elapsed_time": "5 days, 16:32:37", "remaining_time": "1 day, 7:06:42", "throughput": 2733.2, "total_tokens": 1343525792} {"current_steps": 7440, "total_steps": 9134, "loss": 0.7908, "learning_rate": 4.124712600409638e-06, "epoch": 0.8144722077779907, "percentage": 81.45, "elapsed_time": "5 days, 16:33:41", "remaining_time": "1 day, 7:05:36", "throughput": 2733.2, "total_tokens": 1343701184} {"current_steps": 7441, "total_steps": 9134, "loss": 0.9502, "learning_rate": 4.119982593815761e-06, "epoch": 0.8145816798489286, "percentage": 81.46, "elapsed_time": "5 days, 16:34:48", "remaining_time": "1 day, 7:04:30", "throughput": 2733.19, "total_tokens": 1343877248} {"current_steps": 7442, "total_steps": 9134, "loss": 0.8549, "learning_rate": 4.11525505728804e-06, "epoch": 0.8146911519198664, "percentage": 81.48, "elapsed_time": "5 days, 16:35:55", "remaining_time": "1 day, 7:03:24", "throughput": 2733.24, "total_tokens": 1344084448} {"current_steps": 7443, "total_steps": 9134, "loss": 0.9725, "learning_rate": 4.110529991385706e-06, "epoch": 0.8148006239908043, "percentage": 81.49, "elapsed_time": "5 days, 16:36:57", "remaining_time": "1 day, 7:02:17", "throughput": 2733.21, "total_tokens": 1344243040} {"current_steps": 7444, "total_steps": 9134, "loss": 0.8335, "learning_rate": 4.105807396667755e-06, "epoch": 0.8149100960617423, "percentage": 81.5, "elapsed_time": "5 days, 16:38:04", "remaining_time": "1 day, 7:01:11", "throughput": 2733.22, "total_tokens": 1344424928} {"current_steps": 7445, "total_steps": 9134, "loss": 1.1022, "learning_rate": 4.10108727369283e-06, "epoch": 0.8150195681326802, "percentage": 81.51, "elapsed_time": "5 days, 16:39:11", "remaining_time": "1 day, 7:00:05", "throughput": 2733.28, "total_tokens": 1344641088} {"current_steps": 7446, "total_steps": 9134, "loss": 0.9508, "learning_rate": 4.0963696230193385e-06, "epoch": 0.8151290402036181, "percentage": 81.52, "elapsed_time": "5 days, 16:40:14", "remaining_time": "1 day, 6:58:59", "throughput": 2733.26, "total_tokens": 1344801920} {"current_steps": 7447, "total_steps": 9134, "loss": 0.7839, "learning_rate": 4.091654445205356e-06, "epoch": 0.8152385122745559, "percentage": 81.53, "elapsed_time": "5 days, 16:41:16", "remaining_time": "1 day, 6:57:52", "throughput": 2733.26, "total_tokens": 1344972160} {"current_steps": 7448, "total_steps": 9134, "loss": 0.7279, "learning_rate": 4.086941740808686e-06, "epoch": 0.8153479843454938, "percentage": 81.54, "elapsed_time": "5 days, 16:42:23", "remaining_time": "1 day, 6:56:46", "throughput": 2733.27, "total_tokens": 1345161216} {"current_steps": 7449, "total_steps": 9134, "loss": 0.7182, "learning_rate": 4.082231510386828e-06, "epoch": 0.8154574564164317, "percentage": 81.55, "elapsed_time": "5 days, 16:43:25", "remaining_time": "1 day, 6:55:39", "throughput": 2733.26, "total_tokens": 1345324960} {"current_steps": 7450, "total_steps": 9134, "loss": 0.9246, "learning_rate": 4.077523754496987e-06, "epoch": 0.8155669284873697, "percentage": 81.56, "elapsed_time": "5 days, 16:44:32", "remaining_time": "1 day, 6:54:33", "throughput": 2733.33, "total_tokens": 1345540896} {"current_steps": 7451, "total_steps": 9134, "loss": 0.7945, "learning_rate": 4.0728184736961025e-06, "epoch": 0.8156764005583076, "percentage": 81.57, "elapsed_time": "5 days, 16:45:30", "remaining_time": "1 day, 6:53:25", "throughput": 2733.27, "total_tokens": 1345674400} {"current_steps": 7452, "total_steps": 9134, "loss": 0.9205, "learning_rate": 4.068115668540776e-06, "epoch": 0.8157858726292455, "percentage": 81.59, "elapsed_time": "5 days, 16:46:28", "remaining_time": "1 day, 6:52:17", "throughput": 2733.26, "total_tokens": 1345828960} {"current_steps": 7453, "total_steps": 9134, "loss": 0.8473, "learning_rate": 4.063415339587354e-06, "epoch": 0.8158953447001833, "percentage": 81.6, "elapsed_time": "5 days, 16:47:33", "remaining_time": "1 day, 6:51:11", "throughput": 2733.27, "total_tokens": 1346009728} {"current_steps": 7454, "total_steps": 9134, "loss": 1.0731, "learning_rate": 4.058717487391875e-06, "epoch": 0.8160048167711212, "percentage": 81.61, "elapsed_time": "5 days, 16:48:39", "remaining_time": "1 day, 6:50:05", "throughput": 2733.31, "total_tokens": 1346209536} {"current_steps": 7455, "total_steps": 9134, "loss": 0.9373, "learning_rate": 4.0540221125100835e-06, "epoch": 0.8161142888420592, "percentage": 81.62, "elapsed_time": "5 days, 16:49:42", "remaining_time": "1 day, 6:48:58", "throughput": 2733.3, "total_tokens": 1346372832} {"current_steps": 7456, "total_steps": 9134, "loss": 0.7965, "learning_rate": 4.049329215497433e-06, "epoch": 0.8162237609129971, "percentage": 81.63, "elapsed_time": "5 days, 16:50:46", "remaining_time": "1 day, 6:47:51", "throughput": 2733.35, "total_tokens": 1346573984} {"current_steps": 7457, "total_steps": 9134, "loss": 0.8718, "learning_rate": 4.0446387969090865e-06, "epoch": 0.816333232983935, "percentage": 81.64, "elapsed_time": "5 days, 16:51:54", "remaining_time": "1 day, 6:46:46", "throughput": 2733.39, "total_tokens": 1346783648} {"current_steps": 7458, "total_steps": 9134, "loss": 0.8114, "learning_rate": 4.039950857299907e-06, "epoch": 0.8164427050548729, "percentage": 81.65, "elapsed_time": "5 days, 16:53:00", "remaining_time": "1 day, 6:45:40", "throughput": 2733.42, "total_tokens": 1346974048} {"current_steps": 7459, "total_steps": 9134, "loss": 0.9372, "learning_rate": 4.0352653972244805e-06, "epoch": 0.8165521771258107, "percentage": 81.66, "elapsed_time": "5 days, 16:54:07", "remaining_time": "1 day, 6:44:34", "throughput": 2733.41, "total_tokens": 1347157504} {"current_steps": 7460, "total_steps": 9134, "loss": 0.8335, "learning_rate": 4.030582417237069e-06, "epoch": 0.8166616491967487, "percentage": 81.67, "elapsed_time": "5 days, 16:55:10", "remaining_time": "1 day, 6:43:27", "throughput": 2733.43, "total_tokens": 1347339168} {"current_steps": 7461, "total_steps": 9134, "loss": 0.9939, "learning_rate": 4.025901917891678e-06, "epoch": 0.8167711212676866, "percentage": 81.68, "elapsed_time": "5 days, 16:56:09", "remaining_time": "1 day, 6:42:19", "throughput": 2733.38, "total_tokens": 1347473792} {"current_steps": 7462, "total_steps": 9134, "loss": 0.9088, "learning_rate": 4.021223899741993e-06, "epoch": 0.8168805933386245, "percentage": 81.69, "elapsed_time": "5 days, 16:57:15", "remaining_time": "1 day, 6:41:13", "throughput": 2733.43, "total_tokens": 1347679424} {"current_steps": 7463, "total_steps": 9134, "loss": 0.918, "learning_rate": 4.016548363341416e-06, "epoch": 0.8169900654095624, "percentage": 81.71, "elapsed_time": "5 days, 16:58:20", "remaining_time": "1 day, 6:40:07", "throughput": 2733.48, "total_tokens": 1347882368} {"current_steps": 7464, "total_steps": 9134, "loss": 1.0119, "learning_rate": 4.011875309243054e-06, "epoch": 0.8170995374805002, "percentage": 81.72, "elapsed_time": "5 days, 16:59:25", "remaining_time": "1 day, 6:39:01", "throughput": 2733.51, "total_tokens": 1348074784} {"current_steps": 7465, "total_steps": 9134, "loss": 1.0402, "learning_rate": 4.0072047379997175e-06, "epoch": 0.8172090095514382, "percentage": 81.73, "elapsed_time": "5 days, 17:00:29", "remaining_time": "1 day, 6:37:54", "throughput": 2733.52, "total_tokens": 1348251072} {"current_steps": 7466, "total_steps": 9134, "loss": 0.674, "learning_rate": 4.002536650163938e-06, "epoch": 0.8173184816223761, "percentage": 81.74, "elapsed_time": "5 days, 17:01:32", "remaining_time": "1 day, 6:36:47", "throughput": 2733.51, "total_tokens": 1348422656} {"current_steps": 7467, "total_steps": 9134, "loss": 0.8421, "learning_rate": 3.9978710462879206e-06, "epoch": 0.817427953693314, "percentage": 81.75, "elapsed_time": "5 days, 17:02:40", "remaining_time": "1 day, 6:35:42", "throughput": 2733.56, "total_tokens": 1348630304} {"current_steps": 7468, "total_steps": 9134, "loss": 0.9513, "learning_rate": 3.993207926923623e-06, "epoch": 0.8175374257642519, "percentage": 81.76, "elapsed_time": "5 days, 17:03:48", "remaining_time": "1 day, 6:34:36", "throughput": 2733.59, "total_tokens": 1348832128} {"current_steps": 7469, "total_steps": 9134, "loss": 0.7267, "learning_rate": 3.988547292622655e-06, "epoch": 0.8176468978351898, "percentage": 81.77, "elapsed_time": "5 days, 17:04:51", "remaining_time": "1 day, 6:33:29", "throughput": 2733.57, "total_tokens": 1348996544} {"current_steps": 7470, "total_steps": 9134, "loss": 0.8311, "learning_rate": 3.9838891439363816e-06, "epoch": 0.8177563699061277, "percentage": 81.78, "elapsed_time": "5 days, 17:05:55", "remaining_time": "1 day, 6:32:23", "throughput": 2733.57, "total_tokens": 1349166784} {"current_steps": 7471, "total_steps": 9134, "loss": 0.9876, "learning_rate": 3.979233481415848e-06, "epoch": 0.8178658419770656, "percentage": 81.79, "elapsed_time": "5 days, 17:06:54", "remaining_time": "1 day, 6:31:15", "throughput": 2733.55, "total_tokens": 1349322240} {"current_steps": 7472, "total_steps": 9134, "loss": 0.8015, "learning_rate": 3.974580305611808e-06, "epoch": 0.8179753140480035, "percentage": 81.8, "elapsed_time": "5 days, 17:07:57", "remaining_time": "1 day, 6:30:08", "throughput": 2733.57, "total_tokens": 1349502784} {"current_steps": 7473, "total_steps": 9134, "loss": 0.9212, "learning_rate": 3.9699296170747245e-06, "epoch": 0.8180847861189414, "percentage": 81.82, "elapsed_time": "5 days, 17:08:58", "remaining_time": "1 day, 6:29:01", "throughput": 2733.55, "total_tokens": 1349659808} {"current_steps": 7474, "total_steps": 9134, "loss": 0.8054, "learning_rate": 3.965281416354757e-06, "epoch": 0.8181942581898793, "percentage": 81.83, "elapsed_time": "5 days, 17:10:00", "remaining_time": "1 day, 6:27:54", "throughput": 2733.55, "total_tokens": 1349826464} {"current_steps": 7475, "total_steps": 9134, "loss": 0.9847, "learning_rate": 3.9606357040018e-06, "epoch": 0.8183037302608173, "percentage": 81.84, "elapsed_time": "5 days, 17:11:02", "remaining_time": "1 day, 6:26:47", "throughput": 2733.56, "total_tokens": 1350000736} {"current_steps": 7476, "total_steps": 9134, "loss": 0.9934, "learning_rate": 3.955992480565407e-06, "epoch": 0.8184132023317551, "percentage": 81.85, "elapsed_time": "5 days, 17:12:09", "remaining_time": "1 day, 6:25:41", "throughput": 2733.57, "total_tokens": 1350188448} {"current_steps": 7477, "total_steps": 9134, "loss": 0.6949, "learning_rate": 3.951351746594883e-06, "epoch": 0.818522674402693, "percentage": 81.86, "elapsed_time": "5 days, 17:13:14", "remaining_time": "1 day, 6:24:35", "throughput": 2733.56, "total_tokens": 1350362272} {"current_steps": 7478, "total_steps": 9134, "loss": 0.7585, "learning_rate": 3.9467135026392015e-06, "epoch": 0.8186321464736309, "percentage": 81.87, "elapsed_time": "5 days, 17:14:21", "remaining_time": "1 day, 6:23:29", "throughput": 2733.58, "total_tokens": 1350558496} {"current_steps": 7479, "total_steps": 9134, "loss": 1.0478, "learning_rate": 3.94207774924707e-06, "epoch": 0.8187416185445688, "percentage": 81.88, "elapsed_time": "5 days, 17:15:24", "remaining_time": "1 day, 6:22:22", "throughput": 2733.58, "total_tokens": 1350728736} {"current_steps": 7480, "total_steps": 9134, "loss": 1.0816, "learning_rate": 3.937444486966885e-06, "epoch": 0.8188510906155068, "percentage": 81.89, "elapsed_time": "5 days, 17:16:29", "remaining_time": "1 day, 6:21:16", "throughput": 2733.63, "total_tokens": 1350930112} {"current_steps": 7481, "total_steps": 9134, "loss": 0.5673, "learning_rate": 3.932813716346751e-06, "epoch": 0.8189605626864446, "percentage": 81.9, "elapsed_time": "5 days, 17:17:32", "remaining_time": "1 day, 6:20:09", "throughput": 2733.63, "total_tokens": 1351106848} {"current_steps": 7482, "total_steps": 9134, "loss": 0.7269, "learning_rate": 3.928185437934481e-06, "epoch": 0.8190700347573825, "percentage": 81.91, "elapsed_time": "5 days, 17:18:38", "remaining_time": "1 day, 6:19:03", "throughput": 2733.67, "total_tokens": 1351303296} {"current_steps": 7483, "total_steps": 9134, "loss": 0.9375, "learning_rate": 3.923559652277586e-06, "epoch": 0.8191795068283204, "percentage": 81.92, "elapsed_time": "5 days, 17:19:42", "remaining_time": "1 day, 6:17:57", "throughput": 2733.65, "total_tokens": 1351471296} {"current_steps": 7484, "total_steps": 9134, "loss": 0.8935, "learning_rate": 3.918936359923306e-06, "epoch": 0.8192889788992583, "percentage": 81.94, "elapsed_time": "5 days, 17:20:50", "remaining_time": "1 day, 6:16:51", "throughput": 2733.71, "total_tokens": 1351682976} {"current_steps": 7485, "total_steps": 9134, "loss": 0.7457, "learning_rate": 3.914315561418541e-06, "epoch": 0.8193984509701963, "percentage": 81.95, "elapsed_time": "5 days, 17:21:51", "remaining_time": "1 day, 6:15:44", "throughput": 2733.7, "total_tokens": 1351848736} {"current_steps": 7486, "total_steps": 9134, "loss": 0.8354, "learning_rate": 3.909697257309941e-06, "epoch": 0.8195079230411342, "percentage": 81.96, "elapsed_time": "5 days, 17:22:56", "remaining_time": "1 day, 6:14:38", "throughput": 2733.71, "total_tokens": 1352026816} {"current_steps": 7487, "total_steps": 9134, "loss": 0.7392, "learning_rate": 3.905081448143841e-06, "epoch": 0.819617395112072, "percentage": 81.97, "elapsed_time": "5 days, 17:23:56", "remaining_time": "1 day, 6:13:30", "throughput": 2733.7, "total_tokens": 1352186080} {"current_steps": 7488, "total_steps": 9134, "loss": 0.7189, "learning_rate": 3.9004681344662755e-06, "epoch": 0.8197268671830099, "percentage": 81.98, "elapsed_time": "5 days, 17:25:00", "remaining_time": "1 day, 6:12:24", "throughput": 2733.7, "total_tokens": 1352362368} {"current_steps": 7489, "total_steps": 9134, "loss": 0.8238, "learning_rate": 3.895857316822996e-06, "epoch": 0.8198363392539478, "percentage": 81.99, "elapsed_time": "5 days, 17:26:03", "remaining_time": "1 day, 6:11:17", "throughput": 2733.71, "total_tokens": 1352541568} {"current_steps": 7490, "total_steps": 9134, "loss": 0.8071, "learning_rate": 3.891248995759453e-06, "epoch": 0.8199458113248858, "percentage": 82.0, "elapsed_time": "5 days, 17:27:10", "remaining_time": "1 day, 6:10:11", "throughput": 2733.77, "total_tokens": 1352752576} {"current_steps": 7491, "total_steps": 9134, "loss": 0.8081, "learning_rate": 3.886643171820797e-06, "epoch": 0.8200552833958237, "percentage": 82.01, "elapsed_time": "5 days, 17:28:14", "remaining_time": "1 day, 6:09:05", "throughput": 2733.73, "total_tokens": 1352907808} {"current_steps": 7492, "total_steps": 9134, "loss": 0.8746, "learning_rate": 3.882039845551888e-06, "epoch": 0.8201647554667616, "percentage": 82.02, "elapsed_time": "5 days, 17:29:17", "remaining_time": "1 day, 6:07:58", "throughput": 2733.77, "total_tokens": 1353098208} {"current_steps": 7493, "total_steps": 9134, "loss": 0.936, "learning_rate": 3.877439017497303e-06, "epoch": 0.8202742275376994, "percentage": 82.03, "elapsed_time": "5 days, 17:30:23", "remaining_time": "1 day, 6:06:52", "throughput": 2733.79, "total_tokens": 1353287936} {"current_steps": 7494, "total_steps": 9134, "loss": 0.8818, "learning_rate": 3.872840688201299e-06, "epoch": 0.8203836996086373, "percentage": 82.05, "elapsed_time": "5 days, 17:31:29", "remaining_time": "1 day, 6:05:46", "throughput": 2733.76, "total_tokens": 1353456384} {"current_steps": 7495, "total_steps": 9134, "loss": 1.0529, "learning_rate": 3.868244858207854e-06, "epoch": 0.8204931716795753, "percentage": 82.06, "elapsed_time": "5 days, 17:32:32", "remaining_time": "1 day, 6:04:39", "throughput": 2733.77, "total_tokens": 1353632224} {"current_steps": 7496, "total_steps": 9134, "loss": 0.793, "learning_rate": 3.863651528060647e-06, "epoch": 0.8206026437505132, "percentage": 82.07, "elapsed_time": "5 days, 17:33:38", "remaining_time": "1 day, 6:03:33", "throughput": 2733.75, "total_tokens": 1353804480} {"current_steps": 7497, "total_steps": 9134, "loss": 1.0167, "learning_rate": 3.859060698303058e-06, "epoch": 0.8207121158214511, "percentage": 82.08, "elapsed_time": "5 days, 17:34:39", "remaining_time": "1 day, 6:02:26", "throughput": 2733.75, "total_tokens": 1353968000} {"current_steps": 7498, "total_steps": 9134, "loss": 0.5841, "learning_rate": 3.8544723694781706e-06, "epoch": 0.8208215878923889, "percentage": 82.09, "elapsed_time": "5 days, 17:35:42", "remaining_time": "1 day, 6:01:19", "throughput": 2733.74, "total_tokens": 1354139136} {"current_steps": 7499, "total_steps": 9134, "loss": 0.9554, "learning_rate": 3.849886542128784e-06, "epoch": 0.8209310599633268, "percentage": 82.1, "elapsed_time": "5 days, 17:36:49", "remaining_time": "1 day, 6:00:13", "throughput": 2733.78, "total_tokens": 1354338944} {"current_steps": 7500, "total_steps": 9134, "loss": 0.9102, "learning_rate": 3.845303216797377e-06, "epoch": 0.8210405320342647, "percentage": 82.11, "elapsed_time": "5 days, 17:37:52", "remaining_time": "1 day, 5:59:07", "throughput": 2733.76, "total_tokens": 1354505152} {"current_steps": 7501, "total_steps": 9134, "loss": 0.885, "learning_rate": 3.8407223940261725e-06, "epoch": 0.8211500041052027, "percentage": 82.12, "elapsed_time": "5 days, 17:38:59", "remaining_time": "1 day, 5:58:01", "throughput": 2733.8, "total_tokens": 1354704512} {"current_steps": 7502, "total_steps": 9134, "loss": 0.9483, "learning_rate": 3.8361440743570456e-06, "epoch": 0.8212594761761406, "percentage": 82.13, "elapsed_time": "5 days, 17:40:03", "remaining_time": "1 day, 5:56:54", "throughput": 2733.84, "total_tokens": 1354901408} {"current_steps": 7503, "total_steps": 9134, "loss": 0.8181, "learning_rate": 3.8315682583316224e-06, "epoch": 0.8213689482470785, "percentage": 82.14, "elapsed_time": "5 days, 17:41:06", "remaining_time": "1 day, 5:55:47", "throughput": 2733.83, "total_tokens": 1355066720} {"current_steps": 7504, "total_steps": 9134, "loss": 0.9978, "learning_rate": 3.826994946491208e-06, "epoch": 0.8214784203180163, "percentage": 82.15, "elapsed_time": "5 days, 17:42:12", "remaining_time": "1 day, 5:54:41", "throughput": 2733.85, "total_tokens": 1355258688} {"current_steps": 7505, "total_steps": 9134, "loss": 0.6953, "learning_rate": 3.822424139376815e-06, "epoch": 0.8215878923889542, "percentage": 82.17, "elapsed_time": "5 days, 17:43:17", "remaining_time": "1 day, 5:53:35", "throughput": 2733.89, "total_tokens": 1355456704} {"current_steps": 7506, "total_steps": 9134, "loss": 0.8468, "learning_rate": 3.817855837529164e-06, "epoch": 0.8216973644598922, "percentage": 82.18, "elapsed_time": "5 days, 17:44:23", "remaining_time": "1 day, 5:52:29", "throughput": 2733.9, "total_tokens": 1355641280} {"current_steps": 7507, "total_steps": 9134, "loss": 0.9035, "learning_rate": 3.8132900414886653e-06, "epoch": 0.8218068365308301, "percentage": 82.19, "elapsed_time": "5 days, 17:45:24", "remaining_time": "1 day, 5:51:22", "throughput": 2733.91, "total_tokens": 1355810848} {"current_steps": 7508, "total_steps": 9134, "loss": 0.8664, "learning_rate": 3.8087267517954633e-06, "epoch": 0.821916308601768, "percentage": 82.2, "elapsed_time": "5 days, 17:46:30", "remaining_time": "1 day, 5:50:16", "throughput": 2733.9, "total_tokens": 1355988032} {"current_steps": 7509, "total_steps": 9134, "loss": 0.8168, "learning_rate": 3.8041659689893677e-06, "epoch": 0.8220257806727059, "percentage": 82.21, "elapsed_time": "5 days, 17:47:36", "remaining_time": "1 day, 5:49:10", "throughput": 2733.92, "total_tokens": 1356180672} {"current_steps": 7510, "total_steps": 9134, "loss": 0.7194, "learning_rate": 3.799607693609927e-06, "epoch": 0.8221352527436437, "percentage": 82.22, "elapsed_time": "5 days, 17:48:39", "remaining_time": "1 day, 5:48:03", "throughput": 2733.91, "total_tokens": 1356344416} {"current_steps": 7511, "total_steps": 9134, "loss": 0.7303, "learning_rate": 3.795051926196358e-06, "epoch": 0.8222447248145817, "percentage": 82.23, "elapsed_time": "5 days, 17:49:37", "remaining_time": "1 day, 5:46:55", "throughput": 2733.89, "total_tokens": 1356494048} {"current_steps": 7512, "total_steps": 9134, "loss": 1.0664, "learning_rate": 3.7904986672876146e-06, "epoch": 0.8223541968855196, "percentage": 82.24, "elapsed_time": "5 days, 17:50:43", "remaining_time": "1 day, 5:45:49", "throughput": 2733.89, "total_tokens": 1356677504} {"current_steps": 7513, "total_steps": 9134, "loss": 0.8093, "learning_rate": 3.7859479174223333e-06, "epoch": 0.8224636689564575, "percentage": 82.25, "elapsed_time": "5 days, 17:51:47", "remaining_time": "1 day, 5:44:43", "throughput": 2733.91, "total_tokens": 1356860960} {"current_steps": 7514, "total_steps": 9134, "loss": 0.8858, "learning_rate": 3.7813996771388583e-06, "epoch": 0.8225731410273954, "percentage": 82.26, "elapsed_time": "5 days, 17:52:55", "remaining_time": "1 day, 5:43:37", "throughput": 2733.94, "total_tokens": 1357061888} {"current_steps": 7515, "total_steps": 9134, "loss": 1.0126, "learning_rate": 3.7768539469752397e-06, "epoch": 0.8226826130983332, "percentage": 82.28, "elapsed_time": "5 days, 17:54:00", "remaining_time": "1 day, 5:42:30", "throughput": 2733.91, "total_tokens": 1357222720} {"current_steps": 7516, "total_steps": 9134, "loss": 0.8464, "learning_rate": 3.7723107274692193e-06, "epoch": 0.8227920851692712, "percentage": 82.29, "elapsed_time": "5 days, 17:55:03", "remaining_time": "1 day, 5:41:24", "throughput": 2733.93, "total_tokens": 1357406848} {"current_steps": 7517, "total_steps": 9134, "loss": 0.8982, "learning_rate": 3.767770019158273e-06, "epoch": 0.8229015572402091, "percentage": 82.3, "elapsed_time": "5 days, 17:56:08", "remaining_time": "1 day, 5:40:18", "throughput": 2733.93, "total_tokens": 1357585824} {"current_steps": 7518, "total_steps": 9134, "loss": 0.8991, "learning_rate": 3.76323182257953e-06, "epoch": 0.823011029311147, "percentage": 82.31, "elapsed_time": "5 days, 17:57:15", "remaining_time": "1 day, 5:39:12", "throughput": 2733.99, "total_tokens": 1357799968} {"current_steps": 7519, "total_steps": 9134, "loss": 0.839, "learning_rate": 3.758696138269874e-06, "epoch": 0.8231205013820849, "percentage": 82.32, "elapsed_time": "5 days, 17:58:17", "remaining_time": "1 day, 5:38:05", "throughput": 2733.98, "total_tokens": 1357962816} {"current_steps": 7520, "total_steps": 9134, "loss": 0.6424, "learning_rate": 3.7541629667658564e-06, "epoch": 0.8232299734530228, "percentage": 82.33, "elapsed_time": "5 days, 17:59:20", "remaining_time": "1 day, 5:36:58", "throughput": 2734.0, "total_tokens": 1358142688} {"current_steps": 7521, "total_steps": 9134, "loss": 0.8478, "learning_rate": 3.7496323086037456e-06, "epoch": 0.8233394455239607, "percentage": 82.34, "elapsed_time": "5 days, 18:00:25", "remaining_time": "1 day, 5:35:52", "throughput": 2733.99, "total_tokens": 1358314720} {"current_steps": 7522, "total_steps": 9134, "loss": 0.8221, "learning_rate": 3.7451041643195074e-06, "epoch": 0.8234489175948986, "percentage": 82.35, "elapsed_time": "5 days, 18:01:26", "remaining_time": "1 day, 5:34:45", "throughput": 2733.95, "total_tokens": 1358465024} {"current_steps": 7523, "total_steps": 9134, "loss": 0.9457, "learning_rate": 3.7405785344488157e-06, "epoch": 0.8235583896658365, "percentage": 82.36, "elapsed_time": "5 days, 18:02:29", "remaining_time": "1 day, 5:33:38", "throughput": 2733.96, "total_tokens": 1358640640} {"current_steps": 7524, "total_steps": 9134, "loss": 0.75, "learning_rate": 3.7360554195270403e-06, "epoch": 0.8236678617367744, "percentage": 82.37, "elapsed_time": "5 days, 18:03:35", "remaining_time": "1 day, 5:32:32", "throughput": 2733.99, "total_tokens": 1358835520} {"current_steps": 7525, "total_steps": 9134, "loss": 1.0283, "learning_rate": 3.731534820089255e-06, "epoch": 0.8237773338077123, "percentage": 82.38, "elapsed_time": "5 days, 18:04:37", "remaining_time": "1 day, 5:31:25", "throughput": 2734.0, "total_tokens": 1359009792} {"current_steps": 7526, "total_steps": 9134, "loss": 0.9679, "learning_rate": 3.727016736670247e-06, "epoch": 0.8238868058786503, "percentage": 82.4, "elapsed_time": "5 days, 18:05:42", "remaining_time": "1 day, 5:30:19", "throughput": 2734.01, "total_tokens": 1359193472} {"current_steps": 7527, "total_steps": 9134, "loss": 1.0486, "learning_rate": 3.722501169804493e-06, "epoch": 0.8239962779495881, "percentage": 82.41, "elapsed_time": "5 days, 18:06:47", "remaining_time": "1 day, 5:29:12", "throughput": 2734.04, "total_tokens": 1359382080} {"current_steps": 7528, "total_steps": 9134, "loss": 0.8244, "learning_rate": 3.7179881200261753e-06, "epoch": 0.824105750020526, "percentage": 82.42, "elapsed_time": "5 days, 18:07:52", "remaining_time": "1 day, 5:28:06", "throughput": 2734.05, "total_tokens": 1359566208} {"current_steps": 7529, "total_steps": 9134, "loss": 0.8143, "learning_rate": 3.7134775878691767e-06, "epoch": 0.8242152220914639, "percentage": 82.43, "elapsed_time": "5 days, 18:08:56", "remaining_time": "1 day, 5:27:00", "throughput": 2734.03, "total_tokens": 1359730848} {"current_steps": 7530, "total_steps": 9134, "loss": 0.6925, "learning_rate": 3.708969573867088e-06, "epoch": 0.8243246941624018, "percentage": 82.44, "elapsed_time": "5 days, 18:10:03", "remaining_time": "1 day, 5:25:54", "throughput": 2734.02, "total_tokens": 1359911392} {"current_steps": 7531, "total_steps": 9134, "loss": 1.038, "learning_rate": 3.7044640785531966e-06, "epoch": 0.8244341662333398, "percentage": 82.45, "elapsed_time": "5 days, 18:11:09", "remaining_time": "1 day, 5:24:48", "throughput": 2734.06, "total_tokens": 1360111648} {"current_steps": 7532, "total_steps": 9134, "loss": 0.6033, "learning_rate": 3.699961102460495e-06, "epoch": 0.8245436383042776, "percentage": 82.46, "elapsed_time": "5 days, 18:12:13", "remaining_time": "1 day, 5:23:41", "throughput": 2734.08, "total_tokens": 1360298688} {"current_steps": 7533, "total_steps": 9134, "loss": 0.8414, "learning_rate": 3.6954606461216706e-06, "epoch": 0.8246531103752155, "percentage": 82.47, "elapsed_time": "5 days, 18:13:20", "remaining_time": "1 day, 5:22:35", "throughput": 2734.07, "total_tokens": 1360473856} {"current_steps": 7534, "total_steps": 9134, "loss": 0.8728, "learning_rate": 3.6909627100691293e-06, "epoch": 0.8247625824461534, "percentage": 82.48, "elapsed_time": "5 days, 18:14:28", "remaining_time": "1 day, 5:21:30", "throughput": 2734.11, "total_tokens": 1360681952} {"current_steps": 7535, "total_steps": 9134, "loss": 0.9224, "learning_rate": 3.686467294834964e-06, "epoch": 0.8248720545170913, "percentage": 82.49, "elapsed_time": "5 days, 18:15:31", "remaining_time": "1 day, 5:20:23", "throughput": 2734.09, "total_tokens": 1360843232} {"current_steps": 7536, "total_steps": 9134, "loss": 0.9103, "learning_rate": 3.6819744009509715e-06, "epoch": 0.8249815265880293, "percentage": 82.5, "elapsed_time": "5 days, 18:16:35", "remaining_time": "1 day, 5:19:17", "throughput": 2734.05, "total_tokens": 1360996448} {"current_steps": 7537, "total_steps": 9134, "loss": 0.816, "learning_rate": 3.677484028948658e-06, "epoch": 0.8250909986589672, "percentage": 82.52, "elapsed_time": "5 days, 18:17:40", "remaining_time": "1 day, 5:18:10", "throughput": 2734.04, "total_tokens": 1361169600} {"current_steps": 7538, "total_steps": 9134, "loss": 0.8759, "learning_rate": 3.67299617935922e-06, "epoch": 0.825200470729905, "percentage": 82.53, "elapsed_time": "5 days, 18:18:45", "remaining_time": "1 day, 5:17:04", "throughput": 2734.03, "total_tokens": 1361341856} {"current_steps": 7539, "total_steps": 9134, "loss": 0.8793, "learning_rate": 3.6685108527135635e-06, "epoch": 0.8253099428008429, "percentage": 82.54, "elapsed_time": "5 days, 18:19:47", "remaining_time": "1 day, 5:15:57", "throughput": 2734.02, "total_tokens": 1361507168} {"current_steps": 7540, "total_steps": 9134, "loss": 0.8645, "learning_rate": 3.664028049542287e-06, "epoch": 0.8254194148717808, "percentage": 82.55, "elapsed_time": "5 days, 18:20:50", "remaining_time": "1 day, 5:14:50", "throughput": 2734.02, "total_tokens": 1361678528} {"current_steps": 7541, "total_steps": 9134, "loss": 0.9495, "learning_rate": 3.659547770375718e-06, "epoch": 0.8255288869427188, "percentage": 82.56, "elapsed_time": "5 days, 18:21:54", "remaining_time": "1 day, 5:13:44", "throughput": 2734.04, "total_tokens": 1361865792} {"current_steps": 7542, "total_steps": 9134, "loss": 1.0012, "learning_rate": 3.655070015743839e-06, "epoch": 0.8256383590136567, "percentage": 82.57, "elapsed_time": "5 days, 18:22:57", "remaining_time": "1 day, 5:12:37", "throughput": 2734.06, "total_tokens": 1362046336} {"current_steps": 7543, "total_steps": 9134, "loss": 0.8556, "learning_rate": 3.6505947861763867e-06, "epoch": 0.8257478310845946, "percentage": 82.58, "elapsed_time": "5 days, 18:23:58", "remaining_time": "1 day, 5:11:30", "throughput": 2734.03, "total_tokens": 1362197984} {"current_steps": 7544, "total_steps": 9134, "loss": 0.8818, "learning_rate": 3.6461220822027437e-06, "epoch": 0.8258573031555324, "percentage": 82.59, "elapsed_time": "5 days, 18:25:02", "remaining_time": "1 day, 5:10:23", "throughput": 2734.03, "total_tokens": 1362373600} {"current_steps": 7545, "total_steps": 9134, "loss": 0.6813, "learning_rate": 3.641651904352045e-06, "epoch": 0.8259667752264703, "percentage": 82.6, "elapsed_time": "5 days, 18:26:07", "remaining_time": "1 day, 5:09:17", "throughput": 2734.01, "total_tokens": 1362539136} {"current_steps": 7546, "total_steps": 9134, "loss": 1.0741, "learning_rate": 3.637184253153095e-06, "epoch": 0.8260762472974083, "percentage": 82.61, "elapsed_time": "5 days, 18:27:11", "remaining_time": "1 day, 5:08:11", "throughput": 2733.97, "total_tokens": 1362695264} {"current_steps": 7547, "total_steps": 9134, "loss": 0.7019, "learning_rate": 3.6327191291344015e-06, "epoch": 0.8261857193683462, "percentage": 82.63, "elapsed_time": "5 days, 18:28:15", "remaining_time": "1 day, 5:07:04", "throughput": 2734.0, "total_tokens": 1362886112} {"current_steps": 7548, "total_steps": 9134, "loss": 0.9411, "learning_rate": 3.6282565328242007e-06, "epoch": 0.8262951914392841, "percentage": 82.64, "elapsed_time": "5 days, 18:29:19", "remaining_time": "1 day, 5:05:58", "throughput": 2734.04, "total_tokens": 1363078752} {"current_steps": 7549, "total_steps": 9134, "loss": 0.8995, "learning_rate": 3.623796464750384e-06, "epoch": 0.8264046635102219, "percentage": 82.65, "elapsed_time": "5 days, 18:30:23", "remaining_time": "1 day, 5:04:51", "throughput": 2734.03, "total_tokens": 1363248320} {"current_steps": 7550, "total_steps": 9134, "loss": 0.9078, "learning_rate": 3.6193389254405934e-06, "epoch": 0.8265141355811598, "percentage": 82.66, "elapsed_time": "5 days, 18:31:29", "remaining_time": "1 day, 5:03:45", "throughput": 2734.04, "total_tokens": 1363435808} {"current_steps": 7551, "total_steps": 9134, "loss": 0.6517, "learning_rate": 3.6148839154221236e-06, "epoch": 0.8266236076520977, "percentage": 82.67, "elapsed_time": "5 days, 18:32:34", "remaining_time": "1 day, 5:02:39", "throughput": 2734.02, "total_tokens": 1363602688} {"current_steps": 7552, "total_steps": 9134, "loss": 0.7979, "learning_rate": 3.610431435222017e-06, "epoch": 0.8267330797230357, "percentage": 82.68, "elapsed_time": "5 days, 18:33:39", "remaining_time": "1 day, 5:01:33", "throughput": 2734.03, "total_tokens": 1363788384} {"current_steps": 7553, "total_steps": 9134, "loss": 0.7443, "learning_rate": 3.605981485366969e-06, "epoch": 0.8268425517939736, "percentage": 82.69, "elapsed_time": "5 days, 18:34:43", "remaining_time": "1 day, 5:00:26", "throughput": 2734.0, "total_tokens": 1363944288} {"current_steps": 7554, "total_steps": 9134, "loss": 0.9126, "learning_rate": 3.601534066383419e-06, "epoch": 0.8269520238649115, "percentage": 82.7, "elapsed_time": "5 days, 18:35:49", "remaining_time": "1 day, 4:59:20", "throughput": 2734.01, "total_tokens": 1364135360} {"current_steps": 7555, "total_steps": 9134, "loss": 0.761, "learning_rate": 3.597089178797483e-06, "epoch": 0.8270614959358493, "percentage": 82.71, "elapsed_time": "5 days, 18:36:54", "remaining_time": "1 day, 4:58:14", "throughput": 2734.03, "total_tokens": 1364321280} {"current_steps": 7556, "total_steps": 9134, "loss": 1.2141, "learning_rate": 3.5926468231349817e-06, "epoch": 0.8271709680067872, "percentage": 82.72, "elapsed_time": "5 days, 18:37:59", "remaining_time": "1 day, 4:57:08", "throughput": 2734.06, "total_tokens": 1364514816} {"current_steps": 7557, "total_steps": 9134, "loss": 0.7947, "learning_rate": 3.5882069999214366e-06, "epoch": 0.8272804400777252, "percentage": 82.73, "elapsed_time": "5 days, 18:39:04", "remaining_time": "1 day, 4:56:01", "throughput": 2734.1, "total_tokens": 1364708800} {"current_steps": 7558, "total_steps": 9134, "loss": 0.8245, "learning_rate": 3.583769709682064e-06, "epoch": 0.8273899121486631, "percentage": 82.75, "elapsed_time": "5 days, 18:40:09", "remaining_time": "1 day, 4:54:55", "throughput": 2734.13, "total_tokens": 1364902784} {"current_steps": 7559, "total_steps": 9134, "loss": 0.8493, "learning_rate": 3.579334952941807e-06, "epoch": 0.827499384219601, "percentage": 82.76, "elapsed_time": "5 days, 18:41:13", "remaining_time": "1 day, 4:53:49", "throughput": 2734.11, "total_tokens": 1365069888} {"current_steps": 7560, "total_steps": 9134, "loss": 0.8438, "learning_rate": 3.574902730225263e-06, "epoch": 0.8276088562905389, "percentage": 82.77, "elapsed_time": "5 days, 18:42:15", "remaining_time": "1 day, 4:52:42", "throughput": 2734.12, "total_tokens": 1365244608} {"current_steps": 7561, "total_steps": 9134, "loss": 0.9277, "learning_rate": 3.570473042056777e-06, "epoch": 0.8277183283614767, "percentage": 82.78, "elapsed_time": "5 days, 18:43:22", "remaining_time": "1 day, 4:51:36", "throughput": 2734.14, "total_tokens": 1365436800} {"current_steps": 7562, "total_steps": 9134, "loss": 0.9307, "learning_rate": 3.5660458889603594e-06, "epoch": 0.8278278004324147, "percentage": 82.79, "elapsed_time": "5 days, 18:44:28", "remaining_time": "1 day, 4:50:30", "throughput": 2734.13, "total_tokens": 1365613984} {"current_steps": 7563, "total_steps": 9134, "loss": 0.8611, "learning_rate": 3.561621271459742e-06, "epoch": 0.8279372725033526, "percentage": 82.8, "elapsed_time": "5 days, 18:45:36", "remaining_time": "1 day, 4:49:24", "throughput": 2734.16, "total_tokens": 1365812448} {"current_steps": 7564, "total_steps": 9134, "loss": 0.9351, "learning_rate": 3.557199190078342e-06, "epoch": 0.8280467445742905, "percentage": 82.81, "elapsed_time": "5 days, 18:46:43", "remaining_time": "1 day, 4:48:18", "throughput": 2734.15, "total_tokens": 1365991872} {"current_steps": 7565, "total_steps": 9134, "loss": 0.9575, "learning_rate": 3.5527796453392882e-06, "epoch": 0.8281562166452284, "percentage": 82.82, "elapsed_time": "5 days, 18:47:50", "remaining_time": "1 day, 4:47:12", "throughput": 2734.13, "total_tokens": 1366165248} {"current_steps": 7566, "total_steps": 9134, "loss": 0.9666, "learning_rate": 3.548362637765401e-06, "epoch": 0.8282656887161662, "percentage": 82.83, "elapsed_time": "5 days, 18:48:58", "remaining_time": "1 day, 4:46:07", "throughput": 2734.13, "total_tokens": 1366350496} {"current_steps": 7567, "total_steps": 9134, "loss": 0.8587, "learning_rate": 3.543948167879202e-06, "epoch": 0.8283751607871042, "percentage": 82.84, "elapsed_time": "5 days, 18:50:00", "remaining_time": "1 day, 4:45:00", "throughput": 2734.13, "total_tokens": 1366517376} {"current_steps": 7568, "total_steps": 9134, "loss": 0.7803, "learning_rate": 3.5395362362029198e-06, "epoch": 0.8284846328580421, "percentage": 82.86, "elapsed_time": "5 days, 18:51:01", "remaining_time": "1 day, 4:43:53", "throughput": 2734.1, "total_tokens": 1366671712} {"current_steps": 7569, "total_steps": 9134, "loss": 0.6866, "learning_rate": 3.5351268432584796e-06, "epoch": 0.82859410492898, "percentage": 82.87, "elapsed_time": "5 days, 18:52:01", "remaining_time": "1 day, 4:42:46", "throughput": 2734.08, "total_tokens": 1366827616} {"current_steps": 7570, "total_steps": 9134, "loss": 0.9221, "learning_rate": 3.5307199895674963e-06, "epoch": 0.8287035769999179, "percentage": 82.88, "elapsed_time": "5 days, 18:53:03", "remaining_time": "1 day, 4:41:39", "throughput": 2734.08, "total_tokens": 1366995616} {"current_steps": 7571, "total_steps": 9134, "loss": 0.9502, "learning_rate": 3.5263156756512983e-06, "epoch": 0.8288130490708558, "percentage": 82.89, "elapsed_time": "5 days, 18:54:08", "remaining_time": "1 day, 4:40:32", "throughput": 2734.1, "total_tokens": 1367181536} {"current_steps": 7572, "total_steps": 9134, "loss": 0.859, "learning_rate": 3.521913902030902e-06, "epoch": 0.8289225211417937, "percentage": 82.9, "elapsed_time": "5 days, 18:55:13", "remaining_time": "1 day, 4:39:26", "throughput": 2734.1, "total_tokens": 1367358496} {"current_steps": 7573, "total_steps": 9134, "loss": 0.8655, "learning_rate": 3.5175146692270344e-06, "epoch": 0.8290319932127316, "percentage": 82.91, "elapsed_time": "5 days, 18:56:16", "remaining_time": "1 day, 4:38:19", "throughput": 2734.12, "total_tokens": 1367540832} {"current_steps": 7574, "total_steps": 9134, "loss": 0.808, "learning_rate": 3.5131179777601136e-06, "epoch": 0.8291414652836695, "percentage": 82.92, "elapsed_time": "5 days, 18:57:21", "remaining_time": "1 day, 4:37:13", "throughput": 2734.13, "total_tokens": 1367724960} {"current_steps": 7575, "total_steps": 9134, "loss": 0.7754, "learning_rate": 3.508723828150254e-06, "epoch": 0.8292509373546074, "percentage": 82.93, "elapsed_time": "5 days, 18:58:22", "remaining_time": "1 day, 4:36:06", "throughput": 2734.07, "total_tokens": 1367863616} {"current_steps": 7576, "total_steps": 9134, "loss": 1.0484, "learning_rate": 3.504332220917289e-06, "epoch": 0.8293604094255453, "percentage": 82.94, "elapsed_time": "5 days, 18:59:30", "remaining_time": "1 day, 4:35:00", "throughput": 2734.13, "total_tokens": 1368075072} {"current_steps": 7577, "total_steps": 9134, "loss": 0.9036, "learning_rate": 3.499943156580726e-06, "epoch": 0.8294698814964833, "percentage": 82.95, "elapsed_time": "5 days, 19:00:31", "remaining_time": "1 day, 4:33:53", "throughput": 2734.13, "total_tokens": 1368244192} {"current_steps": 7578, "total_steps": 9134, "loss": 1.1906, "learning_rate": 3.4955566356597887e-06, "epoch": 0.8295793535674211, "percentage": 82.96, "elapsed_time": "5 days, 19:01:35", "remaining_time": "1 day, 4:32:47", "throughput": 2734.09, "total_tokens": 1368401888} {"current_steps": 7579, "total_steps": 9134, "loss": 1.1065, "learning_rate": 3.491172658673392e-06, "epoch": 0.829688825638359, "percentage": 82.98, "elapsed_time": "5 days, 19:02:39", "remaining_time": "1 day, 4:31:40", "throughput": 2734.1, "total_tokens": 1368578848} {"current_steps": 7580, "total_steps": 9134, "loss": 0.903, "learning_rate": 3.4867912261401458e-06, "epoch": 0.8297982977092969, "percentage": 82.99, "elapsed_time": "5 days, 19:03:46", "remaining_time": "1 day, 4:30:35", "throughput": 2734.11, "total_tokens": 1368767680} {"current_steps": 7581, "total_steps": 9134, "loss": 0.7845, "learning_rate": 3.4824123385783807e-06, "epoch": 0.8299077697802348, "percentage": 83.0, "elapsed_time": "5 days, 19:04:47", "remaining_time": "1 day, 4:29:27", "throughput": 2734.11, "total_tokens": 1368932992} {"current_steps": 7582, "total_steps": 9134, "loss": 0.7248, "learning_rate": 3.4780359965060934e-06, "epoch": 0.8300172418511728, "percentage": 83.01, "elapsed_time": "5 days, 19:05:49", "remaining_time": "1 day, 4:28:21", "throughput": 2734.09, "total_tokens": 1369096064} {"current_steps": 7583, "total_steps": 9134, "loss": 0.8587, "learning_rate": 3.4736622004410136e-06, "epoch": 0.8301267139221106, "percentage": 83.02, "elapsed_time": "5 days, 19:06:56", "remaining_time": "1 day, 4:27:15", "throughput": 2734.12, "total_tokens": 1369294752} {"current_steps": 7584, "total_steps": 9134, "loss": 0.9185, "learning_rate": 3.469290950900533e-06, "epoch": 0.8302361859930485, "percentage": 83.03, "elapsed_time": "5 days, 19:08:00", "remaining_time": "1 day, 4:26:08", "throughput": 2734.13, "total_tokens": 1369470816} {"current_steps": 7585, "total_steps": 9134, "loss": 1.2163, "learning_rate": 3.4649222484017836e-06, "epoch": 0.8303456580639864, "percentage": 83.04, "elapsed_time": "5 days, 19:09:07", "remaining_time": "1 day, 4:25:02", "throughput": 2734.17, "total_tokens": 1369676448} {"current_steps": 7586, "total_steps": 9134, "loss": 0.8272, "learning_rate": 3.460556093461556e-06, "epoch": 0.8304551301349243, "percentage": 83.05, "elapsed_time": "5 days, 19:10:12", "remaining_time": "1 day, 4:23:56", "throughput": 2734.15, "total_tokens": 1369842656} {"current_steps": 7587, "total_steps": 9134, "loss": 0.8145, "learning_rate": 3.4561924865963685e-06, "epoch": 0.8305646022058623, "percentage": 83.06, "elapsed_time": "5 days, 19:11:14", "remaining_time": "1 day, 4:22:49", "throughput": 2734.17, "total_tokens": 1370022304} {"current_steps": 7588, "total_steps": 9134, "loss": 1.0451, "learning_rate": 3.4518314283224275e-06, "epoch": 0.8306740742768002, "percentage": 83.07, "elapsed_time": "5 days, 19:12:18", "remaining_time": "1 day, 4:21:43", "throughput": 2734.21, "total_tokens": 1370218752} {"current_steps": 7589, "total_steps": 9134, "loss": 0.6608, "learning_rate": 3.447472919155628e-06, "epoch": 0.830783546347738, "percentage": 83.09, "elapsed_time": "5 days, 19:13:23", "remaining_time": "1 day, 4:20:37", "throughput": 2734.19, "total_tokens": 1370383840} {"current_steps": 7590, "total_steps": 9134, "loss": 0.7695, "learning_rate": 3.443116959611592e-06, "epoch": 0.8308930184186759, "percentage": 83.1, "elapsed_time": "5 days, 19:14:28", "remaining_time": "1 day, 4:19:30", "throughput": 2734.17, "total_tokens": 1370551616} {"current_steps": 7591, "total_steps": 9134, "loss": 0.7232, "learning_rate": 3.438763550205601e-06, "epoch": 0.8310024904896138, "percentage": 83.11, "elapsed_time": "5 days, 19:15:29", "remaining_time": "1 day, 4:18:23", "throughput": 2734.13, "total_tokens": 1370696992} {"current_steps": 7592, "total_steps": 9134, "loss": 0.6909, "learning_rate": 3.4344126914526735e-06, "epoch": 0.8311119625605518, "percentage": 83.12, "elapsed_time": "5 days, 19:16:33", "remaining_time": "1 day, 4:17:17", "throughput": 2734.12, "total_tokens": 1370866560} {"current_steps": 7593, "total_steps": 9134, "loss": 1.0863, "learning_rate": 3.430064383867487e-06, "epoch": 0.8312214346314897, "percentage": 83.13, "elapsed_time": "5 days, 19:17:37", "remaining_time": "1 day, 4:16:10", "throughput": 2734.14, "total_tokens": 1371055392} {"current_steps": 7594, "total_steps": 9134, "loss": 0.8436, "learning_rate": 3.4257186279644554e-06, "epoch": 0.8313309067024276, "percentage": 83.14, "elapsed_time": "5 days, 19:18:41", "remaining_time": "1 day, 4:15:04", "throughput": 2734.12, "total_tokens": 1371222720} {"current_steps": 7595, "total_steps": 9134, "loss": 0.8846, "learning_rate": 3.4213754242576668e-06, "epoch": 0.8314403787733654, "percentage": 83.15, "elapsed_time": "5 days, 19:19:49", "remaining_time": "1 day, 4:13:58", "throughput": 2734.19, "total_tokens": 1371439328} {"current_steps": 7596, "total_steps": 9134, "loss": 0.7815, "learning_rate": 3.417034773260913e-06, "epoch": 0.8315498508443033, "percentage": 83.16, "elapsed_time": "5 days, 19:20:50", "remaining_time": "1 day, 4:12:51", "throughput": 2734.16, "total_tokens": 1371591200} {"current_steps": 7597, "total_steps": 9134, "loss": 1.1292, "learning_rate": 3.4126966754876867e-06, "epoch": 0.8316593229152413, "percentage": 83.17, "elapsed_time": "5 days, 19:21:55", "remaining_time": "1 day, 4:11:45", "throughput": 2734.17, "total_tokens": 1371776224} {"current_steps": 7598, "total_steps": 9134, "loss": 0.7694, "learning_rate": 3.4083611314511763e-06, "epoch": 0.8317687949861792, "percentage": 83.18, "elapsed_time": "5 days, 19:23:02", "remaining_time": "1 day, 4:10:39", "throughput": 2734.21, "total_tokens": 1371977600} {"current_steps": 7599, "total_steps": 9134, "loss": 0.9288, "learning_rate": 3.4040281416642672e-06, "epoch": 0.8318782670571171, "percentage": 83.19, "elapsed_time": "5 days, 19:24:04", "remaining_time": "1 day, 4:09:32", "throughput": 2734.21, "total_tokens": 1372148288} {"current_steps": 7600, "total_steps": 9134, "loss": 0.8855, "learning_rate": 3.3996977066395376e-06, "epoch": 0.8319877391280549, "percentage": 83.21, "elapsed_time": "5 days, 19:25:06", "remaining_time": "1 day, 4:08:25", "throughput": 2734.19, "total_tokens": 1372305536} {"current_steps": 7601, "total_steps": 9134, "loss": 0.6935, "learning_rate": 3.3953698268892857e-06, "epoch": 0.8320972111989928, "percentage": 83.22, "elapsed_time": "5 days, 19:26:11", "remaining_time": "1 day, 4:07:19", "throughput": 2734.19, "total_tokens": 1372483840} {"current_steps": 7602, "total_steps": 9134, "loss": 0.8322, "learning_rate": 3.391044502925478e-06, "epoch": 0.8322066832699307, "percentage": 83.23, "elapsed_time": "5 days, 19:27:19", "remaining_time": "1 day, 4:06:13", "throughput": 2734.23, "total_tokens": 1372691712} {"current_steps": 7603, "total_steps": 9134, "loss": 0.9013, "learning_rate": 3.3867217352597984e-06, "epoch": 0.8323161553408687, "percentage": 83.24, "elapsed_time": "5 days, 19:28:23", "remaining_time": "1 day, 4:05:07", "throughput": 2734.23, "total_tokens": 1372867104} {"current_steps": 7604, "total_steps": 9134, "loss": 0.9737, "learning_rate": 3.3824015244036222e-06, "epoch": 0.8324256274118066, "percentage": 83.25, "elapsed_time": "5 days, 19:29:30", "remaining_time": "1 day, 4:04:01", "throughput": 2734.25, "total_tokens": 1373060192} {"current_steps": 7605, "total_steps": 9134, "loss": 0.7662, "learning_rate": 3.3780838708680153e-06, "epoch": 0.8325350994827445, "percentage": 83.26, "elapsed_time": "5 days, 19:30:38", "remaining_time": "1 day, 4:02:55", "throughput": 2734.29, "total_tokens": 1373264704} {"current_steps": 7606, "total_steps": 9134, "loss": 0.831, "learning_rate": 3.373768775163755e-06, "epoch": 0.8326445715536823, "percentage": 83.27, "elapsed_time": "5 days, 19:31:34", "remaining_time": "1 day, 4:01:47", "throughput": 2734.22, "total_tokens": 1373380736} {"current_steps": 7607, "total_steps": 9134, "loss": 0.8734, "learning_rate": 3.3694562378013076e-06, "epoch": 0.8327540436246202, "percentage": 83.28, "elapsed_time": "5 days, 19:32:36", "remaining_time": "1 day, 4:00:41", "throughput": 2734.17, "total_tokens": 1373528576} {"current_steps": 7608, "total_steps": 9134, "loss": 0.8528, "learning_rate": 3.3651462592908275e-06, "epoch": 0.8328635156955582, "percentage": 83.29, "elapsed_time": "5 days, 19:33:43", "remaining_time": "1 day, 3:59:35", "throughput": 2734.21, "total_tokens": 1373733312} {"current_steps": 7609, "total_steps": 9134, "loss": 0.7326, "learning_rate": 3.3608388401421943e-06, "epoch": 0.8329729877664961, "percentage": 83.3, "elapsed_time": "5 days, 19:34:46", "remaining_time": "1 day, 3:58:28", "throughput": 2734.23, "total_tokens": 1373911168} {"current_steps": 7610, "total_steps": 9134, "loss": 0.8214, "learning_rate": 3.356533980864959e-06, "epoch": 0.833082459837434, "percentage": 83.32, "elapsed_time": "5 days, 19:35:54", "remaining_time": "1 day, 3:57:22", "throughput": 2734.25, "total_tokens": 1374110080} {"current_steps": 7611, "total_steps": 9134, "loss": 0.9811, "learning_rate": 3.352231681968379e-06, "epoch": 0.8331919319083719, "percentage": 83.33, "elapsed_time": "5 days, 19:36:55", "remaining_time": "1 day, 3:56:15", "throughput": 2734.25, "total_tokens": 1374275616} {"current_steps": 7612, "total_steps": 9134, "loss": 0.7587, "learning_rate": 3.347931943961405e-06, "epoch": 0.8333014039793097, "percentage": 83.34, "elapsed_time": "5 days, 19:38:03", "remaining_time": "1 day, 3:55:10", "throughput": 2734.25, "total_tokens": 1374459296} {"current_steps": 7613, "total_steps": 9134, "loss": 0.8577, "learning_rate": 3.3436347673526936e-06, "epoch": 0.8334108760502477, "percentage": 83.35, "elapsed_time": "5 days, 19:39:10", "remaining_time": "1 day, 3:54:04", "throughput": 2734.23, "total_tokens": 1374632672} {"current_steps": 7614, "total_steps": 9134, "loss": 0.721, "learning_rate": 3.3393401526505856e-06, "epoch": 0.8335203481211856, "percentage": 83.36, "elapsed_time": "5 days, 19:40:14", "remaining_time": "1 day, 3:52:58", "throughput": 2734.2, "total_tokens": 1374798432} {"current_steps": 7615, "total_steps": 9134, "loss": 1.0255, "learning_rate": 3.335048100363125e-06, "epoch": 0.8336298201921235, "percentage": 83.37, "elapsed_time": "5 days, 19:41:15", "remaining_time": "1 day, 3:51:50", "throughput": 2734.21, "total_tokens": 1374968224} {"current_steps": 7616, "total_steps": 9134, "loss": 0.9368, "learning_rate": 3.330758610998072e-06, "epoch": 0.8337392922630614, "percentage": 83.38, "elapsed_time": "5 days, 19:42:19", "remaining_time": "1 day, 3:50:44", "throughput": 2734.22, "total_tokens": 1375150112} {"current_steps": 7617, "total_steps": 9134, "loss": 0.8971, "learning_rate": 3.3264716850628375e-06, "epoch": 0.8338487643339992, "percentage": 83.39, "elapsed_time": "5 days, 19:43:24", "remaining_time": "1 day, 3:49:38", "throughput": 2734.24, "total_tokens": 1375333792} {"current_steps": 7618, "total_steps": 9134, "loss": 1.0951, "learning_rate": 3.322187323064574e-06, "epoch": 0.8339582364049372, "percentage": 83.4, "elapsed_time": "5 days, 19:44:29", "remaining_time": "1 day, 3:48:32", "throughput": 2734.26, "total_tokens": 1375522624} {"current_steps": 7619, "total_steps": 9134, "loss": 0.8395, "learning_rate": 3.3179055255101096e-06, "epoch": 0.8340677084758751, "percentage": 83.41, "elapsed_time": "5 days, 19:45:35", "remaining_time": "1 day, 3:47:26", "throughput": 2734.27, "total_tokens": 1375707872} {"current_steps": 7620, "total_steps": 9134, "loss": 0.8208, "learning_rate": 3.3136262929059746e-06, "epoch": 0.834177180546813, "percentage": 83.42, "elapsed_time": "5 days, 19:46:39", "remaining_time": "1 day, 3:46:19", "throughput": 2734.27, "total_tokens": 1375885056} {"current_steps": 7621, "total_steps": 9134, "loss": 0.8335, "learning_rate": 3.30934962575839e-06, "epoch": 0.8342866526177509, "percentage": 83.44, "elapsed_time": "5 days, 19:47:47", "remaining_time": "1 day, 3:45:13", "throughput": 2734.27, "total_tokens": 1376069184} {"current_steps": 7622, "total_steps": 9134, "loss": 0.8384, "learning_rate": 3.3050755245732758e-06, "epoch": 0.8343961246886888, "percentage": 83.45, "elapsed_time": "5 days, 19:48:48", "remaining_time": "1 day, 3:44:06", "throughput": 2734.28, "total_tokens": 1376243232} {"current_steps": 7623, "total_steps": 9134, "loss": 1.0023, "learning_rate": 3.3008039898562603e-06, "epoch": 0.8345055967596267, "percentage": 83.46, "elapsed_time": "5 days, 19:49:49", "remaining_time": "1 day, 3:42:59", "throughput": 2734.27, "total_tokens": 1376403616} {"current_steps": 7624, "total_steps": 9134, "loss": 1.0856, "learning_rate": 3.296535022112643e-06, "epoch": 0.8346150688305646, "percentage": 83.47, "elapsed_time": "5 days, 19:50:56", "remaining_time": "1 day, 3:41:54", "throughput": 2734.29, "total_tokens": 1376597824} {"current_steps": 7625, "total_steps": 9134, "loss": 0.8147, "learning_rate": 3.2922686218474524e-06, "epoch": 0.8347245409015025, "percentage": 83.48, "elapsed_time": "5 days, 19:51:59", "remaining_time": "1 day, 3:40:47", "throughput": 2734.31, "total_tokens": 1376777920} {"current_steps": 7626, "total_steps": 9134, "loss": 0.7421, "learning_rate": 3.288004789565377e-06, "epoch": 0.8348340129724404, "percentage": 83.49, "elapsed_time": "5 days, 19:52:57", "remaining_time": "1 day, 3:39:39", "throughput": 2734.24, "total_tokens": 1376900672} {"current_steps": 7627, "total_steps": 9134, "loss": 0.851, "learning_rate": 3.2837435257708383e-06, "epoch": 0.8349434850433783, "percentage": 83.5, "elapsed_time": "5 days, 19:54:05", "remaining_time": "1 day, 3:38:33", "throughput": 2734.25, "total_tokens": 1377093088} {"current_steps": 7628, "total_steps": 9134, "loss": 0.9608, "learning_rate": 3.2794848309679134e-06, "epoch": 0.8350529571143163, "percentage": 83.51, "elapsed_time": "5 days, 19:55:12", "remaining_time": "1 day, 3:37:28", "throughput": 2734.27, "total_tokens": 1377285280} {"current_steps": 7629, "total_steps": 9134, "loss": 0.7284, "learning_rate": 3.2752287056604187e-06, "epoch": 0.8351624291852541, "percentage": 83.52, "elapsed_time": "5 days, 19:56:18", "remaining_time": "1 day, 3:36:22", "throughput": 2734.28, "total_tokens": 1377472544} {"current_steps": 7630, "total_steps": 9134, "loss": 0.8578, "learning_rate": 3.270975150351835e-06, "epoch": 0.835271901256192, "percentage": 83.53, "elapsed_time": "5 days, 19:57:22", "remaining_time": "1 day, 3:35:15", "throughput": 2734.27, "total_tokens": 1377643008} {"current_steps": 7631, "total_steps": 9134, "loss": 0.9372, "learning_rate": 3.2667241655453485e-06, "epoch": 0.8353813733271299, "percentage": 83.54, "elapsed_time": "5 days, 19:58:26", "remaining_time": "1 day, 3:34:09", "throughput": 2734.28, "total_tokens": 1377822656} {"current_steps": 7632, "total_steps": 9134, "loss": 1.0047, "learning_rate": 3.262475751743857e-06, "epoch": 0.8354908453980678, "percentage": 83.56, "elapsed_time": "5 days, 19:59:30", "remaining_time": "1 day, 3:33:02", "throughput": 2734.27, "total_tokens": 1377994016} {"current_steps": 7633, "total_steps": 9134, "loss": 0.6135, "learning_rate": 3.2582299094499168e-06, "epoch": 0.8356003174690058, "percentage": 83.57, "elapsed_time": "5 days, 20:00:31", "remaining_time": "1 day, 3:31:55", "throughput": 2734.26, "total_tokens": 1378154400} {"current_steps": 7634, "total_steps": 9134, "loss": 0.7317, "learning_rate": 3.253986639165826e-06, "epoch": 0.8357097895399436, "percentage": 83.58, "elapsed_time": "5 days, 20:01:35", "remaining_time": "1 day, 3:30:49", "throughput": 2734.24, "total_tokens": 1378318368} {"current_steps": 7635, "total_steps": 9134, "loss": 0.8143, "learning_rate": 3.2497459413935337e-06, "epoch": 0.8358192616108815, "percentage": 83.59, "elapsed_time": "5 days, 20:02:42", "remaining_time": "1 day, 3:29:43", "throughput": 2734.29, "total_tokens": 1378525568} {"current_steps": 7636, "total_steps": 9134, "loss": 0.7541, "learning_rate": 3.2455078166347242e-06, "epoch": 0.8359287336818194, "percentage": 83.6, "elapsed_time": "5 days, 20:03:49", "remaining_time": "1 day, 3:28:37", "throughput": 2734.33, "total_tokens": 1378729408} {"current_steps": 7637, "total_steps": 9134, "loss": 0.7979, "learning_rate": 3.241272265390752e-06, "epoch": 0.8360382057527573, "percentage": 83.61, "elapsed_time": "5 days, 20:04:52", "remaining_time": "1 day, 3:27:31", "throughput": 2734.32, "total_tokens": 1378898528} {"current_steps": 7638, "total_steps": 9134, "loss": 0.8118, "learning_rate": 3.2370392881626743e-06, "epoch": 0.8361476778236953, "percentage": 83.62, "elapsed_time": "5 days, 20:05:57", "remaining_time": "1 day, 3:26:24", "throughput": 2734.36, "total_tokens": 1379094976} {"current_steps": 7639, "total_steps": 9134, "loss": 0.7194, "learning_rate": 3.232808885451244e-06, "epoch": 0.8362571498946332, "percentage": 83.63, "elapsed_time": "5 days, 20:07:04", "remaining_time": "1 day, 3:25:19", "throughput": 2734.38, "total_tokens": 1379291424} {"current_steps": 7640, "total_steps": 9134, "loss": 0.692, "learning_rate": 3.228581057756913e-06, "epoch": 0.836366621965571, "percentage": 83.64, "elapsed_time": "5 days, 20:08:08", "remaining_time": "1 day, 3:24:12", "throughput": 2734.33, "total_tokens": 1379436800} {"current_steps": 7641, "total_steps": 9134, "loss": 0.9853, "learning_rate": 3.2243558055798234e-06, "epoch": 0.8364760940365089, "percentage": 83.65, "elapsed_time": "5 days, 20:09:13", "remaining_time": "1 day, 3:23:06", "throughput": 2734.34, "total_tokens": 1379622272} {"current_steps": 7642, "total_steps": 9134, "loss": 0.606, "learning_rate": 3.2201331294198057e-06, "epoch": 0.8365855661074468, "percentage": 83.67, "elapsed_time": "5 days, 20:10:13", "remaining_time": "1 day, 3:21:59", "throughput": 2734.31, "total_tokens": 1379767424} {"current_steps": 7643, "total_steps": 9134, "loss": 1.0203, "learning_rate": 3.21591302977641e-06, "epoch": 0.8366950381783848, "percentage": 83.68, "elapsed_time": "5 days, 20:11:20", "remaining_time": "1 day, 3:20:53", "throughput": 2734.3, "total_tokens": 1379947296} {"current_steps": 7644, "total_steps": 9134, "loss": 0.9275, "learning_rate": 3.2116955071488597e-06, "epoch": 0.8368045102493227, "percentage": 83.69, "elapsed_time": "5 days, 20:12:24", "remaining_time": "1 day, 3:19:46", "throughput": 2734.31, "total_tokens": 1380128960} {"current_steps": 7645, "total_steps": 9134, "loss": 1.1151, "learning_rate": 3.2074805620360775e-06, "epoch": 0.8369139823202606, "percentage": 83.7, "elapsed_time": "5 days, 20:13:30", "remaining_time": "1 day, 3:18:40", "throughput": 2734.32, "total_tokens": 1380315776} {"current_steps": 7646, "total_steps": 9134, "loss": 1.0043, "learning_rate": 3.2032681949366845e-06, "epoch": 0.8370234543911984, "percentage": 83.71, "elapsed_time": "5 days, 20:14:38", "remaining_time": "1 day, 3:17:35", "throughput": 2734.37, "total_tokens": 1380523872} {"current_steps": 7647, "total_steps": 9134, "loss": 1.0074, "learning_rate": 3.1990584063489955e-06, "epoch": 0.8371329264621363, "percentage": 83.72, "elapsed_time": "5 days, 20:15:45", "remaining_time": "1 day, 3:16:29", "throughput": 2734.36, "total_tokens": 1380703520} {"current_steps": 7648, "total_steps": 9134, "loss": 0.7592, "learning_rate": 3.194851196771015e-06, "epoch": 0.8372423985330743, "percentage": 83.73, "elapsed_time": "5 days, 20:16:50", "remaining_time": "1 day, 3:15:23", "throughput": 2734.34, "total_tokens": 1380868160} {"current_steps": 7649, "total_steps": 9134, "loss": 0.9049, "learning_rate": 3.190646566700464e-06, "epoch": 0.8373518706040122, "percentage": 83.74, "elapsed_time": "5 days, 20:17:57", "remaining_time": "1 day, 3:14:17", "throughput": 2734.37, "total_tokens": 1381070208} {"current_steps": 7650, "total_steps": 9134, "loss": 1.0248, "learning_rate": 3.1864445166347235e-06, "epoch": 0.8374613426749501, "percentage": 83.75, "elapsed_time": "5 days, 20:19:02", "remaining_time": "1 day, 3:13:11", "throughput": 2734.39, "total_tokens": 1381256576} {"current_steps": 7651, "total_steps": 9134, "loss": 0.9314, "learning_rate": 3.1822450470709003e-06, "epoch": 0.8375708147458879, "percentage": 83.76, "elapsed_time": "5 days, 20:20:06", "remaining_time": "1 day, 3:12:04", "throughput": 2734.4, "total_tokens": 1381438016} {"current_steps": 7652, "total_steps": 9134, "loss": 0.8797, "learning_rate": 3.178048158505778e-06, "epoch": 0.8376802868168258, "percentage": 83.77, "elapsed_time": "5 days, 20:21:13", "remaining_time": "1 day, 3:10:58", "throughput": 2734.41, "total_tokens": 1381624832} {"current_steps": 7653, "total_steps": 9134, "loss": 0.8262, "learning_rate": 3.1738538514358457e-06, "epoch": 0.8377897588877637, "percentage": 83.79, "elapsed_time": "5 days, 20:22:15", "remaining_time": "1 day, 3:09:52", "throughput": 2734.39, "total_tokens": 1381786560} {"current_steps": 7654, "total_steps": 9134, "loss": 0.8704, "learning_rate": 3.1696621263572755e-06, "epoch": 0.8378992309587017, "percentage": 83.8, "elapsed_time": "5 days, 20:23:18", "remaining_time": "1 day, 3:08:45", "throughput": 2734.38, "total_tokens": 1381950528} {"current_steps": 7655, "total_steps": 9134, "loss": 0.7766, "learning_rate": 3.165472983765938e-06, "epoch": 0.8380087030296396, "percentage": 83.81, "elapsed_time": "5 days, 20:24:20", "remaining_time": "1 day, 3:07:38", "throughput": 2734.33, "total_tokens": 1382095232} {"current_steps": 7656, "total_steps": 9134, "loss": 0.6433, "learning_rate": 3.161286424157417e-06, "epoch": 0.8381181751005775, "percentage": 83.82, "elapsed_time": "5 days, 20:25:21", "remaining_time": "1 day, 3:06:31", "throughput": 2734.32, "total_tokens": 1382256960} {"current_steps": 7657, "total_steps": 9134, "loss": 0.8679, "learning_rate": 3.1571024480269524e-06, "epoch": 0.8382276471715153, "percentage": 83.83, "elapsed_time": "5 days, 20:26:29", "remaining_time": "1 day, 3:05:25", "throughput": 2734.32, "total_tokens": 1382443104} {"current_steps": 7658, "total_steps": 9134, "loss": 0.7664, "learning_rate": 3.152921055869523e-06, "epoch": 0.8383371192424532, "percentage": 83.84, "elapsed_time": "5 days, 20:27:33", "remaining_time": "1 day, 3:04:19", "throughput": 2734.35, "total_tokens": 1382631488} {"current_steps": 7659, "total_steps": 9134, "loss": 0.9303, "learning_rate": 3.1487422481797565e-06, "epoch": 0.8384465913133912, "percentage": 83.85, "elapsed_time": "5 days, 20:28:40", "remaining_time": "1 day, 3:03:13", "throughput": 2734.38, "total_tokens": 1382831520} {"current_steps": 7660, "total_steps": 9134, "loss": 0.9343, "learning_rate": 3.1445660254520173e-06, "epoch": 0.8385560633843291, "percentage": 83.86, "elapsed_time": "5 days, 20:29:45", "remaining_time": "1 day, 3:02:07", "throughput": 2734.43, "total_tokens": 1383037824} {"current_steps": 7661, "total_steps": 9134, "loss": 0.7319, "learning_rate": 3.1403923881803354e-06, "epoch": 0.838665535455267, "percentage": 83.87, "elapsed_time": "5 days, 20:30:51", "remaining_time": "1 day, 3:01:01", "throughput": 2734.44, "total_tokens": 1383221728} {"current_steps": 7662, "total_steps": 9134, "loss": 1.0251, "learning_rate": 3.1362213368584442e-06, "epoch": 0.8387750075262049, "percentage": 83.88, "elapsed_time": "5 days, 20:31:54", "remaining_time": "1 day, 2:59:54", "throughput": 2734.45, "total_tokens": 1383397120} {"current_steps": 7663, "total_steps": 9134, "loss": 0.9082, "learning_rate": 3.132052871979774e-06, "epoch": 0.8388844795971427, "percentage": 83.9, "elapsed_time": "5 days, 20:33:02", "remaining_time": "1 day, 2:58:49", "throughput": 2734.47, "total_tokens": 1383594464} {"current_steps": 7664, "total_steps": 9134, "loss": 1.176, "learning_rate": 3.1278869940374378e-06, "epoch": 0.8389939516680807, "percentage": 83.91, "elapsed_time": "5 days, 20:34:07", "remaining_time": "1 day, 2:57:42", "throughput": 2734.46, "total_tokens": 1383768064} {"current_steps": 7665, "total_steps": 9134, "loss": 0.7747, "learning_rate": 3.12372370352427e-06, "epoch": 0.8391034237390186, "percentage": 83.92, "elapsed_time": "5 days, 20:35:13", "remaining_time": "1 day, 2:56:36", "throughput": 2734.46, "total_tokens": 1383945024} {"current_steps": 7666, "total_steps": 9134, "loss": 0.8138, "learning_rate": 3.119563000932757e-06, "epoch": 0.8392128958099565, "percentage": 83.93, "elapsed_time": "5 days, 20:36:19", "remaining_time": "1 day, 2:55:30", "throughput": 2734.45, "total_tokens": 1384124896} {"current_steps": 7667, "total_steps": 9134, "loss": 0.813, "learning_rate": 3.115404886755122e-06, "epoch": 0.8393223678808944, "percentage": 83.94, "elapsed_time": "5 days, 20:37:22", "remaining_time": "1 day, 2:54:24", "throughput": 2734.47, "total_tokens": 1384302976} {"current_steps": 7668, "total_steps": 9134, "loss": 0.818, "learning_rate": 3.1112493614832426e-06, "epoch": 0.8394318399518322, "percentage": 83.95, "elapsed_time": "5 days, 20:38:26", "remaining_time": "1 day, 2:53:17", "throughput": 2734.41, "total_tokens": 1384450592} {"current_steps": 7669, "total_steps": 9134, "loss": 0.9293, "learning_rate": 3.107096425608727e-06, "epoch": 0.8395413120227702, "percentage": 83.96, "elapsed_time": "5 days, 20:39:34", "remaining_time": "1 day, 2:52:12", "throughput": 2734.46, "total_tokens": 1384660928} {"current_steps": 7670, "total_steps": 9134, "loss": 0.7254, "learning_rate": 3.1029460796228483e-06, "epoch": 0.8396507840937081, "percentage": 83.97, "elapsed_time": "5 days, 20:40:35", "remaining_time": "1 day, 2:51:05", "throughput": 2734.45, "total_tokens": 1384825792} {"current_steps": 7671, "total_steps": 9134, "loss": 1.048, "learning_rate": 3.0987983240165914e-06, "epoch": 0.839760256164646, "percentage": 83.98, "elapsed_time": "5 days, 20:41:42", "remaining_time": "1 day, 2:49:59", "throughput": 2734.48, "total_tokens": 1385018880} {"current_steps": 7672, "total_steps": 9134, "loss": 0.721, "learning_rate": 3.0946531592806222e-06, "epoch": 0.8398697282355839, "percentage": 83.99, "elapsed_time": "5 days, 20:42:45", "remaining_time": "1 day, 2:48:52", "throughput": 2734.47, "total_tokens": 1385186208} {"current_steps": 7673, "total_steps": 9134, "loss": 0.8112, "learning_rate": 3.0905105859053068e-06, "epoch": 0.8399792003065218, "percentage": 84.0, "elapsed_time": "5 days, 20:43:50", "remaining_time": "1 day, 2:47:46", "throughput": 2734.48, "total_tokens": 1385369888} {"current_steps": 7674, "total_steps": 9134, "loss": 0.8217, "learning_rate": 3.0863706043807115e-06, "epoch": 0.8400886723774597, "percentage": 84.02, "elapsed_time": "5 days, 20:44:57", "remaining_time": "1 day, 2:46:40", "throughput": 2734.52, "total_tokens": 1385575520} {"current_steps": 7675, "total_steps": 9134, "loss": 0.6689, "learning_rate": 3.0822332151965754e-06, "epoch": 0.8401981444483976, "percentage": 84.03, "elapsed_time": "5 days, 20:46:02", "remaining_time": "1 day, 2:45:34", "throughput": 2734.55, "total_tokens": 1385768384} {"current_steps": 7676, "total_steps": 9134, "loss": 0.8717, "learning_rate": 3.078098418842354e-06, "epoch": 0.8403076165193355, "percentage": 84.04, "elapsed_time": "5 days, 20:47:07", "remaining_time": "1 day, 2:44:28", "throughput": 2734.55, "total_tokens": 1385946464} {"current_steps": 7677, "total_steps": 9134, "loss": 0.7271, "learning_rate": 3.073966215807181e-06, "epoch": 0.8404170885902734, "percentage": 84.05, "elapsed_time": "5 days, 20:48:09", "remaining_time": "1 day, 2:43:21", "throughput": 2734.54, "total_tokens": 1386109760} {"current_steps": 7678, "total_steps": 9134, "loss": 0.758, "learning_rate": 3.06983660657989e-06, "epoch": 0.8405265606612113, "percentage": 84.06, "elapsed_time": "5 days, 20:49:12", "remaining_time": "1 day, 2:42:14", "throughput": 2734.53, "total_tokens": 1386275296} {"current_steps": 7679, "total_steps": 9134, "loss": 0.8687, "learning_rate": 3.0657095916490046e-06, "epoch": 0.8406360327321493, "percentage": 84.07, "elapsed_time": "5 days, 20:50:17", "remaining_time": "1 day, 2:41:08", "throughput": 2734.53, "total_tokens": 1386454496} {"current_steps": 7680, "total_steps": 9134, "loss": 0.821, "learning_rate": 3.0615851715027426e-06, "epoch": 0.8407455048030871, "percentage": 84.08, "elapsed_time": "5 days, 20:51:22", "remaining_time": "1 day, 2:40:02", "throughput": 2734.54, "total_tokens": 1386634592} {"current_steps": 7681, "total_steps": 9134, "loss": 1.0898, "learning_rate": 3.0574633466290166e-06, "epoch": 0.840854976874025, "percentage": 84.09, "elapsed_time": "5 days, 20:52:29", "remaining_time": "1 day, 2:38:56", "throughput": 2734.6, "total_tokens": 1386850752} {"current_steps": 7682, "total_steps": 9134, "loss": 1.0014, "learning_rate": 3.0533441175154305e-06, "epoch": 0.8409644489449629, "percentage": 84.1, "elapsed_time": "5 days, 20:53:34", "remaining_time": "1 day, 2:37:50", "throughput": 2734.57, "total_tokens": 1387013824} {"current_steps": 7683, "total_steps": 9134, "loss": 0.8438, "learning_rate": 3.049227484649275e-06, "epoch": 0.8410739210159008, "percentage": 84.11, "elapsed_time": "5 days, 20:54:38", "remaining_time": "1 day, 2:36:43", "throughput": 2734.59, "total_tokens": 1387199968} {"current_steps": 7684, "total_steps": 9134, "loss": 0.872, "learning_rate": 3.04511344851755e-06, "epoch": 0.8411833930868388, "percentage": 84.13, "elapsed_time": "5 days, 20:55:43", "remaining_time": "1 day, 2:35:37", "throughput": 2734.6, "total_tokens": 1387379392} {"current_steps": 7685, "total_steps": 9134, "loss": 0.6675, "learning_rate": 3.041002009606933e-06, "epoch": 0.8412928651577766, "percentage": 84.14, "elapsed_time": "5 days, 20:56:43", "remaining_time": "1 day, 2:34:30", "throughput": 2734.58, "total_tokens": 1387537088} {"current_steps": 7686, "total_steps": 9134, "loss": 0.7315, "learning_rate": 3.036893168403801e-06, "epoch": 0.8414023372287145, "percentage": 84.15, "elapsed_time": "5 days, 20:57:45", "remaining_time": "1 day, 2:33:23", "throughput": 2734.56, "total_tokens": 1387696352} {"current_steps": 7687, "total_steps": 9134, "loss": 0.7395, "learning_rate": 3.0327869253942183e-06, "epoch": 0.8415118092996524, "percentage": 84.16, "elapsed_time": "5 days, 20:58:44", "remaining_time": "1 day, 2:32:16", "throughput": 2734.5, "total_tokens": 1387824032} {"current_steps": 7688, "total_steps": 9134, "loss": 0.6728, "learning_rate": 3.0286832810639515e-06, "epoch": 0.8416212813705903, "percentage": 84.17, "elapsed_time": "5 days, 20:59:46", "remaining_time": "1 day, 2:31:09", "throughput": 2734.5, "total_tokens": 1387993824} {"current_steps": 7689, "total_steps": 9134, "loss": 1.0413, "learning_rate": 3.024582235898449e-06, "epoch": 0.8417307534415283, "percentage": 84.18, "elapsed_time": "5 days, 21:00:51", "remaining_time": "1 day, 2:30:03", "throughput": 2734.5, "total_tokens": 1388176384} {"current_steps": 7690, "total_steps": 9134, "loss": 0.8173, "learning_rate": 3.0204837903828525e-06, "epoch": 0.8418402255124662, "percentage": 84.19, "elapsed_time": "5 days, 21:01:58", "remaining_time": "1 day, 2:28:57", "throughput": 2734.54, "total_tokens": 1388377984} {"current_steps": 7691, "total_steps": 9134, "loss": 0.908, "learning_rate": 3.0163879450020166e-06, "epoch": 0.841949697583404, "percentage": 84.2, "elapsed_time": "5 days, 21:02:56", "remaining_time": "1 day, 2:27:49", "throughput": 2734.5, "total_tokens": 1388514176} {"current_steps": 7692, "total_steps": 9134, "loss": 0.9092, "learning_rate": 3.0122947002404504e-06, "epoch": 0.8420591696543419, "percentage": 84.21, "elapsed_time": "5 days, 21:04:01", "remaining_time": "1 day, 2:26:43", "throughput": 2734.5, "total_tokens": 1388690464} {"current_steps": 7693, "total_steps": 9134, "loss": 1.1221, "learning_rate": 3.008204056582392e-06, "epoch": 0.8421686417252798, "percentage": 84.22, "elapsed_time": "5 days, 21:05:07", "remaining_time": "1 day, 2:25:37", "throughput": 2734.51, "total_tokens": 1388879968} {"current_steps": 7694, "total_steps": 9134, "loss": 0.7336, "learning_rate": 3.004116014511754e-06, "epoch": 0.8422781137962178, "percentage": 84.23, "elapsed_time": "5 days, 21:06:11", "remaining_time": "1 day, 2:24:31", "throughput": 2734.52, "total_tokens": 1389056256} {"current_steps": 7695, "total_steps": 9134, "loss": 1.0401, "learning_rate": 3.0000305745121443e-06, "epoch": 0.8423875858671557, "percentage": 84.25, "elapsed_time": "5 days, 21:07:17", "remaining_time": "1 day, 2:23:25", "throughput": 2734.51, "total_tokens": 1389235456} {"current_steps": 7696, "total_steps": 9134, "loss": 0.9094, "learning_rate": 2.995947737066859e-06, "epoch": 0.8424970579380936, "percentage": 84.26, "elapsed_time": "5 days, 21:08:25", "remaining_time": "1 day, 2:22:19", "throughput": 2734.57, "total_tokens": 1389449376} {"current_steps": 7697, "total_steps": 9134, "loss": 0.8304, "learning_rate": 2.9918675026588876e-06, "epoch": 0.8426065300090314, "percentage": 84.27, "elapsed_time": "5 days, 21:09:27", "remaining_time": "1 day, 2:21:12", "throughput": 2734.6, "total_tokens": 1389636192} {"current_steps": 7698, "total_steps": 9134, "loss": 0.9536, "learning_rate": 2.987789871770927e-06, "epoch": 0.8427160020799693, "percentage": 84.28, "elapsed_time": "5 days, 21:10:34", "remaining_time": "1 day, 2:20:07", "throughput": 2734.64, "total_tokens": 1389837120} {"current_steps": 7699, "total_steps": 9134, "loss": 0.9262, "learning_rate": 2.9837148448853353e-06, "epoch": 0.8428254741509073, "percentage": 84.29, "elapsed_time": "5 days, 21:11:37", "remaining_time": "1 day, 2:19:00", "throughput": 2734.66, "total_tokens": 1390019904} {"current_steps": 7700, "total_steps": 9134, "loss": 0.9046, "learning_rate": 2.979642422484197e-06, "epoch": 0.8429349462218452, "percentage": 84.3, "elapsed_time": "5 days, 21:12:44", "remaining_time": "1 day, 2:17:54", "throughput": 2734.71, "total_tokens": 1390229568} {"current_steps": 7701, "total_steps": 9134, "loss": 0.6904, "learning_rate": 2.9755726050492566e-06, "epoch": 0.8430444182927831, "percentage": 84.31, "elapsed_time": "5 days, 21:13:52", "remaining_time": "1 day, 2:16:49", "throughput": 2734.74, "total_tokens": 1390430272} {"current_steps": 7702, "total_steps": 9134, "loss": 1.0272, "learning_rate": 2.9715053930619798e-06, "epoch": 0.8431538903637209, "percentage": 84.32, "elapsed_time": "5 days, 21:14:57", "remaining_time": "1 day, 2:15:42", "throughput": 2734.74, "total_tokens": 1390609248} {"current_steps": 7703, "total_steps": 9134, "loss": 1.0622, "learning_rate": 2.9674407870035004e-06, "epoch": 0.8432633624346588, "percentage": 84.33, "elapsed_time": "5 days, 21:16:00", "remaining_time": "1 day, 2:14:36", "throughput": 2734.73, "total_tokens": 1390772992} {"current_steps": 7704, "total_steps": 9134, "loss": 1.0109, "learning_rate": 2.963378787354659e-06, "epoch": 0.8433728345055967, "percentage": 84.34, "elapsed_time": "5 days, 21:17:07", "remaining_time": "1 day, 2:13:30", "throughput": 2734.76, "total_tokens": 1390972352} {"current_steps": 7705, "total_steps": 9134, "loss": 0.8237, "learning_rate": 2.95931939459598e-06, "epoch": 0.8434823065765347, "percentage": 84.36, "elapsed_time": "5 days, 21:18:13", "remaining_time": "1 day, 2:12:24", "throughput": 2734.8, "total_tokens": 1391175968} {"current_steps": 7706, "total_steps": 9134, "loss": 0.8984, "learning_rate": 2.9552626092076765e-06, "epoch": 0.8435917786474726, "percentage": 84.37, "elapsed_time": "5 days, 21:19:21", "remaining_time": "1 day, 2:11:18", "throughput": 2734.83, "total_tokens": 1391375552} {"current_steps": 7707, "total_steps": 9134, "loss": 0.7692, "learning_rate": 2.951208431669675e-06, "epoch": 0.8437012507184105, "percentage": 84.38, "elapsed_time": "5 days, 21:20:27", "remaining_time": "1 day, 2:10:12", "throughput": 2734.85, "total_tokens": 1391563488} {"current_steps": 7708, "total_steps": 9134, "loss": 0.9528, "learning_rate": 2.9471568624615533e-06, "epoch": 0.8438107227893483, "percentage": 84.39, "elapsed_time": "5 days, 21:21:34", "remaining_time": "1 day, 2:09:06", "throughput": 2734.87, "total_tokens": 1391759936} {"current_steps": 7709, "total_steps": 9134, "loss": 1.0567, "learning_rate": 2.9431079020626253e-06, "epoch": 0.8439201948602862, "percentage": 84.4, "elapsed_time": "5 days, 21:22:39", "remaining_time": "1 day, 2:08:00", "throughput": 2734.88, "total_tokens": 1391940032} {"current_steps": 7710, "total_steps": 9134, "loss": 0.8089, "learning_rate": 2.939061550951863e-06, "epoch": 0.8440296669312242, "percentage": 84.41, "elapsed_time": "5 days, 21:23:46", "remaining_time": "1 day, 2:06:54", "throughput": 2734.87, "total_tokens": 1392120128} {"current_steps": 7711, "total_steps": 9134, "loss": 0.9647, "learning_rate": 2.9350178096079486e-06, "epoch": 0.8441391390021621, "percentage": 84.42, "elapsed_time": "5 days, 21:24:51", "remaining_time": "1 day, 2:05:48", "throughput": 2734.89, "total_tokens": 1392308960} {"current_steps": 7712, "total_steps": 9134, "loss": 0.8485, "learning_rate": 2.930976678509245e-06, "epoch": 0.8442486110731, "percentage": 84.43, "elapsed_time": "5 days, 21:25:56", "remaining_time": "1 day, 2:04:42", "throughput": 2734.92, "total_tokens": 1392500480} {"current_steps": 7713, "total_steps": 9134, "loss": 0.8408, "learning_rate": 2.926938158133813e-06, "epoch": 0.8443580831440379, "percentage": 84.44, "elapsed_time": "5 days, 21:27:04", "remaining_time": "1 day, 2:03:36", "throughput": 2734.97, "total_tokens": 1392715072} {"current_steps": 7714, "total_steps": 9134, "loss": 0.7933, "learning_rate": 2.9229022489594e-06, "epoch": 0.8444675552149757, "percentage": 84.45, "elapsed_time": "5 days, 21:28:08", "remaining_time": "1 day, 2:02:30", "throughput": 2734.99, "total_tokens": 1392900768} {"current_steps": 7715, "total_steps": 9134, "loss": 0.601, "learning_rate": 2.9188689514634408e-06, "epoch": 0.8445770272859137, "percentage": 84.46, "elapsed_time": "5 days, 21:29:08", "remaining_time": "1 day, 2:01:23", "throughput": 2734.95, "total_tokens": 1393043232} {"current_steps": 7716, "total_steps": 9134, "loss": 0.83, "learning_rate": 2.9148382661230766e-06, "epoch": 0.8446864993568516, "percentage": 84.48, "elapsed_time": "5 days, 21:30:12", "remaining_time": "1 day, 2:00:16", "throughput": 2734.97, "total_tokens": 1393228480} {"current_steps": 7717, "total_steps": 9134, "loss": 0.7581, "learning_rate": 2.9108101934151285e-06, "epoch": 0.8447959714277895, "percentage": 84.49, "elapsed_time": "5 days, 21:31:19", "remaining_time": "1 day, 1:59:10", "throughput": 2734.93, "total_tokens": 1393394016} {"current_steps": 7718, "total_steps": 9134, "loss": 0.7452, "learning_rate": 2.9067847338161063e-06, "epoch": 0.8449054434987274, "percentage": 84.5, "elapsed_time": "5 days, 21:32:23", "remaining_time": "1 day, 1:58:04", "throughput": 2734.92, "total_tokens": 1393559328} {"current_steps": 7719, "total_steps": 9134, "loss": 0.8109, "learning_rate": 2.9027618878022134e-06, "epoch": 0.8450149155696652, "percentage": 84.51, "elapsed_time": "5 days, 21:33:24", "remaining_time": "1 day, 1:56:57", "throughput": 2734.92, "total_tokens": 1393730240} {"current_steps": 7720, "total_steps": 9134, "loss": 0.7156, "learning_rate": 2.898741655849349e-06, "epoch": 0.8451243876406032, "percentage": 84.52, "elapsed_time": "5 days, 21:34:24", "remaining_time": "1 day, 1:55:50", "throughput": 2734.89, "total_tokens": 1393877408} {"current_steps": 7721, "total_steps": 9134, "loss": 0.8589, "learning_rate": 2.8947240384330945e-06, "epoch": 0.8452338597115411, "percentage": 84.53, "elapsed_time": "5 days, 21:35:29", "remaining_time": "1 day, 1:54:44", "throughput": 2734.9, "total_tokens": 1394059520} {"current_steps": 7722, "total_steps": 9134, "loss": 0.9219, "learning_rate": 2.89070903602873e-06, "epoch": 0.845343331782479, "percentage": 84.54, "elapsed_time": "5 days, 21:36:33", "remaining_time": "1 day, 1:53:37", "throughput": 2734.94, "total_tokens": 1394254176} {"current_steps": 7723, "total_steps": 9134, "loss": 1.1178, "learning_rate": 2.8866966491112144e-06, "epoch": 0.8454528038534169, "percentage": 84.55, "elapsed_time": "5 days, 21:37:41", "remaining_time": "1 day, 1:52:32", "throughput": 2735.0, "total_tokens": 1394473248} {"current_steps": 7724, "total_steps": 9134, "loss": 0.8521, "learning_rate": 2.8826868781552217e-06, "epoch": 0.8455622759243548, "percentage": 84.56, "elapsed_time": "5 days, 21:38:45", "remaining_time": "1 day, 1:51:25", "throughput": 2735.03, "total_tokens": 1394664768} {"current_steps": 7725, "total_steps": 9134, "loss": 0.8521, "learning_rate": 2.8786797236350806e-06, "epoch": 0.8456717479952927, "percentage": 84.57, "elapsed_time": "5 days, 21:39:51", "remaining_time": "1 day, 1:50:19", "throughput": 2735.06, "total_tokens": 1394859424} {"current_steps": 7726, "total_steps": 9134, "loss": 0.6363, "learning_rate": 2.8746751860248415e-06, "epoch": 0.8457812200662306, "percentage": 84.59, "elapsed_time": "5 days, 21:40:57", "remaining_time": "1 day, 1:49:13", "throughput": 2735.08, "total_tokens": 1395046464} {"current_steps": 7727, "total_steps": 9134, "loss": 0.9084, "learning_rate": 2.8706732657982347e-06, "epoch": 0.8458906921371685, "percentage": 84.6, "elapsed_time": "5 days, 21:41:57", "remaining_time": "1 day, 1:48:06", "throughput": 2735.05, "total_tokens": 1395197440} {"current_steps": 7728, "total_steps": 9134, "loss": 0.8158, "learning_rate": 2.866673963428676e-06, "epoch": 0.8460001642081064, "percentage": 84.61, "elapsed_time": "5 days, 21:43:00", "remaining_time": "1 day, 1:47:00", "throughput": 2735.04, "total_tokens": 1395364096} {"current_steps": 7729, "total_steps": 9134, "loss": 1.0561, "learning_rate": 2.862677279389275e-06, "epoch": 0.8461096362790443, "percentage": 84.62, "elapsed_time": "5 days, 21:44:05", "remaining_time": "1 day, 1:45:53", "throughput": 2735.1, "total_tokens": 1395572192} {"current_steps": 7730, "total_steps": 9134, "loss": 0.8771, "learning_rate": 2.85868321415283e-06, "epoch": 0.8462191083499823, "percentage": 84.63, "elapsed_time": "5 days, 21:45:08", "remaining_time": "1 day, 1:44:47", "throughput": 2735.09, "total_tokens": 1395741088} {"current_steps": 7731, "total_steps": 9134, "loss": 0.8788, "learning_rate": 2.8546917681918417e-06, "epoch": 0.8463285804209201, "percentage": 84.64, "elapsed_time": "5 days, 21:46:15", "remaining_time": "1 day, 1:43:41", "throughput": 2735.11, "total_tokens": 1395931488} {"current_steps": 7732, "total_steps": 9134, "loss": 0.7878, "learning_rate": 2.8507029419784696e-06, "epoch": 0.846438052491858, "percentage": 84.65, "elapsed_time": "5 days, 21:47:23", "remaining_time": "1 day, 1:42:35", "throughput": 2735.14, "total_tokens": 1396131968} {"current_steps": 7733, "total_steps": 9134, "loss": 1.047, "learning_rate": 2.8467167359846115e-06, "epoch": 0.8465475245627959, "percentage": 84.66, "elapsed_time": "5 days, 21:48:27", "remaining_time": "1 day, 1:41:29", "throughput": 2735.14, "total_tokens": 1396309600} {"current_steps": 7734, "total_steps": 9134, "loss": 1.0107, "learning_rate": 2.842733150681803e-06, "epoch": 0.8466569966337338, "percentage": 84.67, "elapsed_time": "5 days, 21:49:35", "remaining_time": "1 day, 1:40:23", "throughput": 2735.2, "total_tokens": 1396525312} {"current_steps": 7735, "total_steps": 9134, "loss": 0.7566, "learning_rate": 2.83875218654131e-06, "epoch": 0.8467664687046718, "percentage": 84.68, "elapsed_time": "5 days, 21:50:34", "remaining_time": "1 day, 1:39:16", "throughput": 2735.18, "total_tokens": 1396678752} {"current_steps": 7736, "total_steps": 9134, "loss": 0.9354, "learning_rate": 2.8347738440340663e-06, "epoch": 0.8468759407756096, "percentage": 84.69, "elapsed_time": "5 days, 21:51:42", "remaining_time": "1 day, 1:38:10", "throughput": 2735.18, "total_tokens": 1396863328} {"current_steps": 7737, "total_steps": 9134, "loss": 0.8837, "learning_rate": 2.830798123630707e-06, "epoch": 0.8469854128465475, "percentage": 84.71, "elapsed_time": "5 days, 21:52:46", "remaining_time": "1 day, 1:37:04", "throughput": 2735.2, "total_tokens": 1397048576} {"current_steps": 7738, "total_steps": 9134, "loss": 0.9969, "learning_rate": 2.8268250258015467e-06, "epoch": 0.8470948849174854, "percentage": 84.72, "elapsed_time": "5 days, 21:53:48", "remaining_time": "1 day, 1:35:57", "throughput": 2735.18, "total_tokens": 1397210304} {"current_steps": 7739, "total_steps": 9134, "loss": 0.7809, "learning_rate": 2.822854551016593e-06, "epoch": 0.8472043569884233, "percentage": 84.73, "elapsed_time": "5 days, 21:54:53", "remaining_time": "1 day, 1:34:51", "throughput": 2735.22, "total_tokens": 1397405408} {"current_steps": 7740, "total_steps": 9134, "loss": 0.6858, "learning_rate": 2.8188866997455626e-06, "epoch": 0.8473138290593613, "percentage": 84.74, "elapsed_time": "5 days, 21:55:58", "remaining_time": "1 day, 1:33:45", "throughput": 2735.21, "total_tokens": 1397577440} {"current_steps": 7741, "total_steps": 9134, "loss": 0.7818, "learning_rate": 2.814921472457821e-06, "epoch": 0.8474233011302992, "percentage": 84.75, "elapsed_time": "5 days, 21:57:06", "remaining_time": "1 day, 1:32:39", "throughput": 2735.27, "total_tokens": 1397793824} {"current_steps": 7742, "total_steps": 9134, "loss": 0.9396, "learning_rate": 2.810958869622471e-06, "epoch": 0.847532773201237, "percentage": 84.76, "elapsed_time": "5 days, 21:58:11", "remaining_time": "1 day, 1:31:33", "throughput": 2735.25, "total_tokens": 1397962496} {"current_steps": 7743, "total_steps": 9134, "loss": 0.8358, "learning_rate": 2.8069988917082566e-06, "epoch": 0.8476422452721749, "percentage": 84.77, "elapsed_time": "5 days, 21:59:14", "remaining_time": "1 day, 1:30:26", "throughput": 2735.23, "total_tokens": 1398127136} {"current_steps": 7744, "total_steps": 9134, "loss": 0.7324, "learning_rate": 2.8030415391836513e-06, "epoch": 0.8477517173431128, "percentage": 84.78, "elapsed_time": "5 days, 22:00:21", "remaining_time": "1 day, 1:29:21", "throughput": 2735.25, "total_tokens": 1398318656} {"current_steps": 7745, "total_steps": 9134, "loss": 0.8542, "learning_rate": 2.799086812516799e-06, "epoch": 0.8478611894140508, "percentage": 84.79, "elapsed_time": "5 days, 22:01:26", "remaining_time": "1 day, 1:28:14", "throughput": 2735.29, "total_tokens": 1398517344} {"current_steps": 7746, "total_steps": 9134, "loss": 0.8449, "learning_rate": 2.7951347121755373e-06, "epoch": 0.8479706614849887, "percentage": 84.8, "elapsed_time": "5 days, 22:02:23", "remaining_time": "1 day, 1:27:07", "throughput": 2735.23, "total_tokens": 1398642112} {"current_steps": 7747, "total_steps": 9134, "loss": 0.9099, "learning_rate": 2.791185238627389e-06, "epoch": 0.8480801335559266, "percentage": 84.81, "elapsed_time": "5 days, 22:03:31", "remaining_time": "1 day, 1:26:01", "throughput": 2735.25, "total_tokens": 1398841696} {"current_steps": 7748, "total_steps": 9134, "loss": 0.8627, "learning_rate": 2.7872383923395667e-06, "epoch": 0.8481896056268644, "percentage": 84.83, "elapsed_time": "5 days, 22:04:34", "remaining_time": "1 day, 1:24:55", "throughput": 2735.23, "total_tokens": 1399002080} {"current_steps": 7749, "total_steps": 9134, "loss": 0.8029, "learning_rate": 2.7832941737789912e-06, "epoch": 0.8482990776978023, "percentage": 84.84, "elapsed_time": "5 days, 22:05:40", "remaining_time": "1 day, 1:23:48", "throughput": 2735.21, "total_tokens": 1399171648} {"current_steps": 7750, "total_steps": 9134, "loss": 0.7536, "learning_rate": 2.7793525834122315e-06, "epoch": 0.8484085497687402, "percentage": 84.85, "elapsed_time": "5 days, 22:06:46", "remaining_time": "1 day, 1:22:42", "throughput": 2735.24, "total_tokens": 1399367648} {"current_steps": 7751, "total_steps": 9134, "loss": 1.0358, "learning_rate": 2.775413621705586e-06, "epoch": 0.8485180218396782, "percentage": 84.86, "elapsed_time": "5 days, 22:07:48", "remaining_time": "1 day, 1:21:36", "throughput": 2735.21, "total_tokens": 1399522208} {"current_steps": 7752, "total_steps": 9134, "loss": 0.9609, "learning_rate": 2.771477289125024e-06, "epoch": 0.8486274939106161, "percentage": 84.87, "elapsed_time": "5 days, 22:08:56", "remaining_time": "1 day, 1:20:30", "throughput": 2735.26, "total_tokens": 1399731648} {"current_steps": 7753, "total_steps": 9134, "loss": 0.7147, "learning_rate": 2.7675435861362064e-06, "epoch": 0.8487369659815539, "percentage": 84.88, "elapsed_time": "5 days, 22:10:03", "remaining_time": "1 day, 1:19:24", "throughput": 2735.29, "total_tokens": 1399932352} {"current_steps": 7754, "total_steps": 9134, "loss": 0.9408, "learning_rate": 2.7636125132044806e-06, "epoch": 0.8488464380524918, "percentage": 84.89, "elapsed_time": "5 days, 22:11:11", "remaining_time": "1 day, 1:18:19", "throughput": 2735.33, "total_tokens": 1400138432} {"current_steps": 7755, "total_steps": 9134, "loss": 1.0131, "learning_rate": 2.759684070794885e-06, "epoch": 0.8489559101234297, "percentage": 84.9, "elapsed_time": "5 days, 22:12:17", "remaining_time": "1 day, 1:17:13", "throughput": 2735.32, "total_tokens": 1400311360} {"current_steps": 7756, "total_steps": 9134, "loss": 0.9525, "learning_rate": 2.755758259372149e-06, "epoch": 0.8490653821943677, "percentage": 84.91, "elapsed_time": "5 days, 22:13:23", "remaining_time": "1 day, 1:16:07", "throughput": 2735.31, "total_tokens": 1400486304} {"current_steps": 7757, "total_steps": 9134, "loss": 0.7636, "learning_rate": 2.7518350794006804e-06, "epoch": 0.8491748542653056, "percentage": 84.92, "elapsed_time": "5 days, 22:14:30", "remaining_time": "1 day, 1:15:01", "throughput": 2735.35, "total_tokens": 1400690816} {"current_steps": 7758, "total_steps": 9134, "loss": 0.9384, "learning_rate": 2.7479145313445974e-06, "epoch": 0.8492843263362435, "percentage": 84.94, "elapsed_time": "5 days, 22:15:38", "remaining_time": "1 day, 1:13:55", "throughput": 2735.37, "total_tokens": 1400886592} {"current_steps": 7759, "total_steps": 9134, "loss": 0.712, "learning_rate": 2.743996615667685e-06, "epoch": 0.8493937984071813, "percentage": 84.95, "elapsed_time": "5 days, 22:16:41", "remaining_time": "1 day, 1:12:49", "throughput": 2735.39, "total_tokens": 1401071168} {"current_steps": 7760, "total_steps": 9134, "loss": 0.8476, "learning_rate": 2.7400813328334273e-06, "epoch": 0.8495032704781192, "percentage": 84.96, "elapsed_time": "5 days, 22:17:49", "remaining_time": "1 day, 1:11:43", "throughput": 2735.4, "total_tokens": 1401262912} {"current_steps": 7761, "total_steps": 9134, "loss": 0.9655, "learning_rate": 2.736168683304996e-06, "epoch": 0.8496127425490572, "percentage": 84.97, "elapsed_time": "5 days, 22:18:55", "remaining_time": "1 day, 1:10:37", "throughput": 2735.41, "total_tokens": 1401448832} {"current_steps": 7762, "total_steps": 9134, "loss": 0.7751, "learning_rate": 2.7322586675452454e-06, "epoch": 0.8497222146199951, "percentage": 84.98, "elapsed_time": "5 days, 22:20:01", "remaining_time": "1 day, 1:09:31", "throughput": 2735.43, "total_tokens": 1401637216} {"current_steps": 7763, "total_steps": 9134, "loss": 0.8916, "learning_rate": 2.728351286016725e-06, "epoch": 0.849831686690933, "percentage": 84.99, "elapsed_time": "5 days, 22:21:03", "remaining_time": "1 day, 1:08:24", "throughput": 2735.39, "total_tokens": 1401788416} {"current_steps": 7764, "total_steps": 9134, "loss": 0.7469, "learning_rate": 2.7244465391816742e-06, "epoch": 0.8499411587618709, "percentage": 85.0, "elapsed_time": "5 days, 22:22:07", "remaining_time": "1 day, 1:07:18", "throughput": 2735.36, "total_tokens": 1401946560} {"current_steps": 7765, "total_steps": 9134, "loss": 0.6088, "learning_rate": 2.720544427502009e-06, "epoch": 0.8500506308328087, "percentage": 85.01, "elapsed_time": "5 days, 22:23:15", "remaining_time": "1 day, 1:06:12", "throughput": 2735.35, "total_tokens": 1402127328} {"current_steps": 7766, "total_steps": 9134, "loss": 0.7795, "learning_rate": 2.7166449514393565e-06, "epoch": 0.8501601029037467, "percentage": 85.02, "elapsed_time": "5 days, 22:24:18", "remaining_time": "1 day, 1:05:06", "throughput": 2735.37, "total_tokens": 1402313472} {"current_steps": 7767, "total_steps": 9134, "loss": 0.7013, "learning_rate": 2.7127481114549965e-06, "epoch": 0.8502695749746846, "percentage": 85.03, "elapsed_time": "5 days, 22:25:22", "remaining_time": "1 day, 1:03:59", "throughput": 2735.37, "total_tokens": 1402485952} {"current_steps": 7768, "total_steps": 9134, "loss": 0.9505, "learning_rate": 2.708853908009934e-06, "epoch": 0.8503790470456225, "percentage": 85.04, "elapsed_time": "5 days, 22:26:29", "remaining_time": "1 day, 1:02:53", "throughput": 2735.41, "total_tokens": 1402691136} {"current_steps": 7769, "total_steps": 9134, "loss": 1.0753, "learning_rate": 2.7049623415648427e-06, "epoch": 0.8504885191165604, "percentage": 85.06, "elapsed_time": "5 days, 22:27:35", "remaining_time": "1 day, 1:01:47", "throughput": 2735.42, "total_tokens": 1402875936} {"current_steps": 7770, "total_steps": 9134, "loss": 0.9341, "learning_rate": 2.7010734125800824e-06, "epoch": 0.8505979911874982, "percentage": 85.07, "elapsed_time": "5 days, 22:28:39", "remaining_time": "1 day, 1:00:41", "throughput": 2735.44, "total_tokens": 1403061632} {"current_steps": 7771, "total_steps": 9134, "loss": 0.9258, "learning_rate": 2.6971871215157126e-06, "epoch": 0.8507074632584362, "percentage": 85.08, "elapsed_time": "5 days, 22:29:44", "remaining_time": "1 day, 0:59:35", "throughput": 2735.46, "total_tokens": 1403248224} {"current_steps": 7772, "total_steps": 9134, "loss": 0.9328, "learning_rate": 2.6933034688314624e-06, "epoch": 0.8508169353293741, "percentage": 85.09, "elapsed_time": "5 days, 22:30:49", "remaining_time": "1 day, 0:58:29", "throughput": 2735.46, "total_tokens": 1403426080} {"current_steps": 7773, "total_steps": 9134, "loss": 0.689, "learning_rate": 2.6894224549867815e-06, "epoch": 0.850926407400312, "percentage": 85.1, "elapsed_time": "5 days, 22:31:52", "remaining_time": "1 day, 0:57:22", "throughput": 2735.45, "total_tokens": 1403594528} {"current_steps": 7774, "total_steps": 9134, "loss": 0.8507, "learning_rate": 2.6855440804407635e-06, "epoch": 0.8510358794712499, "percentage": 85.11, "elapsed_time": "5 days, 22:32:58", "remaining_time": "1 day, 0:56:16", "throughput": 2735.49, "total_tokens": 1403793664} {"current_steps": 7775, "total_steps": 9134, "loss": 0.8813, "learning_rate": 2.68166834565223e-06, "epoch": 0.8511453515421878, "percentage": 85.12, "elapsed_time": "5 days, 22:34:03", "remaining_time": "1 day, 0:55:10", "throughput": 2735.52, "total_tokens": 1403989440} {"current_steps": 7776, "total_steps": 9134, "loss": 0.9282, "learning_rate": 2.6777952510796565e-06, "epoch": 0.8512548236131257, "percentage": 85.13, "elapsed_time": "5 days, 22:35:10", "remaining_time": "1 day, 0:54:04", "throughput": 2735.55, "total_tokens": 1404186336} {"current_steps": 7777, "total_steps": 9134, "loss": 1.127, "learning_rate": 2.6739247971812375e-06, "epoch": 0.8513642956840636, "percentage": 85.14, "elapsed_time": "5 days, 22:36:17", "remaining_time": "1 day, 0:52:58", "throughput": 2735.55, "total_tokens": 1404369792} {"current_steps": 7778, "total_steps": 9134, "loss": 1.0784, "learning_rate": 2.6700569844148372e-06, "epoch": 0.8514737677550015, "percentage": 85.15, "elapsed_time": "5 days, 22:37:23", "remaining_time": "1 day, 0:51:52", "throughput": 2735.6, "total_tokens": 1404575648} {"current_steps": 7779, "total_steps": 9134, "loss": 0.8727, "learning_rate": 2.666191813238006e-06, "epoch": 0.8515832398259394, "percentage": 85.17, "elapsed_time": "5 days, 22:38:26", "remaining_time": "1 day, 0:50:46", "throughput": 2735.57, "total_tokens": 1404734912} {"current_steps": 7780, "total_steps": 9134, "loss": 0.9576, "learning_rate": 2.662329284107987e-06, "epoch": 0.8516927118968773, "percentage": 85.18, "elapsed_time": "5 days, 22:39:30", "remaining_time": "1 day, 0:49:39", "throughput": 2735.53, "total_tokens": 1404890592} {"current_steps": 7781, "total_steps": 9134, "loss": 0.7759, "learning_rate": 2.6584693974817084e-06, "epoch": 0.8518021839678153, "percentage": 85.19, "elapsed_time": "5 days, 22:40:30", "remaining_time": "1 day, 0:48:32", "throughput": 2735.51, "total_tokens": 1405040896} {"current_steps": 7782, "total_steps": 9134, "loss": 1.1778, "learning_rate": 2.6546121538157998e-06, "epoch": 0.8519116560387531, "percentage": 85.2, "elapsed_time": "5 days, 22:41:36", "remaining_time": "1 day, 0:47:26", "throughput": 2735.54, "total_tokens": 1405236448} {"current_steps": 7783, "total_steps": 9134, "loss": 0.7133, "learning_rate": 2.650757553566546e-06, "epoch": 0.852021128109691, "percentage": 85.21, "elapsed_time": "5 days, 22:42:41", "remaining_time": "1 day, 0:46:20", "throughput": 2735.56, "total_tokens": 1405427296} {"current_steps": 7784, "total_steps": 9134, "loss": 0.744, "learning_rate": 2.6469055971899525e-06, "epoch": 0.8521306001806289, "percentage": 85.22, "elapsed_time": "5 days, 22:43:45", "remaining_time": "1 day, 0:45:14", "throughput": 2735.58, "total_tokens": 1405610976} {"current_steps": 7785, "total_steps": 9134, "loss": 1.1366, "learning_rate": 2.6430562851416983e-06, "epoch": 0.8522400722515668, "percentage": 85.23, "elapsed_time": "5 days, 22:44:46", "remaining_time": "1 day, 0:44:07", "throughput": 2735.57, "total_tokens": 1405772704} {"current_steps": 7786, "total_steps": 9134, "loss": 0.9202, "learning_rate": 2.6392096178771447e-06, "epoch": 0.8523495443225048, "percentage": 85.24, "elapsed_time": "5 days, 22:45:51", "remaining_time": "1 day, 0:43:01", "throughput": 2735.61, "total_tokens": 1405972064} {"current_steps": 7787, "total_steps": 9134, "loss": 0.8187, "learning_rate": 2.635365595851344e-06, "epoch": 0.8524590163934426, "percentage": 85.25, "elapsed_time": "5 days, 22:46:59", "remaining_time": "1 day, 0:41:55", "throughput": 2735.64, "total_tokens": 1406174336} {"current_steps": 7788, "total_steps": 9134, "loss": 0.8218, "learning_rate": 2.6315242195190436e-06, "epoch": 0.8525684884643805, "percentage": 85.26, "elapsed_time": "5 days, 22:48:02", "remaining_time": "1 day, 0:40:48", "throughput": 2735.6, "total_tokens": 1406321504} {"current_steps": 7789, "total_steps": 9134, "loss": 0.8718, "learning_rate": 2.6276854893346636e-06, "epoch": 0.8526779605353184, "percentage": 85.27, "elapsed_time": "5 days, 22:49:04", "remaining_time": "1 day, 0:39:42", "throughput": 2735.58, "total_tokens": 1406480992} {"current_steps": 7790, "total_steps": 9134, "loss": 0.8997, "learning_rate": 2.6238494057523183e-06, "epoch": 0.8527874326062563, "percentage": 85.29, "elapsed_time": "5 days, 22:50:05", "remaining_time": "1 day, 0:38:35", "throughput": 2735.53, "total_tokens": 1406623904} {"current_steps": 7791, "total_steps": 9134, "loss": 1.0995, "learning_rate": 2.6200159692258195e-06, "epoch": 0.8528969046771943, "percentage": 85.3, "elapsed_time": "5 days, 22:51:13", "remaining_time": "1 day, 0:37:29", "throughput": 2735.59, "total_tokens": 1406842528} {"current_steps": 7792, "total_steps": 9134, "loss": 1.093, "learning_rate": 2.616185180208644e-06, "epoch": 0.8530063767481322, "percentage": 85.31, "elapsed_time": "5 days, 22:52:19", "remaining_time": "1 day, 0:36:23", "throughput": 2735.61, "total_tokens": 1407031360} {"current_steps": 7793, "total_steps": 9134, "loss": 0.9311, "learning_rate": 2.612357039153973e-06, "epoch": 0.85311584881907, "percentage": 85.32, "elapsed_time": "5 days, 22:53:24", "remaining_time": "1 day, 0:35:17", "throughput": 2735.62, "total_tokens": 1407216832} {"current_steps": 7794, "total_steps": 9134, "loss": 0.8651, "learning_rate": 2.608531546514667e-06, "epoch": 0.8532253208900079, "percentage": 85.33, "elapsed_time": "5 days, 22:54:31", "remaining_time": "1 day, 0:34:11", "throughput": 2735.67, "total_tokens": 1407421792} {"current_steps": 7795, "total_steps": 9134, "loss": 0.9297, "learning_rate": 2.6047087027432746e-06, "epoch": 0.8533347929609458, "percentage": 85.34, "elapsed_time": "5 days, 22:55:37", "remaining_time": "1 day, 0:33:05", "throughput": 2735.72, "total_tokens": 1407629888} {"current_steps": 7796, "total_steps": 9134, "loss": 1.033, "learning_rate": 2.600888508292029e-06, "epoch": 0.8534442650318838, "percentage": 85.35, "elapsed_time": "5 days, 22:56:45", "remaining_time": "1 day, 0:31:59", "throughput": 2735.74, "total_tokens": 1407827904} {"current_steps": 7797, "total_steps": 9134, "loss": 0.7996, "learning_rate": 2.597070963612852e-06, "epoch": 0.8535537371028217, "percentage": 85.36, "elapsed_time": "5 days, 22:57:48", "remaining_time": "1 day, 0:30:53", "throughput": 2735.74, "total_tokens": 1408001728} {"current_steps": 7798, "total_steps": 9134, "loss": 1.094, "learning_rate": 2.5932560691573487e-06, "epoch": 0.8536632091737596, "percentage": 85.37, "elapsed_time": "5 days, 22:58:55", "remaining_time": "1 day, 0:29:47", "throughput": 2735.77, "total_tokens": 1408196832} {"current_steps": 7799, "total_steps": 9134, "loss": 0.6372, "learning_rate": 2.5894438253768223e-06, "epoch": 0.8537726812446974, "percentage": 85.38, "elapsed_time": "5 days, 23:00:00", "remaining_time": "1 day, 0:28:41", "throughput": 2735.75, "total_tokens": 1408365952} {"current_steps": 7800, "total_steps": 9134, "loss": 0.8728, "learning_rate": 2.5856342327222505e-06, "epoch": 0.8538821533156353, "percentage": 85.4, "elapsed_time": "5 days, 23:01:05", "remaining_time": "1 day, 0:27:35", "throughput": 2735.74, "total_tokens": 1408534400} {"current_steps": 7801, "total_steps": 9134, "loss": 0.6661, "learning_rate": 2.581827291644301e-06, "epoch": 0.8539916253865732, "percentage": 85.41, "elapsed_time": "5 days, 23:02:09", "remaining_time": "1 day, 0:26:28", "throughput": 2735.73, "total_tokens": 1408706432} {"current_steps": 7802, "total_steps": 9134, "loss": 0.8886, "learning_rate": 2.5780230025933245e-06, "epoch": 0.8541010974575112, "percentage": 85.42, "elapsed_time": "5 days, 23:03:14", "remaining_time": "1 day, 0:25:22", "throughput": 2735.71, "total_tokens": 1408875552} {"current_steps": 7803, "total_steps": 9134, "loss": 0.8864, "learning_rate": 2.5742213660193637e-06, "epoch": 0.8542105695284491, "percentage": 85.43, "elapsed_time": "5 days, 23:04:19", "remaining_time": "1 day, 0:24:16", "throughput": 2735.73, "total_tokens": 1409063488} {"current_steps": 7804, "total_steps": 9134, "loss": 0.9737, "learning_rate": 2.5704223823721453e-06, "epoch": 0.8543200415993869, "percentage": 85.44, "elapsed_time": "5 days, 23:05:23", "remaining_time": "1 day, 0:23:10", "throughput": 2735.76, "total_tokens": 1409255232} {"current_steps": 7805, "total_steps": 9134, "loss": 0.899, "learning_rate": 2.5666260521010758e-06, "epoch": 0.8544295136703248, "percentage": 85.45, "elapsed_time": "5 days, 23:06:24", "remaining_time": "1 day, 0:22:03", "throughput": 2735.72, "total_tokens": 1409398816} {"current_steps": 7806, "total_steps": 9134, "loss": 1.0309, "learning_rate": 2.562832375655269e-06, "epoch": 0.8545389857412627, "percentage": 85.46, "elapsed_time": "5 days, 23:07:28", "remaining_time": "1 day, 0:20:57", "throughput": 2735.7, "total_tokens": 1409565472} {"current_steps": 7807, "total_steps": 9134, "loss": 0.7464, "learning_rate": 2.5590413534834906e-06, "epoch": 0.8546484578122007, "percentage": 85.47, "elapsed_time": "5 days, 23:08:34", "remaining_time": "1 day, 0:19:50", "throughput": 2735.71, "total_tokens": 1409750720} {"current_steps": 7808, "total_steps": 9134, "loss": 0.8388, "learning_rate": 2.555252986034229e-06, "epoch": 0.8547579298831386, "percentage": 85.48, "elapsed_time": "5 days, 23:09:42", "remaining_time": "1 day, 0:18:45", "throughput": 2735.71, "total_tokens": 1409935520} {"current_steps": 7809, "total_steps": 9134, "loss": 1.0589, "learning_rate": 2.55146727375562e-06, "epoch": 0.8548674019540765, "percentage": 85.49, "elapsed_time": "5 days, 23:10:49", "remaining_time": "1 day, 0:17:39", "throughput": 2735.73, "total_tokens": 1410129504} {"current_steps": 7810, "total_steps": 9134, "loss": 0.712, "learning_rate": 2.547684217095528e-06, "epoch": 0.8549768740250143, "percentage": 85.5, "elapsed_time": "5 days, 23:11:57", "remaining_time": "1 day, 0:16:33", "throughput": 2735.78, "total_tokens": 1410342080} {"current_steps": 7811, "total_steps": 9134, "loss": 1.0402, "learning_rate": 2.5439038165014666e-06, "epoch": 0.8550863460959522, "percentage": 85.52, "elapsed_time": "5 days, 23:13:04", "remaining_time": "1 day, 0:15:27", "throughput": 2735.78, "total_tokens": 1410527328} {"current_steps": 7812, "total_steps": 9134, "loss": 0.5315, "learning_rate": 2.5401260724206537e-06, "epoch": 0.8551958181668902, "percentage": 85.53, "elapsed_time": "5 days, 23:14:07", "remaining_time": "1 day, 0:14:21", "throughput": 2735.82, "total_tokens": 1410716832} {"current_steps": 7813, "total_steps": 9134, "loss": 1.1034, "learning_rate": 2.5363509852999983e-06, "epoch": 0.8553052902378281, "percentage": 85.54, "elapsed_time": "5 days, 23:15:15", "remaining_time": "1 day, 0:13:15", "throughput": 2735.86, "total_tokens": 1410928736} {"current_steps": 7814, "total_steps": 9134, "loss": 0.959, "learning_rate": 2.532578555586068e-06, "epoch": 0.855414762308766, "percentage": 85.55, "elapsed_time": "5 days, 23:16:21", "remaining_time": "1 day, 0:12:09", "throughput": 2735.89, "total_tokens": 1411123168} {"current_steps": 7815, "total_steps": 9134, "loss": 0.9765, "learning_rate": 2.5288087837251564e-06, "epoch": 0.8555242343797039, "percentage": 85.56, "elapsed_time": "5 days, 23:17:24", "remaining_time": "1 day, 0:11:03", "throughput": 2735.89, "total_tokens": 1411292512} {"current_steps": 7816, "total_steps": 9134, "loss": 0.9359, "learning_rate": 2.5250416701631976e-06, "epoch": 0.8556337064506417, "percentage": 85.57, "elapsed_time": "5 days, 23:18:31", "remaining_time": "1 day, 0:09:57", "throughput": 2735.86, "total_tokens": 1411463424} {"current_steps": 7817, "total_steps": 9134, "loss": 0.7694, "learning_rate": 2.521277215345852e-06, "epoch": 0.8557431785215797, "percentage": 85.58, "elapsed_time": "5 days, 23:19:36", "remaining_time": "1 day, 0:08:51", "throughput": 2735.83, "total_tokens": 1411622688} {"current_steps": 7818, "total_steps": 9134, "loss": 0.9374, "learning_rate": 2.517515419718433e-06, "epoch": 0.8558526505925176, "percentage": 85.59, "elapsed_time": "5 days, 23:20:40", "remaining_time": "1 day, 0:07:44", "throughput": 2735.85, "total_tokens": 1411810624} {"current_steps": 7819, "total_steps": 9134, "loss": 0.6854, "learning_rate": 2.5137562837259626e-06, "epoch": 0.8559621226634555, "percentage": 85.6, "elapsed_time": "5 days, 23:21:46", "remaining_time": "1 day, 0:06:38", "throughput": 2735.85, "total_tokens": 1411989152} {"current_steps": 7820, "total_steps": 9134, "loss": 0.9311, "learning_rate": 2.5099998078131376e-06, "epoch": 0.8560715947343934, "percentage": 85.61, "elapsed_time": "5 days, 23:22:53", "remaining_time": "1 day, 0:05:33", "throughput": 2735.89, "total_tokens": 1412194336} {"current_steps": 7821, "total_steps": 9134, "loss": 0.867, "learning_rate": 2.5062459924243442e-06, "epoch": 0.8561810668053312, "percentage": 85.63, "elapsed_time": "5 days, 23:23:53", "remaining_time": "1 day, 0:04:25", "throughput": 2735.86, "total_tokens": 1412343072} {"current_steps": 7822, "total_steps": 9134, "loss": 0.936, "learning_rate": 2.5024948380036468e-06, "epoch": 0.8562905388762692, "percentage": 85.64, "elapsed_time": "5 days, 23:24:54", "remaining_time": "1 day, 0:03:19", "throughput": 2735.82, "total_tokens": 1412488448} {"current_steps": 7823, "total_steps": 9134, "loss": 0.9399, "learning_rate": 2.4987463449947986e-06, "epoch": 0.8564000109472071, "percentage": 85.65, "elapsed_time": "5 days, 23:25:59", "remaining_time": "1 day, 0:02:12", "throughput": 2735.84, "total_tokens": 1412679296} {"current_steps": 7824, "total_steps": 9134, "loss": 0.9686, "learning_rate": 2.495000513841253e-06, "epoch": 0.856509483018145, "percentage": 85.66, "elapsed_time": "5 days, 23:27:03", "remaining_time": "1 day, 0:01:06", "throughput": 2735.83, "total_tokens": 1412844160} {"current_steps": 7825, "total_steps": 9134, "loss": 0.7123, "learning_rate": 2.491257344986114e-06, "epoch": 0.8566189550890829, "percentage": 85.67, "elapsed_time": "5 days, 23:28:01", "remaining_time": "23:59:59", "throughput": 2735.79, "total_tokens": 1412986400} {"current_steps": 7826, "total_steps": 9134, "loss": 0.927, "learning_rate": 2.4875168388722057e-06, "epoch": 0.8567284271600208, "percentage": 85.68, "elapsed_time": "5 days, 23:29:09", "remaining_time": "23:58:53", "throughput": 2735.84, "total_tokens": 1413198752} {"current_steps": 7827, "total_steps": 9134, "loss": 0.7741, "learning_rate": 2.4837789959420184e-06, "epoch": 0.8568378992309587, "percentage": 85.69, "elapsed_time": "5 days, 23:30:17", "remaining_time": "23:57:47", "throughput": 2735.84, "total_tokens": 1413380192} {"current_steps": 7828, "total_steps": 9134, "loss": 1.1526, "learning_rate": 2.4800438166377337e-06, "epoch": 0.8569473713018966, "percentage": 85.7, "elapsed_time": "5 days, 23:31:23", "remaining_time": "23:56:41", "throughput": 2735.83, "total_tokens": 1413557824} {"current_steps": 7829, "total_steps": 9134, "loss": 0.7669, "learning_rate": 2.4763113014012155e-06, "epoch": 0.8570568433728345, "percentage": 85.71, "elapsed_time": "5 days, 23:32:27", "remaining_time": "23:55:35", "throughput": 2735.85, "total_tokens": 1413743072} {"current_steps": 7830, "total_steps": 9134, "loss": 0.9124, "learning_rate": 2.472581450674011e-06, "epoch": 0.8571663154437724, "percentage": 85.72, "elapsed_time": "5 days, 23:33:34", "remaining_time": "23:54:29", "throughput": 2735.89, "total_tokens": 1413950496} {"current_steps": 7831, "total_steps": 9134, "loss": 1.0738, "learning_rate": 2.468854264897355e-06, "epoch": 0.8572757875147103, "percentage": 85.73, "elapsed_time": "5 days, 23:34:41", "remaining_time": "23:53:23", "throughput": 2735.92, "total_tokens": 1414148064} {"current_steps": 7832, "total_steps": 9134, "loss": 0.8156, "learning_rate": 2.4651297445121625e-06, "epoch": 0.8573852595856483, "percentage": 85.75, "elapsed_time": "5 days, 23:35:45", "remaining_time": "23:52:17", "throughput": 2735.92, "total_tokens": 1414321440} {"current_steps": 7833, "total_steps": 9134, "loss": 1.0631, "learning_rate": 2.461407889959047e-06, "epoch": 0.8574947316565861, "percentage": 85.76, "elapsed_time": "5 days, 23:36:53", "remaining_time": "23:51:11", "throughput": 2735.97, "total_tokens": 1414532448} {"current_steps": 7834, "total_steps": 9134, "loss": 0.9928, "learning_rate": 2.4576887016782927e-06, "epoch": 0.857604203727524, "percentage": 85.77, "elapsed_time": "5 days, 23:37:55", "remaining_time": "23:50:05", "throughput": 2735.97, "total_tokens": 1414705152} {"current_steps": 7835, "total_steps": 9134, "loss": 0.7673, "learning_rate": 2.4539721801098704e-06, "epoch": 0.8577136757984619, "percentage": 85.78, "elapsed_time": "5 days, 23:39:02", "remaining_time": "23:48:59", "throughput": 2735.95, "total_tokens": 1414876288} {"current_steps": 7836, "total_steps": 9134, "loss": 1.0046, "learning_rate": 2.4502583256934388e-06, "epoch": 0.8578231478693998, "percentage": 85.79, "elapsed_time": "5 days, 23:40:05", "remaining_time": "23:47:52", "throughput": 2735.94, "total_tokens": 1415042944} {"current_steps": 7837, "total_steps": 9134, "loss": 0.872, "learning_rate": 2.4465471388683383e-06, "epoch": 0.8579326199403378, "percentage": 85.8, "elapsed_time": "5 days, 23:41:07", "remaining_time": "23:46:46", "throughput": 2735.93, "total_tokens": 1415205792} {"current_steps": 7838, "total_steps": 9134, "loss": 0.6125, "learning_rate": 2.4428386200735924e-06, "epoch": 0.8580420920112756, "percentage": 85.81, "elapsed_time": "5 days, 23:42:14", "remaining_time": "23:45:40", "throughput": 2735.96, "total_tokens": 1415408288} {"current_steps": 7839, "total_steps": 9134, "loss": 0.6882, "learning_rate": 2.439132769747926e-06, "epoch": 0.8581515640822135, "percentage": 85.82, "elapsed_time": "5 days, 23:43:19", "remaining_time": "23:44:34", "throughput": 2735.98, "total_tokens": 1415593536} {"current_steps": 7840, "total_steps": 9134, "loss": 0.9777, "learning_rate": 2.435429588329716e-06, "epoch": 0.8582610361531514, "percentage": 85.83, "elapsed_time": "5 days, 23:44:27", "remaining_time": "23:43:28", "throughput": 2736.03, "total_tokens": 1415807680} {"current_steps": 7841, "total_steps": 9134, "loss": 1.1333, "learning_rate": 2.431729076257053e-06, "epoch": 0.8583705082240893, "percentage": 85.84, "elapsed_time": "5 days, 23:45:33", "remaining_time": "23:42:22", "throughput": 2736.05, "total_tokens": 1415999200} {"current_steps": 7842, "total_steps": 9134, "loss": 0.8651, "learning_rate": 2.4280312339676953e-06, "epoch": 0.8584799802950273, "percentage": 85.86, "elapsed_time": "5 days, 23:46:34", "remaining_time": "23:41:15", "throughput": 2736.04, "total_tokens": 1416158688} {"current_steps": 7843, "total_steps": 9134, "loss": 0.8586, "learning_rate": 2.4243360618990934e-06, "epoch": 0.8585894523659652, "percentage": 85.87, "elapsed_time": "5 days, 23:47:42", "remaining_time": "23:40:09", "throughput": 2736.08, "total_tokens": 1416366336} {"current_steps": 7844, "total_steps": 9134, "loss": 0.9977, "learning_rate": 2.4206435604883782e-06, "epoch": 0.858698924436903, "percentage": 85.88, "elapsed_time": "5 days, 23:48:48", "remaining_time": "23:39:03", "throughput": 2736.09, "total_tokens": 1416551584} {"current_steps": 7845, "total_steps": 9134, "loss": 0.8665, "learning_rate": 2.416953730172361e-06, "epoch": 0.8588083965078409, "percentage": 85.89, "elapsed_time": "5 days, 23:49:51", "remaining_time": "23:37:57", "throughput": 2736.06, "total_tokens": 1416710176} {"current_steps": 7846, "total_steps": 9134, "loss": 0.8248, "learning_rate": 2.4132665713875542e-06, "epoch": 0.8589178685787788, "percentage": 85.9, "elapsed_time": "5 days, 23:50:56", "remaining_time": "23:36:51", "throughput": 2736.06, "total_tokens": 1416887808} {"current_steps": 7847, "total_steps": 9134, "loss": 1.0299, "learning_rate": 2.409582084570125e-06, "epoch": 0.8590273406497168, "percentage": 85.91, "elapsed_time": "5 days, 23:52:03", "remaining_time": "23:35:45", "throughput": 2736.05, "total_tokens": 1417063424} {"current_steps": 7848, "total_steps": 9134, "loss": 0.7771, "learning_rate": 2.4059002701559587e-06, "epoch": 0.8591368127206547, "percentage": 85.92, "elapsed_time": "5 days, 23:53:08", "remaining_time": "23:34:39", "throughput": 2736.06, "total_tokens": 1417249344} {"current_steps": 7849, "total_steps": 9134, "loss": 1.0066, "learning_rate": 2.4022211285805895e-06, "epoch": 0.8592462847915926, "percentage": 85.93, "elapsed_time": "5 days, 23:54:12", "remaining_time": "23:33:33", "throughput": 2736.08, "total_tokens": 1417431904} {"current_steps": 7850, "total_steps": 9134, "loss": 0.9284, "learning_rate": 2.39854466027927e-06, "epoch": 0.8593557568625304, "percentage": 85.94, "elapsed_time": "5 days, 23:55:15", "remaining_time": "23:32:26", "throughput": 2736.11, "total_tokens": 1417621184} {"current_steps": 7851, "total_steps": 9134, "loss": 0.8133, "learning_rate": 2.394870865686899e-06, "epoch": 0.8594652289334683, "percentage": 85.95, "elapsed_time": "5 days, 23:56:19", "remaining_time": "23:31:20", "throughput": 2736.09, "total_tokens": 1417787840} {"current_steps": 7852, "total_steps": 9134, "loss": 0.8186, "learning_rate": 2.3911997452380987e-06, "epoch": 0.8595747010044062, "percentage": 85.96, "elapsed_time": "5 days, 23:57:22", "remaining_time": "23:30:13", "throughput": 2736.07, "total_tokens": 1417950464} {"current_steps": 7853, "total_steps": 9134, "loss": 0.9724, "learning_rate": 2.387531299367146e-06, "epoch": 0.8596841730753442, "percentage": 85.98, "elapsed_time": "5 days, 23:58:27", "remaining_time": "23:29:07", "throughput": 2736.06, "total_tokens": 1418118464} {"current_steps": 7854, "total_steps": 9134, "loss": 0.8241, "learning_rate": 2.3838655285080085e-06, "epoch": 0.8597936451462821, "percentage": 85.99, "elapsed_time": "5 days, 23:59:34", "remaining_time": "23:28:01", "throughput": 2736.1, "total_tokens": 1418322976} {"current_steps": 7855, "total_steps": 9134, "loss": 0.8793, "learning_rate": 2.3802024330943556e-06, "epoch": 0.8599031172172199, "percentage": 86.0, "elapsed_time": "6 days, 0:00:30", "remaining_time": "23:26:54", "throughput": 2736.07, "total_tokens": 1418464544} {"current_steps": 7856, "total_steps": 9134, "loss": 0.8008, "learning_rate": 2.376542013559502e-06, "epoch": 0.8600125892881578, "percentage": 86.01, "elapsed_time": "6 days, 0:01:37", "remaining_time": "23:25:48", "throughput": 2736.07, "total_tokens": 1418648224} {"current_steps": 7857, "total_steps": 9134, "loss": 0.7788, "learning_rate": 2.3728842703364894e-06, "epoch": 0.8601220613590957, "percentage": 86.02, "elapsed_time": "6 days, 0:02:42", "remaining_time": "23:24:42", "throughput": 2736.11, "total_tokens": 1418841984} {"current_steps": 7858, "total_steps": 9134, "loss": 0.8563, "learning_rate": 2.3692292038580006e-06, "epoch": 0.8602315334300337, "percentage": 86.03, "elapsed_time": "6 days, 0:03:47", "remaining_time": "23:23:35", "throughput": 2736.11, "total_tokens": 1419022080} {"current_steps": 7859, "total_steps": 9134, "loss": 0.692, "learning_rate": 2.3655768145564416e-06, "epoch": 0.8603410055009716, "percentage": 86.04, "elapsed_time": "6 days, 0:04:51", "remaining_time": "23:22:29", "throughput": 2736.15, "total_tokens": 1419219648} {"current_steps": 7860, "total_steps": 9134, "loss": 0.655, "learning_rate": 2.361927102863873e-06, "epoch": 0.8604504775719095, "percentage": 86.05, "elapsed_time": "6 days, 0:05:56", "remaining_time": "23:21:23", "throughput": 2736.14, "total_tokens": 1419388768} {"current_steps": 7861, "total_steps": 9134, "loss": 1.0623, "learning_rate": 2.3582800692120542e-06, "epoch": 0.8605599496428473, "percentage": 86.06, "elapsed_time": "6 days, 0:07:03", "remaining_time": "23:20:17", "throughput": 2736.16, "total_tokens": 1419586112} {"current_steps": 7862, "total_steps": 9134, "loss": 0.8117, "learning_rate": 2.354635714032419e-06, "epoch": 0.8606694217137852, "percentage": 86.07, "elapsed_time": "6 days, 0:08:06", "remaining_time": "23:19:11", "throughput": 2736.16, "total_tokens": 1419757472} {"current_steps": 7863, "total_steps": 9134, "loss": 1.0653, "learning_rate": 2.3509940377560878e-06, "epoch": 0.8607788937847232, "percentage": 86.08, "elapsed_time": "6 days, 0:09:14", "remaining_time": "23:18:05", "throughput": 2736.14, "total_tokens": 1419934208} {"current_steps": 7864, "total_steps": 9134, "loss": 1.0587, "learning_rate": 2.3473550408138645e-06, "epoch": 0.8608883658556611, "percentage": 86.1, "elapsed_time": "6 days, 0:10:21", "remaining_time": "23:16:59", "throughput": 2736.12, "total_tokens": 1420104896} {"current_steps": 7865, "total_steps": 9134, "loss": 0.9916, "learning_rate": 2.343718723636232e-06, "epoch": 0.860997837926599, "percentage": 86.11, "elapsed_time": "6 days, 0:11:24", "remaining_time": "23:15:53", "throughput": 2736.13, "total_tokens": 1420281408} {"current_steps": 7866, "total_steps": 9134, "loss": 0.8977, "learning_rate": 2.3400850866533654e-06, "epoch": 0.8611073099975369, "percentage": 86.12, "elapsed_time": "6 days, 0:12:26", "remaining_time": "23:14:46", "throughput": 2736.11, "total_tokens": 1420445600} {"current_steps": 7867, "total_steps": 9134, "loss": 0.902, "learning_rate": 2.3364541302951154e-06, "epoch": 0.8612167820684747, "percentage": 86.13, "elapsed_time": "6 days, 0:13:34", "remaining_time": "23:13:40", "throughput": 2736.12, "total_tokens": 1420635104} {"current_steps": 7868, "total_steps": 9134, "loss": 0.8734, "learning_rate": 2.3328258549910166e-06, "epoch": 0.8613262541394127, "percentage": 86.14, "elapsed_time": "6 days, 0:14:40", "remaining_time": "23:12:34", "throughput": 2736.11, "total_tokens": 1420809824} {"current_steps": 7869, "total_steps": 9134, "loss": 0.9852, "learning_rate": 2.3292002611702863e-06, "epoch": 0.8614357262103506, "percentage": 86.15, "elapsed_time": "6 days, 0:15:48", "remaining_time": "23:11:29", "throughput": 2736.1, "total_tokens": 1420987232} {"current_steps": 7870, "total_steps": 9134, "loss": 0.9151, "learning_rate": 2.325577349261826e-06, "epoch": 0.8615451982812885, "percentage": 86.16, "elapsed_time": "6 days, 0:16:53", "remaining_time": "23:10:22", "throughput": 2736.12, "total_tokens": 1421175840} {"current_steps": 7871, "total_steps": 9134, "loss": 0.9278, "learning_rate": 2.321957119694221e-06, "epoch": 0.8616546703522264, "percentage": 86.17, "elapsed_time": "6 days, 0:17:59", "remaining_time": "23:09:17", "throughput": 2736.15, "total_tokens": 1421374752} {"current_steps": 7872, "total_steps": 9134, "loss": 1.0867, "learning_rate": 2.3183395728957334e-06, "epoch": 0.8617641424231642, "percentage": 86.18, "elapsed_time": "6 days, 0:19:07", "remaining_time": "23:08:11", "throughput": 2736.19, "total_tokens": 1421580384} {"current_steps": 7873, "total_steps": 9134, "loss": 0.8585, "learning_rate": 2.3147247092943107e-06, "epoch": 0.8618736144941022, "percentage": 86.19, "elapsed_time": "6 days, 0:20:15", "remaining_time": "23:07:05", "throughput": 2736.23, "total_tokens": 1421784448} {"current_steps": 7874, "total_steps": 9134, "loss": 0.8153, "learning_rate": 2.311112529317591e-06, "epoch": 0.8619830865650401, "percentage": 86.21, "elapsed_time": "6 days, 0:21:13", "remaining_time": "23:05:58", "throughput": 2736.2, "total_tokens": 1421932960} {"current_steps": 7875, "total_steps": 9134, "loss": 0.8775, "learning_rate": 2.307503033392888e-06, "epoch": 0.862092558635978, "percentage": 86.22, "elapsed_time": "6 days, 0:22:21", "remaining_time": "23:04:52", "throughput": 2736.24, "total_tokens": 1422136128} {"current_steps": 7876, "total_steps": 9134, "loss": 0.8707, "learning_rate": 2.303896221947194e-06, "epoch": 0.8622020307069159, "percentage": 86.23, "elapsed_time": "6 days, 0:23:23", "remaining_time": "23:03:45", "throughput": 2736.25, "total_tokens": 1422313536} {"current_steps": 7877, "total_steps": 9134, "loss": 0.9514, "learning_rate": 2.3002920954071916e-06, "epoch": 0.8623115027778538, "percentage": 86.24, "elapsed_time": "6 days, 0:24:22", "remaining_time": "23:02:38", "throughput": 2736.25, "total_tokens": 1422473472} {"current_steps": 7878, "total_steps": 9134, "loss": 0.7847, "learning_rate": 2.296690654199238e-06, "epoch": 0.8624209748487917, "percentage": 86.25, "elapsed_time": "6 days, 0:25:28", "remaining_time": "23:01:32", "throughput": 2736.27, "total_tokens": 1422662080} {"current_steps": 7879, "total_steps": 9134, "loss": 0.7288, "learning_rate": 2.293091898749378e-06, "epoch": 0.8625304469197296, "percentage": 86.26, "elapsed_time": "6 days, 0:26:33", "remaining_time": "23:00:26", "throughput": 2736.26, "total_tokens": 1422838816} {"current_steps": 7880, "total_steps": 9134, "loss": 0.8464, "learning_rate": 2.2894958294833317e-06, "epoch": 0.8626399189906675, "percentage": 86.27, "elapsed_time": "6 days, 0:27:35", "remaining_time": "22:59:20", "throughput": 2736.25, "total_tokens": 1423000768} {"current_steps": 7881, "total_steps": 9134, "loss": 0.8793, "learning_rate": 2.2859024468265265e-06, "epoch": 0.8627493910616054, "percentage": 86.28, "elapsed_time": "6 days, 0:28:40", "remaining_time": "22:58:14", "throughput": 2736.25, "total_tokens": 1423182880} {"current_steps": 7882, "total_steps": 9134, "loss": 0.9295, "learning_rate": 2.2823117512040304e-06, "epoch": 0.8628588631325433, "percentage": 86.29, "elapsed_time": "6 days, 0:29:42", "remaining_time": "22:57:07", "throughput": 2736.26, "total_tokens": 1423353792} {"current_steps": 7883, "total_steps": 9134, "loss": 0.8576, "learning_rate": 2.2787237430406285e-06, "epoch": 0.8629683352034813, "percentage": 86.3, "elapsed_time": "6 days, 0:30:41", "remaining_time": "22:56:00", "throughput": 2736.24, "total_tokens": 1423506560} {"current_steps": 7884, "total_steps": 9134, "loss": 1.2177, "learning_rate": 2.2751384227607727e-06, "epoch": 0.8630778072744191, "percentage": 86.31, "elapsed_time": "6 days, 0:31:47", "remaining_time": "22:54:54", "throughput": 2736.27, "total_tokens": 1423701440} {"current_steps": 7885, "total_steps": 9134, "loss": 0.971, "learning_rate": 2.2715557907885986e-06, "epoch": 0.863187279345357, "percentage": 86.33, "elapsed_time": "6 days, 0:32:51", "remaining_time": "22:53:47", "throughput": 2736.26, "total_tokens": 1423872800} {"current_steps": 7886, "total_steps": 9134, "loss": 1.0315, "learning_rate": 2.2679758475479235e-06, "epoch": 0.8632967514162949, "percentage": 86.34, "elapsed_time": "6 days, 0:33:55", "remaining_time": "22:52:41", "throughput": 2736.28, "total_tokens": 1424060512} {"current_steps": 7887, "total_steps": 9134, "loss": 0.9044, "learning_rate": 2.264398593462247e-06, "epoch": 0.8634062234872328, "percentage": 86.35, "elapsed_time": "6 days, 0:35:03", "remaining_time": "22:51:35", "throughput": 2736.37, "total_tokens": 1424288768} {"current_steps": 7888, "total_steps": 9134, "loss": 1.0692, "learning_rate": 2.260824028954764e-06, "epoch": 0.8635156955581708, "percentage": 86.36, "elapsed_time": "6 days, 0:36:05", "remaining_time": "22:50:29", "throughput": 2736.35, "total_tokens": 1424446016} {"current_steps": 7889, "total_steps": 9134, "loss": 0.7548, "learning_rate": 2.2572521544483166e-06, "epoch": 0.8636251676291086, "percentage": 86.37, "elapsed_time": "6 days, 0:37:10", "remaining_time": "22:49:23", "throughput": 2736.35, "total_tokens": 1424625440} {"current_steps": 7890, "total_steps": 9134, "loss": 0.7942, "learning_rate": 2.2536829703654727e-06, "epoch": 0.8637346397000465, "percentage": 86.38, "elapsed_time": "6 days, 0:38:16", "remaining_time": "22:48:17", "throughput": 2736.37, "total_tokens": 1424815168} {"current_steps": 7891, "total_steps": 9134, "loss": 0.8447, "learning_rate": 2.2501164771284418e-06, "epoch": 0.8638441117709844, "percentage": 86.39, "elapsed_time": "6 days, 0:39:23", "remaining_time": "22:47:11", "throughput": 2736.41, "total_tokens": 1425019456} {"current_steps": 7892, "total_steps": 9134, "loss": 0.6941, "learning_rate": 2.246552675159147e-06, "epoch": 0.8639535838419223, "percentage": 86.4, "elapsed_time": "6 days, 0:40:26", "remaining_time": "22:46:04", "throughput": 2736.4, "total_tokens": 1425190144} {"current_steps": 7893, "total_steps": 9134, "loss": 0.9953, "learning_rate": 2.2429915648791684e-06, "epoch": 0.8640630559128603, "percentage": 86.41, "elapsed_time": "6 days, 0:41:33", "remaining_time": "22:44:58", "throughput": 2736.46, "total_tokens": 1425405856} {"current_steps": 7894, "total_steps": 9134, "loss": 0.8594, "learning_rate": 2.239433146709785e-06, "epoch": 0.8641725279837982, "percentage": 86.42, "elapsed_time": "6 days, 0:42:37", "remaining_time": "22:43:52", "throughput": 2736.46, "total_tokens": 1425579904} {"current_steps": 7895, "total_steps": 9134, "loss": 0.9179, "learning_rate": 2.2358774210719523e-06, "epoch": 0.864282000054736, "percentage": 86.44, "elapsed_time": "6 days, 0:43:39", "remaining_time": "22:42:46", "throughput": 2736.42, "total_tokens": 1425729312} {"current_steps": 7896, "total_steps": 9134, "loss": 0.8734, "learning_rate": 2.2323243883862976e-06, "epoch": 0.8643914721256739, "percentage": 86.45, "elapsed_time": "6 days, 0:44:45", "remaining_time": "22:41:40", "throughput": 2736.4, "total_tokens": 1425897984} {"current_steps": 7897, "total_steps": 9134, "loss": 0.9315, "learning_rate": 2.2287740490731514e-06, "epoch": 0.8645009441966118, "percentage": 86.46, "elapsed_time": "6 days, 0:45:53", "remaining_time": "22:40:34", "throughput": 2736.43, "total_tokens": 1426101600} {"current_steps": 7898, "total_steps": 9134, "loss": 0.7682, "learning_rate": 2.2252264035524968e-06, "epoch": 0.8646104162675498, "percentage": 86.47, "elapsed_time": "6 days, 0:46:57", "remaining_time": "22:39:28", "throughput": 2736.45, "total_tokens": 1426287520} {"current_steps": 7899, "total_steps": 9134, "loss": 0.8621, "learning_rate": 2.2216814522440233e-06, "epoch": 0.8647198883384877, "percentage": 86.48, "elapsed_time": "6 days, 0:48:03", "remaining_time": "22:38:22", "throughput": 2736.49, "total_tokens": 1426484416} {"current_steps": 7900, "total_steps": 9134, "loss": 0.7531, "learning_rate": 2.21813919556709e-06, "epoch": 0.8648293604094256, "percentage": 86.49, "elapsed_time": "6 days, 0:49:11", "remaining_time": "22:37:16", "throughput": 2736.5, "total_tokens": 1426677056} {"current_steps": 7901, "total_steps": 9134, "loss": 0.8248, "learning_rate": 2.214599633940739e-06, "epoch": 0.8649388324803634, "percentage": 86.5, "elapsed_time": "6 days, 0:50:18", "remaining_time": "22:36:10", "throughput": 2736.52, "total_tokens": 1426873280} {"current_steps": 7902, "total_steps": 9134, "loss": 0.8414, "learning_rate": 2.211062767783692e-06, "epoch": 0.8650483045513013, "percentage": 86.51, "elapsed_time": "6 days, 0:51:25", "remaining_time": "22:35:04", "throughput": 2736.5, "total_tokens": 1427047328} {"current_steps": 7903, "total_steps": 9134, "loss": 0.7419, "learning_rate": 2.207528597514355e-06, "epoch": 0.8651577766222392, "percentage": 86.52, "elapsed_time": "6 days, 0:52:27", "remaining_time": "22:33:58", "throughput": 2736.46, "total_tokens": 1427194272} {"current_steps": 7904, "total_steps": 9134, "loss": 0.7807, "learning_rate": 2.2039971235508135e-06, "epoch": 0.8652672486931772, "percentage": 86.53, "elapsed_time": "6 days, 0:53:34", "remaining_time": "22:32:52", "throughput": 2736.48, "total_tokens": 1427386016} {"current_steps": 7905, "total_steps": 9134, "loss": 1.0509, "learning_rate": 2.200468346310833e-06, "epoch": 0.8653767207641151, "percentage": 86.54, "elapsed_time": "6 days, 0:54:41", "remaining_time": "22:31:46", "throughput": 2736.54, "total_tokens": 1427602176} {"current_steps": 7906, "total_steps": 9134, "loss": 1.077, "learning_rate": 2.1969422662118572e-06, "epoch": 0.8654861928350529, "percentage": 86.56, "elapsed_time": "6 days, 0:55:40", "remaining_time": "22:30:39", "throughput": 2736.5, "total_tokens": 1427741952} {"current_steps": 7907, "total_steps": 9134, "loss": 1.0904, "learning_rate": 2.193418883671025e-06, "epoch": 0.8655956649059908, "percentage": 86.57, "elapsed_time": "6 days, 0:56:47", "remaining_time": "22:29:33", "throughput": 2736.5, "total_tokens": 1427925184} {"current_steps": 7908, "total_steps": 9134, "loss": 0.6643, "learning_rate": 2.189898199105139e-06, "epoch": 0.8657051369769287, "percentage": 86.58, "elapsed_time": "6 days, 0:57:53", "remaining_time": "22:28:27", "throughput": 2736.49, "total_tokens": 1428103040} {"current_steps": 7909, "total_steps": 9134, "loss": 0.7444, "learning_rate": 2.1863802129306886e-06, "epoch": 0.8658146090478667, "percentage": 86.59, "elapsed_time": "6 days, 0:58:59", "remaining_time": "22:27:21", "throughput": 2736.48, "total_tokens": 1428278208} {"current_steps": 7910, "total_steps": 9134, "loss": 1.0175, "learning_rate": 2.182864925563849e-06, "epoch": 0.8659240811188046, "percentage": 86.6, "elapsed_time": "6 days, 1:00:05", "remaining_time": "22:26:15", "throughput": 2736.5, "total_tokens": 1428468608} {"current_steps": 7911, "total_steps": 9134, "loss": 0.7739, "learning_rate": 2.1793523374204706e-06, "epoch": 0.8660335531897425, "percentage": 86.61, "elapsed_time": "6 days, 1:01:08", "remaining_time": "22:25:09", "throughput": 2736.49, "total_tokens": 1428634816} {"current_steps": 7912, "total_steps": 9134, "loss": 0.5897, "learning_rate": 2.175842448916085e-06, "epoch": 0.8661430252606803, "percentage": 86.62, "elapsed_time": "6 days, 1:02:15", "remaining_time": "22:24:03", "throughput": 2736.49, "total_tokens": 1428819616} {"current_steps": 7913, "total_steps": 9134, "loss": 0.75, "learning_rate": 2.1723352604658994e-06, "epoch": 0.8662524973316182, "percentage": 86.63, "elapsed_time": "6 days, 1:03:16", "remaining_time": "22:22:56", "throughput": 2736.47, "total_tokens": 1428977984} {"current_steps": 7914, "total_steps": 9134, "loss": 0.6415, "learning_rate": 2.1688307724848227e-06, "epoch": 0.8663619694025562, "percentage": 86.64, "elapsed_time": "6 days, 1:04:22", "remaining_time": "22:21:50", "throughput": 2736.49, "total_tokens": 1429164128} {"current_steps": 7915, "total_steps": 9134, "loss": 0.9209, "learning_rate": 2.1653289853874103e-06, "epoch": 0.8664714414734941, "percentage": 86.65, "elapsed_time": "6 days, 1:05:23", "remaining_time": "22:20:43", "throughput": 2736.47, "total_tokens": 1429324064} {"current_steps": 7916, "total_steps": 9134, "loss": 0.8351, "learning_rate": 2.161829899587933e-06, "epoch": 0.866580913544432, "percentage": 86.67, "elapsed_time": "6 days, 1:06:31", "remaining_time": "22:19:38", "throughput": 2736.47, "total_tokens": 1429507520} {"current_steps": 7917, "total_steps": 9134, "loss": 1.0325, "learning_rate": 2.158333515500316e-06, "epoch": 0.8666903856153699, "percentage": 86.68, "elapsed_time": "6 days, 1:07:36", "remaining_time": "22:18:31", "throughput": 2736.46, "total_tokens": 1429681792} {"current_steps": 7918, "total_steps": 9134, "loss": 0.9532, "learning_rate": 2.1548398335381802e-06, "epoch": 0.8667998576863077, "percentage": 86.69, "elapsed_time": "6 days, 1:08:41", "remaining_time": "22:17:25", "throughput": 2736.49, "total_tokens": 1429875776} {"current_steps": 7919, "total_steps": 9134, "loss": 0.7295, "learning_rate": 2.151348854114821e-06, "epoch": 0.8669093297572457, "percentage": 86.7, "elapsed_time": "6 days, 1:09:47", "remaining_time": "22:16:19", "throughput": 2736.53, "total_tokens": 1430077824} {"current_steps": 7920, "total_steps": 9134, "loss": 0.9101, "learning_rate": 2.147860577643207e-06, "epoch": 0.8670188018281836, "percentage": 86.71, "elapsed_time": "6 days, 1:10:55", "remaining_time": "22:15:14", "throughput": 2736.56, "total_tokens": 1430275840} {"current_steps": 7921, "total_steps": 9134, "loss": 1.249, "learning_rate": 2.144375004536012e-06, "epoch": 0.8671282738991215, "percentage": 86.72, "elapsed_time": "6 days, 1:12:02", "remaining_time": "22:14:08", "throughput": 2736.6, "total_tokens": 1430482144} {"current_steps": 7922, "total_steps": 9134, "loss": 0.8179, "learning_rate": 2.1408921352055496e-06, "epoch": 0.8672377459700594, "percentage": 86.73, "elapsed_time": "6 days, 1:13:09", "remaining_time": "22:13:02", "throughput": 2736.65, "total_tokens": 1430691136} {"current_steps": 7923, "total_steps": 9134, "loss": 0.8916, "learning_rate": 2.1374119700638575e-06, "epoch": 0.8673472180409972, "percentage": 86.74, "elapsed_time": "6 days, 1:14:14", "remaining_time": "22:11:56", "throughput": 2736.63, "total_tokens": 1430857344} {"current_steps": 7924, "total_steps": 9134, "loss": 0.7561, "learning_rate": 2.1339345095226144e-06, "epoch": 0.8674566901119352, "percentage": 86.75, "elapsed_time": "6 days, 1:15:19", "remaining_time": "22:10:50", "throughput": 2736.67, "total_tokens": 1431059168} {"current_steps": 7925, "total_steps": 9134, "loss": 0.7718, "learning_rate": 2.1304597539932137e-06, "epoch": 0.8675661621828731, "percentage": 86.76, "elapsed_time": "6 days, 1:16:18", "remaining_time": "22:09:43", "throughput": 2736.65, "total_tokens": 1431208800} {"current_steps": 7926, "total_steps": 9134, "loss": 0.8912, "learning_rate": 2.1269877038867013e-06, "epoch": 0.867675634253811, "percentage": 86.77, "elapsed_time": "6 days, 1:17:21", "remaining_time": "22:08:36", "throughput": 2736.66, "total_tokens": 1431385088} {"current_steps": 7927, "total_steps": 9134, "loss": 0.941, "learning_rate": 2.1235183596138214e-06, "epoch": 0.8677851063247489, "percentage": 86.79, "elapsed_time": "6 days, 1:18:28", "remaining_time": "22:07:30", "throughput": 2736.69, "total_tokens": 1431588704} {"current_steps": 7928, "total_steps": 9134, "loss": 0.7733, "learning_rate": 2.120051721584984e-06, "epoch": 0.8678945783956868, "percentage": 86.8, "elapsed_time": "6 days, 1:19:36", "remaining_time": "22:06:25", "throughput": 2736.73, "total_tokens": 1431794336} {"current_steps": 7929, "total_steps": 9134, "loss": 1.0319, "learning_rate": 2.1165877902102867e-06, "epoch": 0.8680040504666247, "percentage": 86.81, "elapsed_time": "6 days, 1:20:40", "remaining_time": "22:05:18", "throughput": 2736.75, "total_tokens": 1431978240} {"current_steps": 7930, "total_steps": 9134, "loss": 0.8809, "learning_rate": 2.113126565899515e-06, "epoch": 0.8681135225375626, "percentage": 86.82, "elapsed_time": "6 days, 1:21:44", "remaining_time": "22:04:12", "throughput": 2736.77, "total_tokens": 1432164384} {"current_steps": 7931, "total_steps": 9134, "loss": 1.0229, "learning_rate": 2.1096680490621107e-06, "epoch": 0.8682229946085005, "percentage": 86.83, "elapsed_time": "6 days, 1:22:45", "remaining_time": "22:03:05", "throughput": 2736.76, "total_tokens": 1432323872} {"current_steps": 7932, "total_steps": 9134, "loss": 0.8813, "learning_rate": 2.106212240107225e-06, "epoch": 0.8683324666794384, "percentage": 86.84, "elapsed_time": "6 days, 1:23:47", "remaining_time": "22:01:59", "throughput": 2736.74, "total_tokens": 1432488512} {"current_steps": 7933, "total_steps": 9134, "loss": 0.6869, "learning_rate": 2.102759139443658e-06, "epoch": 0.8684419387503763, "percentage": 86.85, "elapsed_time": "6 days, 1:24:46", "remaining_time": "22:00:52", "throughput": 2736.7, "total_tokens": 1432624928} {"current_steps": 7934, "total_steps": 9134, "loss": 0.9822, "learning_rate": 2.0993087474799166e-06, "epoch": 0.8685514108213143, "percentage": 86.86, "elapsed_time": "6 days, 1:25:52", "remaining_time": "21:59:46", "throughput": 2736.76, "total_tokens": 1432839520} {"current_steps": 7935, "total_steps": 9134, "loss": 1.054, "learning_rate": 2.0958610646241717e-06, "epoch": 0.8686608828922521, "percentage": 86.87, "elapsed_time": "6 days, 1:26:59", "remaining_time": "21:58:40", "throughput": 2736.83, "total_tokens": 1433056576} {"current_steps": 7936, "total_steps": 9134, "loss": 0.7834, "learning_rate": 2.09241609128428e-06, "epoch": 0.86877035496319, "percentage": 86.88, "elapsed_time": "6 days, 1:28:02", "remaining_time": "21:57:33", "throughput": 2736.82, "total_tokens": 1433224128} {"current_steps": 7937, "total_steps": 9134, "loss": 0.887, "learning_rate": 2.0889738278677686e-06, "epoch": 0.8688798270341279, "percentage": 86.9, "elapsed_time": "6 days, 1:29:07", "remaining_time": "21:56:27", "throughput": 2736.82, "total_tokens": 1433401984} {"current_steps": 7938, "total_steps": 9134, "loss": 0.7389, "learning_rate": 2.085534274781853e-06, "epoch": 0.8689892991050658, "percentage": 86.91, "elapsed_time": "6 days, 1:30:13", "remaining_time": "21:55:21", "throughput": 2736.83, "total_tokens": 1433591264} {"current_steps": 7939, "total_steps": 9134, "loss": 0.8667, "learning_rate": 2.0820974324334356e-06, "epoch": 0.8690987711760038, "percentage": 86.92, "elapsed_time": "6 days, 1:31:16", "remaining_time": "21:54:15", "throughput": 2736.83, "total_tokens": 1433762176} {"current_steps": 7940, "total_steps": 9134, "loss": 1.0546, "learning_rate": 2.0786633012290723e-06, "epoch": 0.8692082432469416, "percentage": 86.93, "elapsed_time": "6 days, 1:32:21", "remaining_time": "21:53:09", "throughput": 2736.81, "total_tokens": 1433930848} {"current_steps": 7941, "total_steps": 9134, "loss": 0.8716, "learning_rate": 2.0752318815750265e-06, "epoch": 0.8693177153178795, "percentage": 86.94, "elapsed_time": "6 days, 1:33:21", "remaining_time": "21:52:02", "throughput": 2736.78, "total_tokens": 1434077120} {"current_steps": 7942, "total_steps": 9134, "loss": 0.7107, "learning_rate": 2.0718031738772265e-06, "epoch": 0.8694271873888174, "percentage": 86.95, "elapsed_time": "6 days, 1:34:26", "remaining_time": "21:50:56", "throughput": 2736.81, "total_tokens": 1434270432} {"current_steps": 7943, "total_steps": 9134, "loss": 0.6412, "learning_rate": 2.068377178541275e-06, "epoch": 0.8695366594597553, "percentage": 86.96, "elapsed_time": "6 days, 1:35:30", "remaining_time": "21:49:49", "throughput": 2736.79, "total_tokens": 1434432832} {"current_steps": 7944, "total_steps": 9134, "loss": 0.8234, "learning_rate": 2.0649538959724686e-06, "epoch": 0.8696461315306933, "percentage": 86.97, "elapsed_time": "6 days, 1:36:36", "remaining_time": "21:48:43", "throughput": 2736.78, "total_tokens": 1434610240} {"current_steps": 7945, "total_steps": 9134, "loss": 0.6637, "learning_rate": 2.0615333265757737e-06, "epoch": 0.8697556036016312, "percentage": 86.98, "elapsed_time": "6 days, 1:37:43", "remaining_time": "21:47:38", "throughput": 2736.79, "total_tokens": 1434799744} {"current_steps": 7946, "total_steps": 9134, "loss": 0.6997, "learning_rate": 2.058115470755831e-06, "epoch": 0.869865075672569, "percentage": 86.99, "elapsed_time": "6 days, 1:38:46", "remaining_time": "21:46:31", "throughput": 2736.78, "total_tokens": 1434969088} {"current_steps": 7947, "total_steps": 9134, "loss": 0.8498, "learning_rate": 2.0547003289169724e-06, "epoch": 0.8699745477435069, "percentage": 87.0, "elapsed_time": "6 days, 1:39:50", "remaining_time": "21:45:25", "throughput": 2736.75, "total_tokens": 1435127008} {"current_steps": 7948, "total_steps": 9134, "loss": 0.8177, "learning_rate": 2.0512879014631976e-06, "epoch": 0.8700840198144448, "percentage": 87.02, "elapsed_time": "6 days, 1:40:55", "remaining_time": "21:44:19", "throughput": 2736.81, "total_tokens": 1435333536} {"current_steps": 7949, "total_steps": 9134, "loss": 0.8377, "learning_rate": 2.047878188798197e-06, "epoch": 0.8701934918853828, "percentage": 87.03, "elapsed_time": "6 days, 1:42:03", "remaining_time": "21:43:13", "throughput": 2736.82, "total_tokens": 1435527296} {"current_steps": 7950, "total_steps": 9134, "loss": 0.7697, "learning_rate": 2.0444711913253312e-06, "epoch": 0.8703029639563207, "percentage": 87.04, "elapsed_time": "6 days, 1:43:07", "remaining_time": "21:42:07", "throughput": 2736.84, "total_tokens": 1435710304} {"current_steps": 7951, "total_steps": 9134, "loss": 0.8658, "learning_rate": 2.041066909447639e-06, "epoch": 0.8704124360272586, "percentage": 87.05, "elapsed_time": "6 days, 1:44:14", "remaining_time": "21:41:01", "throughput": 2736.86, "total_tokens": 1435906752} {"current_steps": 7952, "total_steps": 9134, "loss": 0.8749, "learning_rate": 2.0376653435678405e-06, "epoch": 0.8705219080981964, "percentage": 87.06, "elapsed_time": "6 days, 1:45:20", "remaining_time": "21:39:55", "throughput": 2736.9, "total_tokens": 1436108352} {"current_steps": 7953, "total_steps": 9134, "loss": 0.6855, "learning_rate": 2.0342664940883353e-06, "epoch": 0.8706313801691343, "percentage": 87.07, "elapsed_time": "6 days, 1:46:24", "remaining_time": "21:38:49", "throughput": 2736.9, "total_tokens": 1436282400} {"current_steps": 7954, "total_steps": 9134, "loss": 1.1256, "learning_rate": 2.030870361411202e-06, "epoch": 0.8707408522400722, "percentage": 87.08, "elapsed_time": "6 days, 1:47:30", "remaining_time": "21:37:43", "throughput": 2736.92, "total_tokens": 1436473696} {"current_steps": 7955, "total_steps": 9134, "loss": 1.1362, "learning_rate": 2.027476945938189e-06, "epoch": 0.8708503243110102, "percentage": 87.09, "elapsed_time": "6 days, 1:48:35", "remaining_time": "21:36:36", "throughput": 2736.91, "total_tokens": 1436646400} {"current_steps": 7956, "total_steps": 9134, "loss": 0.8049, "learning_rate": 2.0240862480707475e-06, "epoch": 0.8709597963819481, "percentage": 87.1, "elapsed_time": "6 days, 1:49:39", "remaining_time": "21:35:30", "throughput": 2736.93, "total_tokens": 1436832992} {"current_steps": 7957, "total_steps": 9134, "loss": 1.0491, "learning_rate": 2.0206982682099723e-06, "epoch": 0.8710692684528859, "percentage": 87.11, "elapsed_time": "6 days, 1:50:43", "remaining_time": "21:34:24", "throughput": 2736.97, "total_tokens": 1437024960} {"current_steps": 7958, "total_steps": 9134, "loss": 0.8016, "learning_rate": 2.017313006756666e-06, "epoch": 0.8711787405238238, "percentage": 87.13, "elapsed_time": "6 days, 1:51:48", "remaining_time": "21:33:18", "throughput": 2736.96, "total_tokens": 1437203040} {"current_steps": 7959, "total_steps": 9134, "loss": 0.8894, "learning_rate": 2.0139304641112966e-06, "epoch": 0.8712882125947617, "percentage": 87.14, "elapsed_time": "6 days, 1:52:56", "remaining_time": "21:32:12", "throughput": 2736.98, "total_tokens": 1437396800} {"current_steps": 7960, "total_steps": 9134, "loss": 0.9047, "learning_rate": 2.010550640674011e-06, "epoch": 0.8713976846656997, "percentage": 87.15, "elapsed_time": "6 days, 1:54:01", "remaining_time": "21:31:06", "throughput": 2736.98, "total_tokens": 1437573088} {"current_steps": 7961, "total_steps": 9134, "loss": 0.8187, "learning_rate": 2.0071735368446364e-06, "epoch": 0.8715071567366376, "percentage": 87.16, "elapsed_time": "6 days, 1:55:06", "remaining_time": "21:30:00", "throughput": 2737.02, "total_tokens": 1437775360} {"current_steps": 7962, "total_steps": 9134, "loss": 0.8468, "learning_rate": 2.003799153022673e-06, "epoch": 0.8716166288075755, "percentage": 87.17, "elapsed_time": "6 days, 1:56:13", "remaining_time": "21:28:54", "throughput": 2737.05, "total_tokens": 1437974272} {"current_steps": 7963, "total_steps": 9134, "loss": 0.7723, "learning_rate": 2.0004274896073176e-06, "epoch": 0.8717261008785133, "percentage": 87.18, "elapsed_time": "6 days, 1:57:18", "remaining_time": "21:27:48", "throughput": 2737.08, "total_tokens": 1438170720} {"current_steps": 7964, "total_steps": 9134, "loss": 0.97, "learning_rate": 1.9970585469974127e-06, "epoch": 0.8718355729494512, "percentage": 87.19, "elapsed_time": "6 days, 1:58:25", "remaining_time": "21:26:42", "throughput": 2737.12, "total_tokens": 1438372320} {"current_steps": 7965, "total_steps": 9134, "loss": 0.8117, "learning_rate": 1.9936923255915175e-06, "epoch": 0.8719450450203892, "percentage": 87.2, "elapsed_time": "6 days, 1:59:32", "remaining_time": "21:25:36", "throughput": 2737.18, "total_tokens": 1438589376} {"current_steps": 7966, "total_steps": 9134, "loss": 0.7077, "learning_rate": 1.9903288257878292e-06, "epoch": 0.8720545170913271, "percentage": 87.21, "elapsed_time": "6 days, 2:00:37", "remaining_time": "21:24:30", "throughput": 2737.21, "total_tokens": 1438776416} {"current_steps": 7967, "total_steps": 9134, "loss": 0.9362, "learning_rate": 1.986968047984261e-06, "epoch": 0.872163989162265, "percentage": 87.22, "elapsed_time": "6 days, 2:01:45", "remaining_time": "21:23:24", "throughput": 2737.25, "total_tokens": 1438984064} {"current_steps": 7968, "total_steps": 9134, "loss": 0.9842, "learning_rate": 1.983609992578375e-06, "epoch": 0.8722734612332029, "percentage": 87.23, "elapsed_time": "6 days, 2:02:50", "remaining_time": "21:22:18", "throughput": 2737.27, "total_tokens": 1439177376} {"current_steps": 7969, "total_steps": 9134, "loss": 1.1032, "learning_rate": 1.9802546599674313e-06, "epoch": 0.8723829333041407, "percentage": 87.25, "elapsed_time": "6 days, 2:03:54", "remaining_time": "21:21:12", "throughput": 2737.27, "total_tokens": 1439351424} {"current_steps": 7970, "total_steps": 9134, "loss": 0.9115, "learning_rate": 1.9769020505483544e-06, "epoch": 0.8724924053750787, "percentage": 87.26, "elapsed_time": "6 days, 2:04:59", "remaining_time": "21:20:06", "throughput": 2737.27, "total_tokens": 1439527040} {"current_steps": 7971, "total_steps": 9134, "loss": 0.9054, "learning_rate": 1.973552164717746e-06, "epoch": 0.8726018774460166, "percentage": 87.27, "elapsed_time": "6 days, 2:06:07", "remaining_time": "21:19:00", "throughput": 2737.31, "total_tokens": 1439734912} {"current_steps": 7972, "total_steps": 9134, "loss": 0.9975, "learning_rate": 1.9702050028719056e-06, "epoch": 0.8727113495169545, "percentage": 87.28, "elapsed_time": "6 days, 2:07:14", "remaining_time": "21:17:54", "throughput": 2737.31, "total_tokens": 1439918816} {"current_steps": 7973, "total_steps": 9134, "loss": 0.8377, "learning_rate": 1.9668605654067805e-06, "epoch": 0.8728208215878924, "percentage": 87.29, "elapsed_time": "6 days, 2:08:18", "remaining_time": "21:16:48", "throughput": 2737.31, "total_tokens": 1440094208} {"current_steps": 7974, "total_steps": 9134, "loss": 0.9173, "learning_rate": 1.9635188527180244e-06, "epoch": 0.8729302936588302, "percentage": 87.3, "elapsed_time": "6 days, 2:09:22", "remaining_time": "21:15:42", "throughput": 2737.32, "total_tokens": 1440272512} {"current_steps": 7975, "total_steps": 9134, "loss": 0.7722, "learning_rate": 1.960179865200948e-06, "epoch": 0.8730397657297682, "percentage": 87.31, "elapsed_time": "6 days, 2:10:21", "remaining_time": "21:14:35", "throughput": 2737.28, "total_tokens": 1440415872} {"current_steps": 7976, "total_steps": 9134, "loss": 0.83, "learning_rate": 1.9568436032505493e-06, "epoch": 0.8731492378007061, "percentage": 87.32, "elapsed_time": "6 days, 2:11:29", "remaining_time": "21:13:29", "throughput": 2737.28, "total_tokens": 1440602688} {"current_steps": 7977, "total_steps": 9134, "loss": 0.897, "learning_rate": 1.953510067261499e-06, "epoch": 0.873258709871644, "percentage": 87.33, "elapsed_time": "6 days, 2:12:35", "remaining_time": "21:12:23", "throughput": 2737.3, "total_tokens": 1440794656} {"current_steps": 7978, "total_steps": 9134, "loss": 1.0808, "learning_rate": 1.950179257628154e-06, "epoch": 0.8733681819425819, "percentage": 87.34, "elapsed_time": "6 days, 2:13:41", "remaining_time": "21:11:17", "throughput": 2737.33, "total_tokens": 1440986400} {"current_steps": 7979, "total_steps": 9134, "loss": 0.9389, "learning_rate": 1.946851174744538e-06, "epoch": 0.8734776540135198, "percentage": 87.35, "elapsed_time": "6 days, 2:14:45", "remaining_time": "21:10:11", "throughput": 2737.35, "total_tokens": 1441177024} {"current_steps": 7980, "total_steps": 9134, "loss": 0.8517, "learning_rate": 1.943525819004352e-06, "epoch": 0.8735871260844577, "percentage": 87.37, "elapsed_time": "6 days, 2:15:53", "remaining_time": "21:09:05", "throughput": 2737.38, "total_tokens": 1441377504} {"current_steps": 7981, "total_steps": 9134, "loss": 0.9728, "learning_rate": 1.9402031908009904e-06, "epoch": 0.8736965981553956, "percentage": 87.38, "elapsed_time": "6 days, 2:16:55", "remaining_time": "21:07:59", "throughput": 2737.37, "total_tokens": 1441543040} {"current_steps": 7982, "total_steps": 9134, "loss": 0.9247, "learning_rate": 1.936883290527508e-06, "epoch": 0.8738060702263335, "percentage": 87.39, "elapsed_time": "6 days, 2:18:02", "remaining_time": "21:06:53", "throughput": 2737.37, "total_tokens": 1441724256} {"current_steps": 7983, "total_steps": 9134, "loss": 0.8652, "learning_rate": 1.9335661185766436e-06, "epoch": 0.8739155422972714, "percentage": 87.4, "elapsed_time": "6 days, 2:19:08", "remaining_time": "21:05:47", "throughput": 2737.39, "total_tokens": 1441917344} {"current_steps": 7984, "total_steps": 9134, "loss": 0.8265, "learning_rate": 1.9302516753408136e-06, "epoch": 0.8740250143682093, "percentage": 87.41, "elapsed_time": "6 days, 2:20:11", "remaining_time": "21:04:40", "throughput": 2737.38, "total_tokens": 1442082432} {"current_steps": 7985, "total_steps": 9134, "loss": 0.8603, "learning_rate": 1.926939961212107e-06, "epoch": 0.8741344864391473, "percentage": 87.42, "elapsed_time": "6 days, 2:21:16", "remaining_time": "21:03:34", "throughput": 2737.42, "total_tokens": 1442282240} {"current_steps": 7986, "total_steps": 9134, "loss": 1.0881, "learning_rate": 1.923630976582294e-06, "epoch": 0.8742439585100851, "percentage": 87.43, "elapsed_time": "6 days, 2:22:19", "remaining_time": "21:02:28", "throughput": 2737.4, "total_tokens": 1442443296} {"current_steps": 7987, "total_steps": 9134, "loss": 1.0638, "learning_rate": 1.9203247218428226e-06, "epoch": 0.874353430581023, "percentage": 87.44, "elapsed_time": "6 days, 2:23:26", "remaining_time": "21:01:22", "throughput": 2737.41, "total_tokens": 1442633920} {"current_steps": 7988, "total_steps": 9134, "loss": 1.1263, "learning_rate": 1.9170211973848106e-06, "epoch": 0.8744629026519609, "percentage": 87.45, "elapsed_time": "6 days, 2:24:30", "remaining_time": "21:00:16", "throughput": 2737.4, "total_tokens": 1442801696} {"current_steps": 7989, "total_steps": 9134, "loss": 0.8317, "learning_rate": 1.9137204035990704e-06, "epoch": 0.8745723747228988, "percentage": 87.46, "elapsed_time": "6 days, 2:25:36", "remaining_time": "20:59:10", "throughput": 2737.42, "total_tokens": 1442992544} {"current_steps": 7990, "total_steps": 9134, "loss": 0.805, "learning_rate": 1.9104223408760698e-06, "epoch": 0.8746818467938368, "percentage": 87.48, "elapsed_time": "6 days, 2:26:39", "remaining_time": "20:58:03", "throughput": 2737.4, "total_tokens": 1443156288} {"current_steps": 7991, "total_steps": 9134, "loss": 0.9913, "learning_rate": 1.907127009605969e-06, "epoch": 0.8747913188647746, "percentage": 87.49, "elapsed_time": "6 days, 2:27:41", "remaining_time": "20:56:57", "throughput": 2737.37, "total_tokens": 1443312416} {"current_steps": 7992, "total_steps": 9134, "loss": 0.9264, "learning_rate": 1.9038344101785954e-06, "epoch": 0.8749007909357125, "percentage": 87.5, "elapsed_time": "6 days, 2:28:45", "remaining_time": "20:55:51", "throughput": 2737.35, "total_tokens": 1443474368} {"current_steps": 7993, "total_steps": 9134, "loss": 0.8144, "learning_rate": 1.9005445429834595e-06, "epoch": 0.8750102630066504, "percentage": 87.51, "elapsed_time": "6 days, 2:29:49", "remaining_time": "20:54:44", "throughput": 2737.35, "total_tokens": 1443650656} {"current_steps": 7994, "total_steps": 9134, "loss": 1.0021, "learning_rate": 1.8972574084097472e-06, "epoch": 0.8751197350775883, "percentage": 87.52, "elapsed_time": "6 days, 2:30:56", "remaining_time": "20:53:39", "throughput": 2737.37, "total_tokens": 1443844640} {"current_steps": 7995, "total_steps": 9134, "loss": 0.955, "learning_rate": 1.8939730068463114e-06, "epoch": 0.8752292071485263, "percentage": 87.53, "elapsed_time": "6 days, 2:32:04", "remaining_time": "20:52:33", "throughput": 2737.39, "total_tokens": 1444039744} {"current_steps": 7996, "total_steps": 9134, "loss": 0.8502, "learning_rate": 1.8906913386817077e-06, "epoch": 0.8753386792194642, "percentage": 87.54, "elapsed_time": "6 days, 2:33:09", "remaining_time": "20:51:27", "throughput": 2737.38, "total_tokens": 1444210880} {"current_steps": 7997, "total_steps": 9134, "loss": 0.8335, "learning_rate": 1.8874124043041314e-06, "epoch": 0.875448151290402, "percentage": 87.55, "elapsed_time": "6 days, 2:34:14", "remaining_time": "20:50:21", "throughput": 2737.39, "total_tokens": 1444397248} {"current_steps": 7998, "total_steps": 9134, "loss": 0.6665, "learning_rate": 1.8841362041014944e-06, "epoch": 0.8755576233613399, "percentage": 87.56, "elapsed_time": "6 days, 2:35:15", "remaining_time": "20:49:14", "throughput": 2737.4, "total_tokens": 1444570624} {"current_steps": 7999, "total_steps": 9134, "loss": 1.1255, "learning_rate": 1.8808627384613448e-06, "epoch": 0.8756670954322778, "percentage": 87.57, "elapsed_time": "6 days, 2:36:21", "remaining_time": "20:48:08", "throughput": 2737.43, "total_tokens": 1444762592} {"current_steps": 8000, "total_steps": 9134, "loss": 1.0141, "learning_rate": 1.8775920077709397e-06, "epoch": 0.8757765675032158, "percentage": 87.58, "elapsed_time": "6 days, 2:37:25", "remaining_time": "20:47:02", "throughput": 2737.43, "total_tokens": 1444942688} {"current_steps": 8001, "total_steps": 9134, "loss": 0.6989, "learning_rate": 1.8743240124172002e-06, "epoch": 0.8758860395741537, "percentage": 87.6, "elapsed_time": "6 days, 2:41:03", "remaining_time": "20:46:17", "throughput": 2736.62, "total_tokens": 1445108672} {"current_steps": 8002, "total_steps": 9134, "loss": 0.7678, "learning_rate": 1.8710587527867196e-06, "epoch": 0.8759955116450916, "percentage": 87.61, "elapsed_time": "6 days, 2:42:03", "remaining_time": "20:45:10", "throughput": 2736.58, "total_tokens": 1445253152} {"current_steps": 8003, "total_steps": 9134, "loss": 0.7638, "learning_rate": 1.8677962292657724e-06, "epoch": 0.8761049837160294, "percentage": 87.62, "elapsed_time": "6 days, 2:43:06", "remaining_time": "20:44:04", "throughput": 2736.57, "total_tokens": 1445420032} {"current_steps": 8004, "total_steps": 9134, "loss": 0.7675, "learning_rate": 1.8645364422403083e-06, "epoch": 0.8762144557869673, "percentage": 87.63, "elapsed_time": "6 days, 2:44:10", "remaining_time": "20:42:58", "throughput": 2736.58, "total_tokens": 1445598560} {"current_steps": 8005, "total_steps": 9134, "loss": 0.9291, "learning_rate": 1.8612793920959632e-06, "epoch": 0.8763239278579052, "percentage": 87.64, "elapsed_time": "6 days, 2:45:08", "remaining_time": "20:41:51", "throughput": 2736.56, "total_tokens": 1445749088} {"current_steps": 8006, "total_steps": 9134, "loss": 0.7447, "learning_rate": 1.8580250792180232e-06, "epoch": 0.8764333999288432, "percentage": 87.65, "elapsed_time": "6 days, 2:46:13", "remaining_time": "20:40:44", "throughput": 2736.58, "total_tokens": 1445935904} {"current_steps": 8007, "total_steps": 9134, "loss": 1.0742, "learning_rate": 1.8547735039914859e-06, "epoch": 0.8765428719997811, "percentage": 87.66, "elapsed_time": "6 days, 2:47:19", "remaining_time": "20:39:38", "throughput": 2736.59, "total_tokens": 1446120928} {"current_steps": 8008, "total_steps": 9134, "loss": 0.9839, "learning_rate": 1.8515246668009883e-06, "epoch": 0.8766523440707189, "percentage": 87.67, "elapsed_time": "6 days, 2:48:23", "remaining_time": "20:38:32", "throughput": 2736.59, "total_tokens": 1446295424} {"current_steps": 8009, "total_steps": 9134, "loss": 0.8744, "learning_rate": 1.8482785680308728e-06, "epoch": 0.8767618161416568, "percentage": 87.68, "elapsed_time": "6 days, 2:49:28", "remaining_time": "20:37:26", "throughput": 2736.62, "total_tokens": 1446488960} {"current_steps": 8010, "total_steps": 9134, "loss": 0.8698, "learning_rate": 1.845035208065146e-06, "epoch": 0.8768712882125947, "percentage": 87.69, "elapsed_time": "6 days, 2:50:32", "remaining_time": "20:36:20", "throughput": 2736.64, "total_tokens": 1446676000} {"current_steps": 8011, "total_steps": 9134, "loss": 0.8216, "learning_rate": 1.8417945872874875e-06, "epoch": 0.8769807602835327, "percentage": 87.71, "elapsed_time": "6 days, 2:51:33", "remaining_time": "20:35:13", "throughput": 2736.62, "total_tokens": 1446831232} {"current_steps": 8012, "total_steps": 9134, "loss": 1.0143, "learning_rate": 1.8385567060812598e-06, "epoch": 0.8770902323544706, "percentage": 87.72, "elapsed_time": "6 days, 2:52:38", "remaining_time": "20:34:07", "throughput": 2736.63, "total_tokens": 1447016928} {"current_steps": 8013, "total_steps": 9134, "loss": 0.7935, "learning_rate": 1.8353215648294925e-06, "epoch": 0.8771997044254085, "percentage": 87.73, "elapsed_time": "6 days, 2:53:42", "remaining_time": "20:33:01", "throughput": 2736.67, "total_tokens": 1447212928} {"current_steps": 8014, "total_steps": 9134, "loss": 0.8023, "learning_rate": 1.8320891639149101e-06, "epoch": 0.8773091764963463, "percentage": 87.74, "elapsed_time": "6 days, 2:54:45", "remaining_time": "20:31:54", "throughput": 2736.68, "total_tokens": 1447387424} {"current_steps": 8015, "total_steps": 9134, "loss": 0.8365, "learning_rate": 1.828859503719879e-06, "epoch": 0.8774186485672842, "percentage": 87.75, "elapsed_time": "6 days, 2:55:49", "remaining_time": "20:30:48", "throughput": 2736.67, "total_tokens": 1447562592} {"current_steps": 8016, "total_steps": 9134, "loss": 0.7126, "learning_rate": 1.82563258462648e-06, "epoch": 0.8775281206382222, "percentage": 87.76, "elapsed_time": "6 days, 2:56:51", "remaining_time": "20:29:41", "throughput": 2736.65, "total_tokens": 1447718720} {"current_steps": 8017, "total_steps": 9134, "loss": 0.7217, "learning_rate": 1.8224084070164405e-06, "epoch": 0.8776375927091601, "percentage": 87.77, "elapsed_time": "6 days, 2:57:55", "remaining_time": "20:28:35", "throughput": 2736.68, "total_tokens": 1447912704} {"current_steps": 8018, "total_steps": 9134, "loss": 1.1072, "learning_rate": 1.8191869712711807e-06, "epoch": 0.877747064780098, "percentage": 87.78, "elapsed_time": "6 days, 2:59:02", "remaining_time": "20:27:29", "throughput": 2736.71, "total_tokens": 1448108928} {"current_steps": 8019, "total_steps": 9134, "loss": 1.1257, "learning_rate": 1.81596827777179e-06, "epoch": 0.8778565368510359, "percentage": 87.79, "elapsed_time": "6 days, 3:00:06", "remaining_time": "20:26:23", "throughput": 2736.74, "total_tokens": 1448298880} {"current_steps": 8020, "total_steps": 9134, "loss": 1.0175, "learning_rate": 1.8127523268990282e-06, "epoch": 0.8779660089219737, "percentage": 87.8, "elapsed_time": "6 days, 3:01:10", "remaining_time": "20:25:17", "throughput": 2736.74, "total_tokens": 1448476064} {"current_steps": 8021, "total_steps": 9134, "loss": 1.049, "learning_rate": 1.8095391190333404e-06, "epoch": 0.8780754809929117, "percentage": 87.81, "elapsed_time": "6 days, 3:02:14", "remaining_time": "20:24:10", "throughput": 2736.74, "total_tokens": 1448653248} {"current_steps": 8022, "total_steps": 9134, "loss": 0.6419, "learning_rate": 1.8063286545548398e-06, "epoch": 0.8781849530638496, "percentage": 87.83, "elapsed_time": "6 days, 3:03:19", "remaining_time": "20:23:04", "throughput": 2736.75, "total_tokens": 1448834688} {"current_steps": 8023, "total_steps": 9134, "loss": 1.2523, "learning_rate": 1.8031209338433246e-06, "epoch": 0.8782944251347875, "percentage": 87.84, "elapsed_time": "6 days, 3:04:23", "remaining_time": "20:21:58", "throughput": 2736.8, "total_tokens": 1449035392} {"current_steps": 8024, "total_steps": 9134, "loss": 0.9236, "learning_rate": 1.799915957278256e-06, "epoch": 0.8784038972057254, "percentage": 87.85, "elapsed_time": "6 days, 3:05:30", "remaining_time": "20:20:52", "throughput": 2736.85, "total_tokens": 1449248640} {"current_steps": 8025, "total_steps": 9134, "loss": 1.3181, "learning_rate": 1.79671372523878e-06, "epoch": 0.8785133692766632, "percentage": 87.86, "elapsed_time": "6 days, 3:06:37", "remaining_time": "20:19:46", "throughput": 2736.88, "total_tokens": 1449445760} {"current_steps": 8026, "total_steps": 9134, "loss": 0.7695, "learning_rate": 1.7935142381037135e-06, "epoch": 0.8786228413476012, "percentage": 87.87, "elapsed_time": "6 days, 3:07:41", "remaining_time": "20:18:40", "throughput": 2736.84, "total_tokens": 1449598304} {"current_steps": 8027, "total_steps": 9134, "loss": 0.6428, "learning_rate": 1.7903174962515478e-06, "epoch": 0.8787323134185391, "percentage": 87.88, "elapsed_time": "6 days, 3:08:44", "remaining_time": "20:17:34", "throughput": 2736.85, "total_tokens": 1449779296} {"current_steps": 8028, "total_steps": 9134, "loss": 0.8285, "learning_rate": 1.7871235000604503e-06, "epoch": 0.878841785489477, "percentage": 87.89, "elapsed_time": "6 days, 3:09:48", "remaining_time": "20:16:27", "throughput": 2736.85, "total_tokens": 1449953344} {"current_steps": 8029, "total_steps": 9134, "loss": 0.8732, "learning_rate": 1.7839322499082738e-06, "epoch": 0.8789512575604149, "percentage": 87.9, "elapsed_time": "6 days, 3:10:52", "remaining_time": "20:15:21", "throughput": 2736.85, "total_tokens": 1450129184} {"current_steps": 8030, "total_steps": 9134, "loss": 0.9521, "learning_rate": 1.7807437461725252e-06, "epoch": 0.8790607296313528, "percentage": 87.91, "elapsed_time": "6 days, 3:12:00", "remaining_time": "20:14:15", "throughput": 2736.89, "total_tokens": 1450331008} {"current_steps": 8031, "total_steps": 9134, "loss": 1.0078, "learning_rate": 1.7775579892304051e-06, "epoch": 0.8791702017022907, "percentage": 87.92, "elapsed_time": "6 days, 3:13:01", "remaining_time": "20:13:09", "throughput": 2736.86, "total_tokens": 1450483776} {"current_steps": 8032, "total_steps": 9134, "loss": 0.8961, "learning_rate": 1.7743749794587817e-06, "epoch": 0.8792796737732286, "percentage": 87.94, "elapsed_time": "6 days, 3:14:04", "remaining_time": "20:12:02", "throughput": 2736.85, "total_tokens": 1450654688} {"current_steps": 8033, "total_steps": 9134, "loss": 0.7725, "learning_rate": 1.7711947172342009e-06, "epoch": 0.8793891458441665, "percentage": 87.95, "elapsed_time": "6 days, 3:15:09", "remaining_time": "20:10:56", "throughput": 2736.89, "total_tokens": 1450849568} {"current_steps": 8034, "total_steps": 9134, "loss": 0.7195, "learning_rate": 1.7680172029328757e-06, "epoch": 0.8794986179151044, "percentage": 87.96, "elapsed_time": "6 days, 3:16:14", "remaining_time": "20:09:50", "throughput": 2736.93, "total_tokens": 1451050720} {"current_steps": 8035, "total_steps": 9134, "loss": 1.1587, "learning_rate": 1.7648424369307e-06, "epoch": 0.8796080899860423, "percentage": 87.97, "elapsed_time": "6 days, 3:17:18", "remaining_time": "20:08:44", "throughput": 2736.94, "total_tokens": 1451231264} {"current_steps": 8036, "total_steps": 9134, "loss": 1.1482, "learning_rate": 1.7616704196032564e-06, "epoch": 0.8797175620569803, "percentage": 87.98, "elapsed_time": "6 days, 3:18:21", "remaining_time": "20:07:37", "throughput": 2736.93, "total_tokens": 1451401504} {"current_steps": 8037, "total_steps": 9134, "loss": 0.7707, "learning_rate": 1.758501151325767e-06, "epoch": 0.8798270341279181, "percentage": 87.99, "elapsed_time": "6 days, 3:19:26", "remaining_time": "20:06:31", "throughput": 2736.93, "total_tokens": 1451575104} {"current_steps": 8038, "total_steps": 9134, "loss": 0.6864, "learning_rate": 1.7553346324731712e-06, "epoch": 0.879936506198856, "percentage": 88.0, "elapsed_time": "6 days, 3:20:30", "remaining_time": "20:05:25", "throughput": 2736.94, "total_tokens": 1451754528} {"current_steps": 8039, "total_steps": 9134, "loss": 0.7789, "learning_rate": 1.7521708634200413e-06, "epoch": 0.8800459782697939, "percentage": 88.01, "elapsed_time": "6 days, 3:21:33", "remaining_time": "20:04:19", "throughput": 2736.96, "total_tokens": 1451941568} {"current_steps": 8040, "total_steps": 9134, "loss": 0.898, "learning_rate": 1.7490098445406667e-06, "epoch": 0.8801554503407318, "percentage": 88.02, "elapsed_time": "6 days, 3:22:40", "remaining_time": "20:03:13", "throughput": 2737.02, "total_tokens": 1452157504} {"current_steps": 8041, "total_steps": 9134, "loss": 0.7523, "learning_rate": 1.7458515762089706e-06, "epoch": 0.8802649224116698, "percentage": 88.03, "elapsed_time": "6 days, 3:23:46", "remaining_time": "20:02:07", "throughput": 2737.03, "total_tokens": 1452342528} {"current_steps": 8042, "total_steps": 9134, "loss": 0.9647, "learning_rate": 1.742696058798582e-06, "epoch": 0.8803743944826076, "percentage": 88.04, "elapsed_time": "6 days, 3:24:52", "remaining_time": "20:01:01", "throughput": 2737.02, "total_tokens": 1452514784} {"current_steps": 8043, "total_steps": 9134, "loss": 0.7674, "learning_rate": 1.7395432926827909e-06, "epoch": 0.8804838665535455, "percentage": 88.06, "elapsed_time": "6 days, 3:25:53", "remaining_time": "19:59:54", "throughput": 2737.04, "total_tokens": 1452692192} {"current_steps": 8044, "total_steps": 9134, "loss": 0.7177, "learning_rate": 1.7363932782345603e-06, "epoch": 0.8805933386244834, "percentage": 88.07, "elapsed_time": "6 days, 3:26:55", "remaining_time": "19:58:48", "throughput": 2737.08, "total_tokens": 1452884384} {"current_steps": 8045, "total_steps": 9134, "loss": 0.9239, "learning_rate": 1.7332460158265313e-06, "epoch": 0.8807028106954213, "percentage": 88.08, "elapsed_time": "6 days, 3:28:02", "remaining_time": "19:57:42", "throughput": 2737.11, "total_tokens": 1453081504} {"current_steps": 8046, "total_steps": 9134, "loss": 0.705, "learning_rate": 1.7301015058310194e-06, "epoch": 0.8808122827663593, "percentage": 88.09, "elapsed_time": "6 days, 3:29:05", "remaining_time": "19:56:35", "throughput": 2737.13, "total_tokens": 1453268320} {"current_steps": 8047, "total_steps": 9134, "loss": 0.6399, "learning_rate": 1.726959748620019e-06, "epoch": 0.8809217548372972, "percentage": 88.1, "elapsed_time": "6 days, 3:30:12", "remaining_time": "19:55:29", "throughput": 2737.14, "total_tokens": 1453453792} {"current_steps": 8048, "total_steps": 9134, "loss": 0.8233, "learning_rate": 1.7238207445651855e-06, "epoch": 0.881031226908235, "percentage": 88.11, "elapsed_time": "6 days, 3:31:16", "remaining_time": "19:54:23", "throughput": 2737.15, "total_tokens": 1453638144} {"current_steps": 8049, "total_steps": 9134, "loss": 0.7879, "learning_rate": 1.7206844940378636e-06, "epoch": 0.8811406989791729, "percentage": 88.12, "elapsed_time": "6 days, 3:32:18", "remaining_time": "19:53:17", "throughput": 2737.15, "total_tokens": 1453804800} {"current_steps": 8050, "total_steps": 9134, "loss": 0.9437, "learning_rate": 1.7175509974090647e-06, "epoch": 0.8812501710501108, "percentage": 88.13, "elapsed_time": "6 days, 3:33:24", "remaining_time": "19:52:11", "throughput": 2737.16, "total_tokens": 1453989600} {"current_steps": 8051, "total_steps": 9134, "loss": 0.866, "learning_rate": 1.714420255049473e-06, "epoch": 0.8813596431210488, "percentage": 88.14, "elapsed_time": "6 days, 3:34:29", "remaining_time": "19:51:04", "throughput": 2737.15, "total_tokens": 1454163872} {"current_steps": 8052, "total_steps": 9134, "loss": 0.9615, "learning_rate": 1.7112922673294507e-06, "epoch": 0.8814691151919867, "percentage": 88.15, "elapsed_time": "6 days, 3:35:32", "remaining_time": "19:49:58", "throughput": 2737.16, "total_tokens": 1454343296} {"current_steps": 8053, "total_steps": 9134, "loss": 0.7319, "learning_rate": 1.708167034619032e-06, "epoch": 0.8815785872629246, "percentage": 88.17, "elapsed_time": "6 days, 3:36:36", "remaining_time": "19:48:52", "throughput": 2737.13, "total_tokens": 1454501888} {"current_steps": 8054, "total_steps": 9134, "loss": 0.9225, "learning_rate": 1.705044557287927e-06, "epoch": 0.8816880593338624, "percentage": 88.18, "elapsed_time": "6 days, 3:37:40", "remaining_time": "19:47:46", "throughput": 2737.14, "total_tokens": 1454681536} {"current_steps": 8055, "total_steps": 9134, "loss": 0.8514, "learning_rate": 1.701924835705515e-06, "epoch": 0.8817975314048003, "percentage": 88.19, "elapsed_time": "6 days, 3:38:46", "remaining_time": "19:46:40", "throughput": 2737.16, "total_tokens": 1454873952} {"current_steps": 8056, "total_steps": 9134, "loss": 0.9843, "learning_rate": 1.6988078702408622e-06, "epoch": 0.8819070034757382, "percentage": 88.2, "elapsed_time": "6 days, 3:39:48", "remaining_time": "19:45:33", "throughput": 2737.13, "total_tokens": 1455029408} {"current_steps": 8057, "total_steps": 9134, "loss": 0.6851, "learning_rate": 1.6956936612626928e-06, "epoch": 0.8820164755466762, "percentage": 88.21, "elapsed_time": "6 days, 3:40:53", "remaining_time": "19:44:27", "throughput": 2737.16, "total_tokens": 1455220704} {"current_steps": 8058, "total_steps": 9134, "loss": 0.8278, "learning_rate": 1.6925822091394121e-06, "epoch": 0.8821259476176141, "percentage": 88.22, "elapsed_time": "6 days, 3:41:59", "remaining_time": "19:43:21", "throughput": 2737.22, "total_tokens": 1455431936} {"current_steps": 8059, "total_steps": 9134, "loss": 0.8114, "learning_rate": 1.689473514239101e-06, "epoch": 0.8822354196885519, "percentage": 88.23, "elapsed_time": "6 days, 3:43:07", "remaining_time": "19:42:15", "throughput": 2737.28, "total_tokens": 1455650784} {"current_steps": 8060, "total_steps": 9134, "loss": 1.0355, "learning_rate": 1.6863675769295096e-06, "epoch": 0.8823448917594898, "percentage": 88.24, "elapsed_time": "6 days, 3:44:09", "remaining_time": "19:41:09", "throughput": 2737.27, "total_tokens": 1455812288} {"current_steps": 8061, "total_steps": 9134, "loss": 0.6941, "learning_rate": 1.683264397578066e-06, "epoch": 0.8824543638304277, "percentage": 88.25, "elapsed_time": "6 days, 3:45:13", "remaining_time": "19:40:02", "throughput": 2737.25, "total_tokens": 1455980512} {"current_steps": 8062, "total_steps": 9134, "loss": 0.7013, "learning_rate": 1.6801639765518712e-06, "epoch": 0.8825638359013657, "percentage": 88.26, "elapsed_time": "6 days, 3:46:17", "remaining_time": "19:38:56", "throughput": 2737.25, "total_tokens": 1456156800} {"current_steps": 8063, "total_steps": 9134, "loss": 0.9795, "learning_rate": 1.6770663142176957e-06, "epoch": 0.8826733079723036, "percentage": 88.27, "elapsed_time": "6 days, 3:47:20", "remaining_time": "19:37:50", "throughput": 2737.25, "total_tokens": 1456328608} {"current_steps": 8064, "total_steps": 9134, "loss": 0.8617, "learning_rate": 1.6739714109419907e-06, "epoch": 0.8827827800432415, "percentage": 88.29, "elapsed_time": "6 days, 3:48:24", "remaining_time": "19:36:44", "throughput": 2737.27, "total_tokens": 1456512736} {"current_steps": 8065, "total_steps": 9134, "loss": 0.8722, "learning_rate": 1.6708792670908746e-06, "epoch": 0.8828922521141793, "percentage": 88.3, "elapsed_time": "6 days, 3:49:28", "remaining_time": "19:35:37", "throughput": 2737.31, "total_tokens": 1456709408} {"current_steps": 8066, "total_steps": 9134, "loss": 0.8306, "learning_rate": 1.6677898830301463e-06, "epoch": 0.8830017241851172, "percentage": 88.31, "elapsed_time": "6 days, 3:50:35", "remaining_time": "19:34:31", "throughput": 2737.32, "total_tokens": 1456896672} {"current_steps": 8067, "total_steps": 9134, "loss": 0.7984, "learning_rate": 1.664703259125272e-06, "epoch": 0.8831111962560552, "percentage": 88.32, "elapsed_time": "6 days, 3:51:34", "remaining_time": "19:33:25", "throughput": 2737.27, "total_tokens": 1457034208} {"current_steps": 8068, "total_steps": 9134, "loss": 0.7835, "learning_rate": 1.66161939574139e-06, "epoch": 0.8832206683269931, "percentage": 88.33, "elapsed_time": "6 days, 3:52:37", "remaining_time": "19:32:18", "throughput": 2737.24, "total_tokens": 1457187648} {"current_steps": 8069, "total_steps": 9134, "loss": 1.1522, "learning_rate": 1.6585382932433197e-06, "epoch": 0.883330140397931, "percentage": 88.34, "elapsed_time": "6 days, 3:53:41", "remaining_time": "19:31:12", "throughput": 2737.21, "total_tokens": 1457349376} {"current_steps": 8070, "total_steps": 9134, "loss": 1.0939, "learning_rate": 1.6554599519955417e-06, "epoch": 0.8834396124688689, "percentage": 88.35, "elapsed_time": "6 days, 3:54:48", "remaining_time": "19:30:06", "throughput": 2737.29, "total_tokens": 1457573376} {"current_steps": 8071, "total_steps": 9134, "loss": 1.0179, "learning_rate": 1.652384372362234e-06, "epoch": 0.8835490845398067, "percentage": 88.36, "elapsed_time": "6 days, 3:55:54", "remaining_time": "19:29:00", "throughput": 2737.31, "total_tokens": 1457766240} {"current_steps": 8072, "total_steps": 9134, "loss": 0.7176, "learning_rate": 1.649311554707214e-06, "epoch": 0.8836585566107447, "percentage": 88.37, "elapsed_time": "6 days, 3:56:56", "remaining_time": "19:27:54", "throughput": 2737.33, "total_tokens": 1457947232} {"current_steps": 8073, "total_steps": 9134, "loss": 0.8226, "learning_rate": 1.6462414993940023e-06, "epoch": 0.8837680286816826, "percentage": 88.38, "elapsed_time": "6 days, 3:58:03", "remaining_time": "19:26:48", "throughput": 2737.39, "total_tokens": 1458161600} {"current_steps": 8074, "total_steps": 9134, "loss": 0.8731, "learning_rate": 1.6431742067857775e-06, "epoch": 0.8838775007526205, "percentage": 88.4, "elapsed_time": "6 days, 3:59:06", "remaining_time": "19:25:41", "throughput": 2737.4, "total_tokens": 1458339232} {"current_steps": 8075, "total_steps": 9134, "loss": 0.6466, "learning_rate": 1.6401096772453912e-06, "epoch": 0.8839869728235584, "percentage": 88.41, "elapsed_time": "6 days, 4:00:07", "remaining_time": "19:24:35", "throughput": 2737.37, "total_tokens": 1458492224} {"current_steps": 8076, "total_steps": 9134, "loss": 0.8376, "learning_rate": 1.6370479111353754e-06, "epoch": 0.8840964448944962, "percentage": 88.42, "elapsed_time": "6 days, 4:01:14", "remaining_time": "19:23:29", "throughput": 2737.38, "total_tokens": 1458677472} {"current_steps": 8077, "total_steps": 9134, "loss": 1.002, "learning_rate": 1.633988908817924e-06, "epoch": 0.8842059169654342, "percentage": 88.43, "elapsed_time": "6 days, 4:02:21", "remaining_time": "19:22:23", "throughput": 2737.35, "total_tokens": 1458847264} {"current_steps": 8078, "total_steps": 9134, "loss": 0.8866, "learning_rate": 1.6309326706549221e-06, "epoch": 0.8843153890363721, "percentage": 88.44, "elapsed_time": "6 days, 4:03:22", "remaining_time": "19:21:16", "throughput": 2737.34, "total_tokens": 1459009664} {"current_steps": 8079, "total_steps": 9134, "loss": 0.8243, "learning_rate": 1.627879197007906e-06, "epoch": 0.88442486110731, "percentage": 88.45, "elapsed_time": "6 days, 4:04:25", "remaining_time": "19:20:10", "throughput": 2737.37, "total_tokens": 1459196928} {"current_steps": 8080, "total_steps": 9134, "loss": 0.7807, "learning_rate": 1.6248284882381087e-06, "epoch": 0.8845343331782479, "percentage": 88.46, "elapsed_time": "6 days, 4:05:29", "remaining_time": "19:19:04", "throughput": 2737.37, "total_tokens": 1459371648} {"current_steps": 8081, "total_steps": 9134, "loss": 0.9257, "learning_rate": 1.6217805447064083e-06, "epoch": 0.8846438052491858, "percentage": 88.47, "elapsed_time": "6 days, 4:06:36", "remaining_time": "19:17:58", "throughput": 2737.4, "total_tokens": 1459573248} {"current_steps": 8082, "total_steps": 9134, "loss": 0.8314, "learning_rate": 1.6187353667733856e-06, "epoch": 0.8847532773201237, "percentage": 88.48, "elapsed_time": "6 days, 4:07:42", "remaining_time": "19:16:52", "throughput": 2737.42, "total_tokens": 1459762080} {"current_steps": 8083, "total_steps": 9134, "loss": 1.12, "learning_rate": 1.6156929547992638e-06, "epoch": 0.8848627493910616, "percentage": 88.49, "elapsed_time": "6 days, 4:08:46", "remaining_time": "19:15:46", "throughput": 2737.4, "total_tokens": 1459927840} {"current_steps": 8084, "total_steps": 9134, "loss": 0.672, "learning_rate": 1.6126533091439661e-06, "epoch": 0.8849722214619995, "percentage": 88.5, "elapsed_time": "6 days, 4:09:50", "remaining_time": "19:14:40", "throughput": 2737.43, "total_tokens": 1460118912} {"current_steps": 8085, "total_steps": 9134, "loss": 0.7913, "learning_rate": 1.6096164301670712e-06, "epoch": 0.8850816935329374, "percentage": 88.52, "elapsed_time": "6 days, 4:10:55", "remaining_time": "19:13:33", "throughput": 2737.45, "total_tokens": 1460306400} {"current_steps": 8086, "total_steps": 9134, "loss": 0.722, "learning_rate": 1.6065823182278366e-06, "epoch": 0.8851911656038753, "percentage": 88.53, "elapsed_time": "6 days, 4:12:01", "remaining_time": "19:12:27", "throughput": 2737.47, "total_tokens": 1460497248} {"current_steps": 8087, "total_steps": 9134, "loss": 0.9942, "learning_rate": 1.6035509736851973e-06, "epoch": 0.8853006376748133, "percentage": 88.54, "elapsed_time": "6 days, 4:13:01", "remaining_time": "19:11:21", "throughput": 2737.45, "total_tokens": 1460651808} {"current_steps": 8088, "total_steps": 9134, "loss": 0.9091, "learning_rate": 1.6005223968977468e-06, "epoch": 0.8854101097457511, "percentage": 88.55, "elapsed_time": "6 days, 4:14:02", "remaining_time": "19:10:14", "throughput": 2737.43, "total_tokens": 1460810400} {"current_steps": 8089, "total_steps": 9134, "loss": 0.9068, "learning_rate": 1.597496588223768e-06, "epoch": 0.885519581816689, "percentage": 88.56, "elapsed_time": "6 days, 4:15:06", "remaining_time": "19:09:08", "throughput": 2737.44, "total_tokens": 1460989152} {"current_steps": 8090, "total_steps": 9134, "loss": 0.8857, "learning_rate": 1.5944735480212026e-06, "epoch": 0.8856290538876269, "percentage": 88.57, "elapsed_time": "6 days, 4:16:09", "remaining_time": "19:08:02", "throughput": 2737.46, "total_tokens": 1461173056} {"current_steps": 8091, "total_steps": 9134, "loss": 0.818, "learning_rate": 1.5914532766476753e-06, "epoch": 0.8857385259585648, "percentage": 88.58, "elapsed_time": "6 days, 4:17:10", "remaining_time": "19:06:55", "throughput": 2737.45, "total_tokens": 1461334112} {"current_steps": 8092, "total_steps": 9134, "loss": 1.0169, "learning_rate": 1.5884357744604756e-06, "epoch": 0.8858479980295028, "percentage": 88.59, "elapsed_time": "6 days, 4:18:08", "remaining_time": "19:05:48", "throughput": 2737.4, "total_tokens": 1461464928} {"current_steps": 8093, "total_steps": 9134, "loss": 1.1004, "learning_rate": 1.5854210418165678e-06, "epoch": 0.8859574701004407, "percentage": 88.6, "elapsed_time": "6 days, 4:19:15", "remaining_time": "19:04:42", "throughput": 2737.46, "total_tokens": 1461685120} {"current_steps": 8094, "total_steps": 9134, "loss": 0.6956, "learning_rate": 1.5824090790725887e-06, "epoch": 0.8860669421713785, "percentage": 88.61, "elapsed_time": "6 days, 4:20:19", "remaining_time": "19:03:36", "throughput": 2737.47, "total_tokens": 1461862976} {"current_steps": 8095, "total_steps": 9134, "loss": 0.8613, "learning_rate": 1.579399886584848e-06, "epoch": 0.8861764142423164, "percentage": 88.62, "elapsed_time": "6 days, 4:21:21", "remaining_time": "19:02:29", "throughput": 2737.47, "total_tokens": 1462030752} {"current_steps": 8096, "total_steps": 9134, "loss": 0.8494, "learning_rate": 1.5763934647093275e-06, "epoch": 0.8862858863132543, "percentage": 88.64, "elapsed_time": "6 days, 4:22:25", "remaining_time": "19:01:23", "throughput": 2737.44, "total_tokens": 1462192256} {"current_steps": 8097, "total_steps": 9134, "loss": 1.0877, "learning_rate": 1.5733898138016845e-06, "epoch": 0.8863953583841923, "percentage": 88.65, "elapsed_time": "6 days, 4:23:27", "remaining_time": "19:00:17", "throughput": 2737.42, "total_tokens": 1462351744} {"current_steps": 8098, "total_steps": 9134, "loss": 0.8029, "learning_rate": 1.5703889342172401e-06, "epoch": 0.8865048304551302, "percentage": 88.66, "elapsed_time": "6 days, 4:24:34", "remaining_time": "18:59:11", "throughput": 2737.45, "total_tokens": 1462551776} {"current_steps": 8099, "total_steps": 9134, "loss": 0.859, "learning_rate": 1.5673908263109966e-06, "epoch": 0.886614302526068, "percentage": 88.67, "elapsed_time": "6 days, 4:25:35", "remaining_time": "18:58:04", "throughput": 2737.42, "total_tokens": 1462700288} {"current_steps": 8100, "total_steps": 9134, "loss": 0.963, "learning_rate": 1.564395490437623e-06, "epoch": 0.8867237745970059, "percentage": 88.68, "elapsed_time": "6 days, 4:26:42", "remaining_time": "18:56:58", "throughput": 2737.45, "total_tokens": 1462899872} {"current_steps": 8101, "total_steps": 9134, "loss": 0.9545, "learning_rate": 1.5614029269514634e-06, "epoch": 0.8868332466679438, "percentage": 88.69, "elapsed_time": "6 days, 4:27:46", "remaining_time": "18:55:52", "throughput": 2737.48, "total_tokens": 1463092736} {"current_steps": 8102, "total_steps": 9134, "loss": 0.9477, "learning_rate": 1.558413136206527e-06, "epoch": 0.8869427187388818, "percentage": 88.7, "elapsed_time": "6 days, 4:28:52", "remaining_time": "18:54:46", "throughput": 2737.53, "total_tokens": 1463301728} {"current_steps": 8103, "total_steps": 9134, "loss": 0.6839, "learning_rate": 1.5554261185565022e-06, "epoch": 0.8870521908098197, "percentage": 88.71, "elapsed_time": "6 days, 4:29:53", "remaining_time": "18:53:39", "throughput": 2737.51, "total_tokens": 1463452928} {"current_steps": 8104, "total_steps": 9134, "loss": 0.8789, "learning_rate": 1.552441874354757e-06, "epoch": 0.8871616628807576, "percentage": 88.72, "elapsed_time": "6 days, 4:30:56", "remaining_time": "18:52:33", "throughput": 2737.48, "total_tokens": 1463607488} {"current_steps": 8105, "total_steps": 9134, "loss": 0.6964, "learning_rate": 1.5494604039543058e-06, "epoch": 0.8872711349516954, "percentage": 88.73, "elapsed_time": "6 days, 4:32:01", "remaining_time": "18:51:27", "throughput": 2737.5, "total_tokens": 1463797888} {"current_steps": 8106, "total_steps": 9134, "loss": 0.8435, "learning_rate": 1.5464817077078614e-06, "epoch": 0.8873806070226333, "percentage": 88.75, "elapsed_time": "6 days, 4:33:01", "remaining_time": "18:50:20", "throughput": 2737.47, "total_tokens": 1463946624} {"current_steps": 8107, "total_steps": 9134, "loss": 0.9518, "learning_rate": 1.543505785967797e-06, "epoch": 0.8874900790935712, "percentage": 88.76, "elapsed_time": "6 days, 4:34:05", "remaining_time": "18:49:14", "throughput": 2737.48, "total_tokens": 1464126720} {"current_steps": 8108, "total_steps": 9134, "loss": 0.6915, "learning_rate": 1.5405326390861562e-06, "epoch": 0.8875995511645092, "percentage": 88.77, "elapsed_time": "6 days, 4:35:08", "remaining_time": "18:48:08", "throughput": 2737.5, "total_tokens": 1464311968} {"current_steps": 8109, "total_steps": 9134, "loss": 0.9181, "learning_rate": 1.5375622674146577e-06, "epoch": 0.8877090232354471, "percentage": 88.78, "elapsed_time": "6 days, 4:36:14", "remaining_time": "18:47:02", "throughput": 2737.51, "total_tokens": 1464499680} {"current_steps": 8110, "total_steps": 9134, "loss": 0.9051, "learning_rate": 1.5345946713046872e-06, "epoch": 0.887818495306385, "percentage": 88.79, "elapsed_time": "6 days, 4:37:18", "remaining_time": "18:45:55", "throughput": 2737.55, "total_tokens": 1464691424} {"current_steps": 8111, "total_steps": 9134, "loss": 0.7612, "learning_rate": 1.5316298511073164e-06, "epoch": 0.8879279673773228, "percentage": 88.8, "elapsed_time": "6 days, 4:38:20", "remaining_time": "18:44:49", "throughput": 2737.54, "total_tokens": 1464858304} {"current_steps": 8112, "total_steps": 9134, "loss": 1.09, "learning_rate": 1.528667807173262e-06, "epoch": 0.8880374394482607, "percentage": 88.81, "elapsed_time": "6 days, 4:39:27", "remaining_time": "18:43:43", "throughput": 2737.57, "total_tokens": 1465057888} {"current_steps": 8113, "total_steps": 9134, "loss": 0.6979, "learning_rate": 1.5257085398529436e-06, "epoch": 0.8881469115191987, "percentage": 88.82, "elapsed_time": "6 days, 4:40:28", "remaining_time": "18:42:37", "throughput": 2737.59, "total_tokens": 1465237536} {"current_steps": 8114, "total_steps": 9134, "loss": 0.8239, "learning_rate": 1.5227520494964232e-06, "epoch": 0.8882563835901366, "percentage": 88.83, "elapsed_time": "6 days, 4:41:35", "remaining_time": "18:41:31", "throughput": 2737.63, "total_tokens": 1465443392} {"current_steps": 8115, "total_steps": 9134, "loss": 0.7103, "learning_rate": 1.5197983364534597e-06, "epoch": 0.8883658556610745, "percentage": 88.84, "elapsed_time": "6 days, 4:42:40", "remaining_time": "18:40:25", "throughput": 2737.66, "total_tokens": 1465636704} {"current_steps": 8116, "total_steps": 9134, "loss": 0.6803, "learning_rate": 1.5168474010734622e-06, "epoch": 0.8884753277320123, "percentage": 88.85, "elapsed_time": "6 days, 4:43:44", "remaining_time": "18:39:18", "throughput": 2737.68, "total_tokens": 1465819488} {"current_steps": 8117, "total_steps": 9134, "loss": 0.8589, "learning_rate": 1.5138992437055299e-06, "epoch": 0.8885847998029502, "percentage": 88.87, "elapsed_time": "6 days, 4:44:48", "remaining_time": "18:38:12", "throughput": 2737.71, "total_tokens": 1466013472} {"current_steps": 8118, "total_steps": 9134, "loss": 0.8557, "learning_rate": 1.5109538646984167e-06, "epoch": 0.8886942718738882, "percentage": 88.88, "elapsed_time": "6 days, 4:45:51", "remaining_time": "18:37:06", "throughput": 2737.72, "total_tokens": 1466190656} {"current_steps": 8119, "total_steps": 9134, "loss": 1.0078, "learning_rate": 1.5080112644005523e-06, "epoch": 0.8888037439448261, "percentage": 88.89, "elapsed_time": "6 days, 4:46:55", "remaining_time": "18:36:00", "throughput": 2737.72, "total_tokens": 1466368736} {"current_steps": 8120, "total_steps": 9134, "loss": 0.888, "learning_rate": 1.5050714431600554e-06, "epoch": 0.888913216015764, "percentage": 88.9, "elapsed_time": "6 days, 4:48:02", "remaining_time": "18:34:54", "throughput": 2737.76, "total_tokens": 1466570336} {"current_steps": 8121, "total_steps": 9134, "loss": 0.85, "learning_rate": 1.502134401324687e-06, "epoch": 0.8890226880867019, "percentage": 88.91, "elapsed_time": "6 days, 4:49:02", "remaining_time": "18:33:47", "throughput": 2737.72, "total_tokens": 1466713696} {"current_steps": 8122, "total_steps": 9134, "loss": 0.9244, "learning_rate": 1.499200139241902e-06, "epoch": 0.8891321601576397, "percentage": 88.92, "elapsed_time": "6 days, 4:50:08", "remaining_time": "18:32:41", "throughput": 2737.72, "total_tokens": 1466895360} {"current_steps": 8123, "total_steps": 9134, "loss": 0.9121, "learning_rate": 1.4962686572588091e-06, "epoch": 0.8892416322285777, "percentage": 88.93, "elapsed_time": "6 days, 4:51:10", "remaining_time": "18:31:35", "throughput": 2737.74, "total_tokens": 1467075008} {"current_steps": 8124, "total_steps": 9134, "loss": 0.8043, "learning_rate": 1.493339955722206e-06, "epoch": 0.8893511042995156, "percentage": 88.94, "elapsed_time": "6 days, 4:52:14", "remaining_time": "18:30:28", "throughput": 2737.74, "total_tokens": 1467251744} {"current_steps": 8125, "total_steps": 9134, "loss": 1.006, "learning_rate": 1.4904140349785488e-06, "epoch": 0.8894605763704535, "percentage": 88.95, "elapsed_time": "6 days, 4:53:20", "remaining_time": "18:29:23", "throughput": 2737.77, "total_tokens": 1467444608} {"current_steps": 8126, "total_steps": 9134, "loss": 0.882, "learning_rate": 1.4874908953739691e-06, "epoch": 0.8895700484413914, "percentage": 88.96, "elapsed_time": "6 days, 4:54:24", "remaining_time": "18:28:16", "throughput": 2737.77, "total_tokens": 1467621344} {"current_steps": 8127, "total_steps": 9134, "loss": 0.6848, "learning_rate": 1.4845705372542707e-06, "epoch": 0.8896795205123293, "percentage": 88.98, "elapsed_time": "6 days, 4:55:27", "remaining_time": "18:27:10", "throughput": 2737.76, "total_tokens": 1467790240} {"current_steps": 8128, "total_steps": 9134, "loss": 0.7481, "learning_rate": 1.481652960964916e-06, "epoch": 0.8897889925832672, "percentage": 88.99, "elapsed_time": "6 days, 4:56:30", "remaining_time": "18:26:04", "throughput": 2737.74, "total_tokens": 1467948384} {"current_steps": 8129, "total_steps": 9134, "loss": 0.7216, "learning_rate": 1.4787381668510653e-06, "epoch": 0.8898984646542051, "percentage": 89.0, "elapsed_time": "6 days, 4:57:37", "remaining_time": "18:24:58", "throughput": 2737.71, "total_tokens": 1468117056} {"current_steps": 8130, "total_steps": 9134, "loss": 0.7021, "learning_rate": 1.4758261552575175e-06, "epoch": 0.890007936725143, "percentage": 89.01, "elapsed_time": "6 days, 4:58:41", "remaining_time": "18:23:52", "throughput": 2737.73, "total_tokens": 1468303424} {"current_steps": 8131, "total_steps": 9134, "loss": 0.712, "learning_rate": 1.4729169265287695e-06, "epoch": 0.8901174087960809, "percentage": 89.02, "elapsed_time": "6 days, 4:59:46", "remaining_time": "18:22:45", "throughput": 2737.76, "total_tokens": 1468495392} {"current_steps": 8132, "total_steps": 9134, "loss": 0.8649, "learning_rate": 1.470010481008971e-06, "epoch": 0.8902268808670188, "percentage": 89.03, "elapsed_time": "6 days, 5:00:50", "remaining_time": "18:21:39", "throughput": 2737.74, "total_tokens": 1468663392} {"current_steps": 8133, "total_steps": 9134, "loss": 0.7878, "learning_rate": 1.4671068190419524e-06, "epoch": 0.8903363529379567, "percentage": 89.04, "elapsed_time": "6 days, 5:01:57", "remaining_time": "18:20:33", "throughput": 2737.77, "total_tokens": 1468858720} {"current_steps": 8134, "total_steps": 9134, "loss": 0.8735, "learning_rate": 1.4642059409712082e-06, "epoch": 0.8904458250088946, "percentage": 89.05, "elapsed_time": "6 days, 5:03:02", "remaining_time": "18:19:27", "throughput": 2737.76, "total_tokens": 1469031424} {"current_steps": 8135, "total_steps": 9134, "loss": 0.7509, "learning_rate": 1.461307847139909e-06, "epoch": 0.8905552970798325, "percentage": 89.06, "elapsed_time": "6 days, 5:04:05", "remaining_time": "18:18:21", "throughput": 2737.77, "total_tokens": 1469213312} {"current_steps": 8136, "total_steps": 9134, "loss": 1.0316, "learning_rate": 1.4584125378908935e-06, "epoch": 0.8906647691507704, "percentage": 89.07, "elapsed_time": "6 days, 5:05:12", "remaining_time": "18:17:15", "throughput": 2737.81, "total_tokens": 1469415808} {"current_steps": 8137, "total_steps": 9134, "loss": 0.8483, "learning_rate": 1.455520013566672e-06, "epoch": 0.8907742412217083, "percentage": 89.08, "elapsed_time": "6 days, 5:06:14", "remaining_time": "18:16:09", "throughput": 2737.79, "total_tokens": 1469572832} {"current_steps": 8138, "total_steps": 9134, "loss": 1.114, "learning_rate": 1.45263027450942e-06, "epoch": 0.8908837132926463, "percentage": 89.1, "elapsed_time": "6 days, 5:07:18", "remaining_time": "18:15:03", "throughput": 2737.81, "total_tokens": 1469761216} {"current_steps": 8139, "total_steps": 9134, "loss": 0.8024, "learning_rate": 1.4497433210609923e-06, "epoch": 0.8909931853635841, "percentage": 89.11, "elapsed_time": "6 days, 5:08:19", "remaining_time": "18:13:56", "throughput": 2737.77, "total_tokens": 1469909056} {"current_steps": 8140, "total_steps": 9134, "loss": 0.8456, "learning_rate": 1.4468591535629127e-06, "epoch": 0.891102657434522, "percentage": 89.12, "elapsed_time": "6 days, 5:09:25", "remaining_time": "18:12:50", "throughput": 2737.8, "total_tokens": 1470105280} {"current_steps": 8141, "total_steps": 9134, "loss": 1.0542, "learning_rate": 1.443977772356367e-06, "epoch": 0.8912121295054599, "percentage": 89.13, "elapsed_time": "6 days, 5:10:28", "remaining_time": "18:11:44", "throughput": 2737.79, "total_tokens": 1470271488} {"current_steps": 8142, "total_steps": 9134, "loss": 0.7493, "learning_rate": 1.4410991777822209e-06, "epoch": 0.8913216015763978, "percentage": 89.14, "elapsed_time": "6 days, 5:11:30", "remaining_time": "18:10:37", "throughput": 2737.78, "total_tokens": 1470434784} {"current_steps": 8143, "total_steps": 9134, "loss": 0.8244, "learning_rate": 1.4382233701810022e-06, "epoch": 0.8914310736473358, "percentage": 89.15, "elapsed_time": "6 days, 5:12:35", "remaining_time": "18:09:31", "throughput": 2737.78, "total_tokens": 1470615776} {"current_steps": 8144, "total_steps": 9134, "loss": 1.0386, "learning_rate": 1.4353503498929193e-06, "epoch": 0.8915405457182737, "percentage": 89.16, "elapsed_time": "6 days, 5:13:41", "remaining_time": "18:08:25", "throughput": 2737.82, "total_tokens": 1470816928} {"current_steps": 8145, "total_steps": 9134, "loss": 0.878, "learning_rate": 1.4324801172578366e-06, "epoch": 0.8916500177892115, "percentage": 89.17, "elapsed_time": "6 days, 5:14:47", "remaining_time": "18:07:19", "throughput": 2737.84, "total_tokens": 1471008896} {"current_steps": 8146, "total_steps": 9134, "loss": 0.9795, "learning_rate": 1.4296126726153102e-06, "epoch": 0.8917594898601494, "percentage": 89.18, "elapsed_time": "6 days, 5:15:52", "remaining_time": "18:06:13", "throughput": 2737.87, "total_tokens": 1471199072} {"current_steps": 8147, "total_steps": 9134, "loss": 0.7253, "learning_rate": 1.4267480163045384e-06, "epoch": 0.8918689619310873, "percentage": 89.19, "elapsed_time": "6 days, 5:16:55", "remaining_time": "18:05:07", "throughput": 2737.87, "total_tokens": 1471373120} {"current_steps": 8148, "total_steps": 9134, "loss": 1.068, "learning_rate": 1.4238861486644162e-06, "epoch": 0.8919784340020253, "percentage": 89.21, "elapsed_time": "6 days, 5:18:00", "remaining_time": "18:04:01", "throughput": 2737.91, "total_tokens": 1471572256} {"current_steps": 8149, "total_steps": 9134, "loss": 0.6819, "learning_rate": 1.4210270700334927e-06, "epoch": 0.8920879060729632, "percentage": 89.22, "elapsed_time": "6 days, 5:19:00", "remaining_time": "18:02:54", "throughput": 2737.88, "total_tokens": 1471724128} {"current_steps": 8150, "total_steps": 9134, "loss": 0.907, "learning_rate": 1.4181707807499917e-06, "epoch": 0.892197378143901, "percentage": 89.23, "elapsed_time": "6 days, 5:20:05", "remaining_time": "18:01:48", "throughput": 2737.9, "total_tokens": 1471910496} {"current_steps": 8151, "total_steps": 9134, "loss": 1.1784, "learning_rate": 1.4153172811518067e-06, "epoch": 0.8923068502148389, "percentage": 89.24, "elapsed_time": "6 days, 5:21:08", "remaining_time": "18:00:42", "throughput": 2737.9, "total_tokens": 1472081632} {"current_steps": 8152, "total_steps": 9134, "loss": 0.9356, "learning_rate": 1.4124665715764957e-06, "epoch": 0.8924163222857768, "percentage": 89.25, "elapsed_time": "6 days, 5:22:07", "remaining_time": "17:59:35", "throughput": 2737.9, "total_tokens": 1472245376} {"current_steps": 8153, "total_steps": 9134, "loss": 0.8015, "learning_rate": 1.4096186523613052e-06, "epoch": 0.8925257943567148, "percentage": 89.26, "elapsed_time": "6 days, 5:23:12", "remaining_time": "17:58:29", "throughput": 2737.94, "total_tokens": 1472442496} {"current_steps": 8154, "total_steps": 9134, "loss": 0.7774, "learning_rate": 1.4067735238431245e-06, "epoch": 0.8926352664276527, "percentage": 89.27, "elapsed_time": "6 days, 5:24:16", "remaining_time": "17:57:23", "throughput": 2737.96, "total_tokens": 1472630432} {"current_steps": 8155, "total_steps": 9134, "loss": 0.9688, "learning_rate": 1.4039311863585425e-06, "epoch": 0.8927447384985906, "percentage": 89.28, "elapsed_time": "6 days, 5:25:16", "remaining_time": "17:56:16", "throughput": 2737.94, "total_tokens": 1472784544} {"current_steps": 8156, "total_steps": 9134, "loss": 0.7513, "learning_rate": 1.4010916402437845e-06, "epoch": 0.8928542105695284, "percentage": 89.29, "elapsed_time": "6 days, 5:26:23", "remaining_time": "17:55:10", "throughput": 2737.99, "total_tokens": 1472992640} {"current_steps": 8157, "total_steps": 9134, "loss": 0.933, "learning_rate": 1.3982548858347738e-06, "epoch": 0.8929636826404663, "percentage": 89.3, "elapsed_time": "6 days, 5:27:27", "remaining_time": "17:54:04", "throughput": 2738.04, "total_tokens": 1473193568} {"current_steps": 8158, "total_steps": 9134, "loss": 0.9874, "learning_rate": 1.3954209234670917e-06, "epoch": 0.8930731547114042, "percentage": 89.31, "elapsed_time": "6 days, 5:28:33", "remaining_time": "17:52:58", "throughput": 2738.1, "total_tokens": 1473410624} {"current_steps": 8159, "total_steps": 9134, "loss": 0.5702, "learning_rate": 1.3925897534759925e-06, "epoch": 0.8931826267823422, "percentage": 89.33, "elapsed_time": "6 days, 5:29:41", "remaining_time": "17:51:52", "throughput": 2738.13, "total_tokens": 1473609760} {"current_steps": 8160, "total_steps": 9134, "loss": 0.7562, "learning_rate": 1.389761376196394e-06, "epoch": 0.8932920988532801, "percentage": 89.34, "elapsed_time": "6 days, 5:30:46", "remaining_time": "17:50:46", "throughput": 2738.14, "total_tokens": 1473795680} {"current_steps": 8161, "total_steps": 9134, "loss": 0.7635, "learning_rate": 1.3869357919628845e-06, "epoch": 0.893401570924218, "percentage": 89.35, "elapsed_time": "6 days, 5:31:51", "remaining_time": "17:49:40", "throughput": 2738.14, "total_tokens": 1473973536} {"current_steps": 8162, "total_steps": 9134, "loss": 1.0854, "learning_rate": 1.3841130011097408e-06, "epoch": 0.8935110429951558, "percentage": 89.36, "elapsed_time": "6 days, 5:32:58", "remaining_time": "17:48:34", "throughput": 2738.16, "total_tokens": 1474168640} {"current_steps": 8163, "total_steps": 9134, "loss": 0.8992, "learning_rate": 1.3812930039708738e-06, "epoch": 0.8936205150660937, "percentage": 89.37, "elapsed_time": "6 days, 5:34:02", "remaining_time": "17:47:28", "throughput": 2738.17, "total_tokens": 1474343808} {"current_steps": 8164, "total_steps": 9134, "loss": 0.8204, "learning_rate": 1.378475800879897e-06, "epoch": 0.8937299871370317, "percentage": 89.38, "elapsed_time": "6 days, 5:35:08", "remaining_time": "17:46:22", "throughput": 2738.18, "total_tokens": 1474531296} {"current_steps": 8165, "total_steps": 9134, "loss": 0.7473, "learning_rate": 1.3756613921700774e-06, "epoch": 0.8938394592079696, "percentage": 89.39, "elapsed_time": "6 days, 5:36:15", "remaining_time": "17:45:16", "throughput": 2738.19, "total_tokens": 1474721472} {"current_steps": 8166, "total_steps": 9134, "loss": 0.7822, "learning_rate": 1.372849778174351e-06, "epoch": 0.8939489312789075, "percentage": 89.4, "elapsed_time": "6 days, 5:37:20", "remaining_time": "17:44:10", "throughput": 2738.2, "total_tokens": 1474903360} {"current_steps": 8167, "total_steps": 9134, "loss": 0.844, "learning_rate": 1.3700409592253299e-06, "epoch": 0.8940584033498453, "percentage": 89.41, "elapsed_time": "6 days, 5:38:22", "remaining_time": "17:43:04", "throughput": 2738.18, "total_tokens": 1475066656} {"current_steps": 8168, "total_steps": 9134, "loss": 0.7506, "learning_rate": 1.3672349356552899e-06, "epoch": 0.8941678754207832, "percentage": 89.42, "elapsed_time": "6 days, 5:39:25", "remaining_time": "17:41:57", "throughput": 2738.17, "total_tokens": 1475230848} {"current_steps": 8169, "total_steps": 9134, "loss": 0.6415, "learning_rate": 1.3644317077961794e-06, "epoch": 0.8942773474917212, "percentage": 89.44, "elapsed_time": "6 days, 5:40:30", "remaining_time": "17:40:51", "throughput": 2738.16, "total_tokens": 1475406464} {"current_steps": 8170, "total_steps": 9134, "loss": 0.885, "learning_rate": 1.3616312759796079e-06, "epoch": 0.8943868195626591, "percentage": 89.45, "elapsed_time": "6 days, 5:41:37", "remaining_time": "17:39:45", "throughput": 2738.23, "total_tokens": 1475626656} {"current_steps": 8171, "total_steps": 9134, "loss": 0.5948, "learning_rate": 1.3588336405368745e-06, "epoch": 0.894496291633597, "percentage": 89.46, "elapsed_time": "6 days, 5:42:38", "remaining_time": "17:38:39", "throughput": 2738.2, "total_tokens": 1475775840} {"current_steps": 8172, "total_steps": 9134, "loss": 0.8246, "learning_rate": 1.3560388017989256e-06, "epoch": 0.8946057637045349, "percentage": 89.47, "elapsed_time": "6 days, 5:43:44", "remaining_time": "17:37:33", "throughput": 2738.26, "total_tokens": 1475989536} {"current_steps": 8173, "total_steps": 9134, "loss": 0.9701, "learning_rate": 1.3532467600963883e-06, "epoch": 0.8947152357754727, "percentage": 89.48, "elapsed_time": "6 days, 5:44:52", "remaining_time": "17:36:27", "throughput": 2738.27, "total_tokens": 1476180608} {"current_steps": 8174, "total_steps": 9134, "loss": 0.9495, "learning_rate": 1.350457515759554e-06, "epoch": 0.8948247078464107, "percentage": 89.49, "elapsed_time": "6 days, 5:45:52", "remaining_time": "17:35:21", "throughput": 2738.29, "total_tokens": 1476354432} {"current_steps": 8175, "total_steps": 9134, "loss": 0.7738, "learning_rate": 1.3476710691183837e-06, "epoch": 0.8949341799173486, "percentage": 89.5, "elapsed_time": "6 days, 5:46:58", "remaining_time": "17:34:15", "throughput": 2738.32, "total_tokens": 1476556032} {"current_steps": 8176, "total_steps": 9134, "loss": 0.7371, "learning_rate": 1.3448874205025137e-06, "epoch": 0.8950436519882865, "percentage": 89.51, "elapsed_time": "6 days, 5:48:04", "remaining_time": "17:33:09", "throughput": 2738.37, "total_tokens": 1476760544} {"current_steps": 8177, "total_steps": 9134, "loss": 0.8386, "learning_rate": 1.342106570241239e-06, "epoch": 0.8951531240592244, "percentage": 89.52, "elapsed_time": "6 days, 5:49:12", "remaining_time": "17:32:03", "throughput": 2738.42, "total_tokens": 1476972448} {"current_steps": 8178, "total_steps": 9134, "loss": 0.7986, "learning_rate": 1.3393285186635268e-06, "epoch": 0.8952625961301623, "percentage": 89.53, "elapsed_time": "6 days, 5:50:14", "remaining_time": "17:30:56", "throughput": 2738.43, "total_tokens": 1477148288} {"current_steps": 8179, "total_steps": 9134, "loss": 0.878, "learning_rate": 1.3365532660980256e-06, "epoch": 0.8953720682011002, "percentage": 89.54, "elapsed_time": "6 days, 5:51:18", "remaining_time": "17:29:50", "throughput": 2738.41, "total_tokens": 1477313152} {"current_steps": 8180, "total_steps": 9134, "loss": 0.6281, "learning_rate": 1.333780812873031e-06, "epoch": 0.8954815402720381, "percentage": 89.56, "elapsed_time": "6 days, 5:52:20", "remaining_time": "17:28:44", "throughput": 2738.37, "total_tokens": 1477464352} {"current_steps": 8181, "total_steps": 9134, "loss": 0.892, "learning_rate": 1.3310111593165254e-06, "epoch": 0.895591012342976, "percentage": 89.57, "elapsed_time": "6 days, 5:53:24", "remaining_time": "17:27:38", "throughput": 2738.4, "total_tokens": 1477651168} {"current_steps": 8182, "total_steps": 9134, "loss": 0.9016, "learning_rate": 1.3282443057561545e-06, "epoch": 0.8957004844139139, "percentage": 89.58, "elapsed_time": "6 days, 5:54:27", "remaining_time": "17:26:31", "throughput": 2738.42, "total_tokens": 1477836416} {"current_steps": 8183, "total_steps": 9134, "loss": 0.9771, "learning_rate": 1.3254802525192289e-06, "epoch": 0.8958099564848518, "percentage": 89.59, "elapsed_time": "6 days, 5:55:31", "remaining_time": "17:25:25", "throughput": 2738.43, "total_tokens": 1478016960} {"current_steps": 8184, "total_steps": 9134, "loss": 0.9035, "learning_rate": 1.3227189999327316e-06, "epoch": 0.8959194285557897, "percentage": 89.6, "elapsed_time": "6 days, 5:56:32", "remaining_time": "17:24:19", "throughput": 2738.45, "total_tokens": 1478196608} {"current_steps": 8185, "total_steps": 9134, "loss": 0.843, "learning_rate": 1.3199605483233096e-06, "epoch": 0.8960289006267276, "percentage": 89.61, "elapsed_time": "6 days, 5:57:38", "remaining_time": "17:23:13", "throughput": 2738.43, "total_tokens": 1478363936} {"current_steps": 8186, "total_steps": 9134, "loss": 0.8142, "learning_rate": 1.3172048980172935e-06, "epoch": 0.8961383726976655, "percentage": 89.62, "elapsed_time": "6 days, 5:58:42", "remaining_time": "17:22:07", "throughput": 2738.46, "total_tokens": 1478557024} {"current_steps": 8187, "total_steps": 9134, "loss": 1.0974, "learning_rate": 1.314452049340656e-06, "epoch": 0.8962478447686034, "percentage": 89.63, "elapsed_time": "6 days, 5:59:44", "remaining_time": "17:21:00", "throughput": 2738.45, "total_tokens": 1478722560} {"current_steps": 8188, "total_steps": 9134, "loss": 1.0359, "learning_rate": 1.3117020026190696e-06, "epoch": 0.8963573168395413, "percentage": 89.64, "elapsed_time": "6 days, 6:00:49", "remaining_time": "17:19:54", "throughput": 2738.49, "total_tokens": 1478919680} {"current_steps": 8189, "total_steps": 9134, "loss": 0.8444, "learning_rate": 1.3089547581778438e-06, "epoch": 0.8964667889104793, "percentage": 89.65, "elapsed_time": "6 days, 6:01:55", "remaining_time": "17:18:48", "throughput": 2738.52, "total_tokens": 1479116800} {"current_steps": 8190, "total_steps": 9134, "loss": 0.7548, "learning_rate": 1.3062103163419853e-06, "epoch": 0.8965762609814171, "percentage": 89.66, "elapsed_time": "6 days, 6:03:00", "remaining_time": "17:17:42", "throughput": 2738.54, "total_tokens": 1479304288} {"current_steps": 8191, "total_steps": 9134, "loss": 0.8489, "learning_rate": 1.303468677436151e-06, "epoch": 0.896685733052355, "percentage": 89.68, "elapsed_time": "6 days, 6:04:06", "remaining_time": "17:16:36", "throughput": 2738.53, "total_tokens": 1479482816} {"current_steps": 8192, "total_steps": 9134, "loss": 0.775, "learning_rate": 1.3007298417846731e-06, "epoch": 0.8967952051232929, "percentage": 89.69, "elapsed_time": "6 days, 6:05:13", "remaining_time": "17:15:30", "throughput": 2738.55, "total_tokens": 1479678592} {"current_steps": 8193, "total_steps": 9134, "loss": 1.0827, "learning_rate": 1.2979938097115507e-06, "epoch": 0.8969046771942308, "percentage": 89.7, "elapsed_time": "6 days, 6:06:20", "remaining_time": "17:14:24", "throughput": 2738.58, "total_tokens": 1479872352} {"current_steps": 8194, "total_steps": 9134, "loss": 1.1926, "learning_rate": 1.2952605815404445e-06, "epoch": 0.8970141492651688, "percentage": 89.71, "elapsed_time": "6 days, 6:07:26", "remaining_time": "17:13:18", "throughput": 2738.62, "total_tokens": 1480076416} {"current_steps": 8195, "total_steps": 9134, "loss": 0.8696, "learning_rate": 1.2925301575947013e-06, "epoch": 0.8971236213361067, "percentage": 89.72, "elapsed_time": "6 days, 6:08:29", "remaining_time": "17:12:12", "throughput": 2738.62, "total_tokens": 1480251808} {"current_steps": 8196, "total_steps": 9134, "loss": 0.6899, "learning_rate": 1.2898025381973155e-06, "epoch": 0.8972330934070445, "percentage": 89.73, "elapsed_time": "6 days, 6:09:27", "remaining_time": "17:11:05", "throughput": 2738.58, "total_tokens": 1480390240} {"current_steps": 8197, "total_steps": 9134, "loss": 0.8551, "learning_rate": 1.287077723670968e-06, "epoch": 0.8973425654779824, "percentage": 89.74, "elapsed_time": "6 days, 6:10:35", "remaining_time": "17:10:00", "throughput": 2738.62, "total_tokens": 1480592064} {"current_steps": 8198, "total_steps": 9134, "loss": 0.7425, "learning_rate": 1.2843557143379897e-06, "epoch": 0.8974520375489203, "percentage": 89.75, "elapsed_time": "6 days, 6:11:41", "remaining_time": "17:08:54", "throughput": 2738.62, "total_tokens": 1480778432} {"current_steps": 8199, "total_steps": 9134, "loss": 0.9109, "learning_rate": 1.2816365105203953e-06, "epoch": 0.8975615096198583, "percentage": 89.76, "elapsed_time": "6 days, 6:12:46", "remaining_time": "17:07:48", "throughput": 2738.63, "total_tokens": 1480961216} {"current_steps": 8200, "total_steps": 9134, "loss": 1.1402, "learning_rate": 1.278920112539861e-06, "epoch": 0.8976709816907962, "percentage": 89.77, "elapsed_time": "6 days, 6:13:52", "remaining_time": "17:06:42", "throughput": 2738.64, "total_tokens": 1481145568} {"current_steps": 8201, "total_steps": 9134, "loss": 0.7234, "learning_rate": 1.2762065207177292e-06, "epoch": 0.897780453761734, "percentage": 89.79, "elapsed_time": "6 days, 6:14:58", "remaining_time": "17:05:36", "throughput": 2738.65, "total_tokens": 1481329696} {"current_steps": 8202, "total_steps": 9134, "loss": 0.9701, "learning_rate": 1.273495735375016e-06, "epoch": 0.8978899258326719, "percentage": 89.8, "elapsed_time": "6 days, 6:15:58", "remaining_time": "17:04:29", "throughput": 2738.64, "total_tokens": 1481488736} {"current_steps": 8203, "total_steps": 9134, "loss": 0.8281, "learning_rate": 1.270787756832395e-06, "epoch": 0.8979993979036098, "percentage": 89.81, "elapsed_time": "6 days, 6:17:01", "remaining_time": "17:03:23", "throughput": 2738.63, "total_tokens": 1481657408} {"current_steps": 8204, "total_steps": 9134, "loss": 0.7454, "learning_rate": 1.2680825854102268e-06, "epoch": 0.8981088699745478, "percentage": 89.82, "elapsed_time": "6 days, 6:18:07", "remaining_time": "17:02:17", "throughput": 2738.62, "total_tokens": 1481832800} {"current_steps": 8205, "total_steps": 9134, "loss": 0.8103, "learning_rate": 1.2653802214285137e-06, "epoch": 0.8982183420454857, "percentage": 89.83, "elapsed_time": "6 days, 6:19:07", "remaining_time": "17:01:10", "throughput": 2738.6, "total_tokens": 1481989152} {"current_steps": 8206, "total_steps": 9134, "loss": 1.1708, "learning_rate": 1.2626806652069501e-06, "epoch": 0.8983278141164236, "percentage": 89.84, "elapsed_time": "6 days, 6:20:11", "remaining_time": "17:00:04", "throughput": 2738.6, "total_tokens": 1482159392} {"current_steps": 8207, "total_steps": 9134, "loss": 0.7148, "learning_rate": 1.259983917064886e-06, "epoch": 0.8984372861873614, "percentage": 89.85, "elapsed_time": "6 days, 6:21:14", "remaining_time": "16:58:58", "throughput": 2738.57, "total_tokens": 1482316192} {"current_steps": 8208, "total_steps": 9134, "loss": 0.9127, "learning_rate": 1.2572899773213437e-06, "epoch": 0.8985467582582993, "percentage": 89.86, "elapsed_time": "6 days, 6:22:21", "remaining_time": "16:57:52", "throughput": 2738.58, "total_tokens": 1482507264} {"current_steps": 8209, "total_steps": 9134, "loss": 0.9315, "learning_rate": 1.2545988462950077e-06, "epoch": 0.8986562303292372, "percentage": 89.87, "elapsed_time": "6 days, 6:23:28", "remaining_time": "16:56:46", "throughput": 2738.57, "total_tokens": 1482684448} {"current_steps": 8210, "total_steps": 9134, "loss": 0.6121, "learning_rate": 1.251910524304234e-06, "epoch": 0.8987657024001752, "percentage": 89.88, "elapsed_time": "6 days, 6:24:30", "remaining_time": "16:55:40", "throughput": 2738.56, "total_tokens": 1482849760} {"current_steps": 8211, "total_steps": 9134, "loss": 1.0885, "learning_rate": 1.249225011667046e-06, "epoch": 0.8988751744711131, "percentage": 89.89, "elapsed_time": "6 days, 6:25:31", "remaining_time": "16:54:33", "throughput": 2738.57, "total_tokens": 1483023136} {"current_steps": 8212, "total_steps": 9134, "loss": 0.7088, "learning_rate": 1.246542308701132e-06, "epoch": 0.898984646542051, "percentage": 89.91, "elapsed_time": "6 days, 6:26:36", "remaining_time": "16:53:27", "throughput": 2738.59, "total_tokens": 1483213088} {"current_steps": 8213, "total_steps": 9134, "loss": 0.7588, "learning_rate": 1.2438624157238593e-06, "epoch": 0.8990941186129888, "percentage": 89.92, "elapsed_time": "6 days, 6:27:38", "remaining_time": "16:52:21", "throughput": 2738.59, "total_tokens": 1483377728} {"current_steps": 8214, "total_steps": 9134, "loss": 0.8855, "learning_rate": 1.2411853330522472e-06, "epoch": 0.8992035906839267, "percentage": 89.93, "elapsed_time": "6 days, 6:28:43", "remaining_time": "16:51:15", "throughput": 2738.57, "total_tokens": 1483546400} {"current_steps": 8215, "total_steps": 9134, "loss": 0.9485, "learning_rate": 1.238511061002992e-06, "epoch": 0.8993130627548647, "percentage": 89.94, "elapsed_time": "6 days, 6:29:47", "remaining_time": "16:50:09", "throughput": 2738.54, "total_tokens": 1483706112} {"current_steps": 8216, "total_steps": 9134, "loss": 0.9716, "learning_rate": 1.235839599892455e-06, "epoch": 0.8994225348258026, "percentage": 89.95, "elapsed_time": "6 days, 6:30:53", "remaining_time": "16:49:03", "throughput": 2738.56, "total_tokens": 1483898528} {"current_steps": 8217, "total_steps": 9134, "loss": 0.9124, "learning_rate": 1.2331709500366606e-06, "epoch": 0.8995320068967405, "percentage": 89.96, "elapsed_time": "6 days, 6:31:58", "remaining_time": "16:47:56", "throughput": 2738.59, "total_tokens": 1484089600} {"current_steps": 8218, "total_steps": 9134, "loss": 0.8838, "learning_rate": 1.2305051117513067e-06, "epoch": 0.8996414789676783, "percentage": 89.97, "elapsed_time": "6 days, 6:32:58", "remaining_time": "16:46:50", "throughput": 2738.56, "total_tokens": 1484239008} {"current_steps": 8219, "total_steps": 9134, "loss": 0.9587, "learning_rate": 1.2278420853517658e-06, "epoch": 0.8997509510386162, "percentage": 89.98, "elapsed_time": "6 days, 6:34:04", "remaining_time": "16:45:44", "throughput": 2738.55, "total_tokens": 1484414400} {"current_steps": 8220, "total_steps": 9134, "loss": 0.8158, "learning_rate": 1.2251818711530556e-06, "epoch": 0.8998604231095542, "percentage": 89.99, "elapsed_time": "6 days, 6:35:09", "remaining_time": "16:44:38", "throughput": 2738.55, "total_tokens": 1484593376} {"current_steps": 8221, "total_steps": 9134, "loss": 0.831, "learning_rate": 1.222524469469885e-06, "epoch": 0.8999698951804921, "percentage": 90.0, "elapsed_time": "6 days, 6:36:12", "remaining_time": "16:43:32", "throughput": 2738.57, "total_tokens": 1484776160} {"current_steps": 8222, "total_steps": 9134, "loss": 0.8508, "learning_rate": 1.2198698806166086e-06, "epoch": 0.90007936725143, "percentage": 90.02, "elapsed_time": "6 days, 6:37:17", "remaining_time": "16:42:26", "throughput": 2738.61, "total_tokens": 1484975744} {"current_steps": 8223, "total_steps": 9134, "loss": 0.9728, "learning_rate": 1.2172181049072695e-06, "epoch": 0.9001888393223679, "percentage": 90.03, "elapsed_time": "6 days, 6:38:24", "remaining_time": "16:41:20", "throughput": 2738.64, "total_tokens": 1485174208} {"current_steps": 8224, "total_steps": 9134, "loss": 0.839, "learning_rate": 1.214569142655564e-06, "epoch": 0.9002983113933057, "percentage": 90.04, "elapsed_time": "6 days, 6:39:26", "remaining_time": "16:40:13", "throughput": 2738.65, "total_tokens": 1485350272} {"current_steps": 8225, "total_steps": 9134, "loss": 1.0387, "learning_rate": 1.211922994174855e-06, "epoch": 0.9004077834642437, "percentage": 90.05, "elapsed_time": "6 days, 6:40:30", "remaining_time": "16:39:07", "throughput": 2738.67, "total_tokens": 1485539776} {"current_steps": 8226, "total_steps": 9134, "loss": 0.7375, "learning_rate": 1.209279659778187e-06, "epoch": 0.9005172555351816, "percentage": 90.06, "elapsed_time": "6 days, 6:41:34", "remaining_time": "16:38:01", "throughput": 2738.68, "total_tokens": 1485720096} {"current_steps": 8227, "total_steps": 9134, "loss": 0.8056, "learning_rate": 1.2066391397782484e-06, "epoch": 0.9006267276061195, "percentage": 90.07, "elapsed_time": "6 days, 6:42:41", "remaining_time": "16:36:55", "throughput": 2738.69, "total_tokens": 1485908480} {"current_steps": 8228, "total_steps": 9134, "loss": 0.776, "learning_rate": 1.204001434487423e-06, "epoch": 0.9007361996770574, "percentage": 90.08, "elapsed_time": "6 days, 6:43:42", "remaining_time": "16:35:49", "throughput": 2738.64, "total_tokens": 1486050272} {"current_steps": 8229, "total_steps": 9134, "loss": 0.8227, "learning_rate": 1.2013665442177275e-06, "epoch": 0.9008456717479953, "percentage": 90.09, "elapsed_time": "6 days, 6:44:50", "remaining_time": "16:34:43", "throughput": 2738.69, "total_tokens": 1486258592} {"current_steps": 8230, "total_steps": 9134, "loss": 0.7831, "learning_rate": 1.1987344692808849e-06, "epoch": 0.9009551438189332, "percentage": 90.1, "elapsed_time": "6 days, 6:45:52", "remaining_time": "16:33:37", "throughput": 2738.7, "total_tokens": 1486437792} {"current_steps": 8231, "total_steps": 9134, "loss": 0.748, "learning_rate": 1.1961052099882435e-06, "epoch": 0.9010646158898711, "percentage": 90.11, "elapsed_time": "6 days, 6:46:54", "remaining_time": "16:32:30", "throughput": 2738.7, "total_tokens": 1486608704} {"current_steps": 8232, "total_steps": 9134, "loss": 0.8954, "learning_rate": 1.1934787666508573e-06, "epoch": 0.901174087960809, "percentage": 90.12, "elapsed_time": "6 days, 6:47:56", "remaining_time": "16:31:24", "throughput": 2738.71, "total_tokens": 1486783648} {"current_steps": 8233, "total_steps": 9134, "loss": 0.7173, "learning_rate": 1.190855139579422e-06, "epoch": 0.9012835600317469, "percentage": 90.14, "elapsed_time": "6 days, 6:48:59", "remaining_time": "16:30:17", "throughput": 2738.73, "total_tokens": 1486965312} {"current_steps": 8234, "total_steps": 9134, "loss": 1.1024, "learning_rate": 1.1882343290843063e-06, "epoch": 0.9013930321026848, "percentage": 90.15, "elapsed_time": "6 days, 6:50:04", "remaining_time": "16:29:12", "throughput": 2738.75, "total_tokens": 1487155936} {"current_steps": 8235, "total_steps": 9134, "loss": 1.03, "learning_rate": 1.1856163354755505e-06, "epoch": 0.9015025041736227, "percentage": 90.16, "elapsed_time": "6 days, 6:51:09", "remaining_time": "16:28:05", "throughput": 2738.72, "total_tokens": 1487315872} {"current_steps": 8236, "total_steps": 9134, "loss": 1.0913, "learning_rate": 1.1830011590628547e-06, "epoch": 0.9016119762445606, "percentage": 90.17, "elapsed_time": "6 days, 6:52:16", "remaining_time": "16:27:00", "throughput": 2738.72, "total_tokens": 1487497984} {"current_steps": 8237, "total_steps": 9134, "loss": 0.7215, "learning_rate": 1.1803888001555963e-06, "epoch": 0.9017214483154985, "percentage": 90.18, "elapsed_time": "6 days, 6:53:20", "remaining_time": "16:25:53", "throughput": 2738.72, "total_tokens": 1487675840} {"current_steps": 8238, "total_steps": 9134, "loss": 0.958, "learning_rate": 1.1777792590628028e-06, "epoch": 0.9018309203864364, "percentage": 90.19, "elapsed_time": "6 days, 6:54:24", "remaining_time": "16:24:47", "throughput": 2738.74, "total_tokens": 1487861088} {"current_steps": 8239, "total_steps": 9134, "loss": 0.822, "learning_rate": 1.175172536093183e-06, "epoch": 0.9019403924573743, "percentage": 90.2, "elapsed_time": "6 days, 6:55:27", "remaining_time": "16:23:41", "throughput": 2738.76, "total_tokens": 1488042528} {"current_steps": 8240, "total_steps": 9134, "loss": 0.9403, "learning_rate": 1.1725686315551099e-06, "epoch": 0.9020498645283123, "percentage": 90.21, "elapsed_time": "6 days, 6:56:32", "remaining_time": "16:22:35", "throughput": 2738.78, "total_tokens": 1488231808} {"current_steps": 8241, "total_steps": 9134, "loss": 1.0121, "learning_rate": 1.1699675457566144e-06, "epoch": 0.9021593365992501, "percentage": 90.22, "elapsed_time": "6 days, 6:57:37", "remaining_time": "16:21:29", "throughput": 2738.8, "total_tokens": 1488421984} {"current_steps": 8242, "total_steps": 9134, "loss": 0.8738, "learning_rate": 1.1673692790054063e-06, "epoch": 0.902268808670188, "percentage": 90.23, "elapsed_time": "6 days, 6:58:36", "remaining_time": "16:20:22", "throughput": 2738.75, "total_tokens": 1488556160} {"current_steps": 8243, "total_steps": 9134, "loss": 0.8242, "learning_rate": 1.1647738316088508e-06, "epoch": 0.9023782807411259, "percentage": 90.25, "elapsed_time": "6 days, 6:59:40", "remaining_time": "16:19:16", "throughput": 2738.79, "total_tokens": 1488752160} {"current_steps": 8244, "total_steps": 9134, "loss": 0.7347, "learning_rate": 1.1621812038739855e-06, "epoch": 0.9024877528120638, "percentage": 90.26, "elapsed_time": "6 days, 7:00:48", "remaining_time": "16:18:10", "throughput": 2738.83, "total_tokens": 1488958688} {"current_steps": 8245, "total_steps": 9134, "loss": 1.034, "learning_rate": 1.1595913961075094e-06, "epoch": 0.9025972248830018, "percentage": 90.27, "elapsed_time": "6 days, 7:01:53", "remaining_time": "16:17:04", "throughput": 2738.85, "total_tokens": 1489147968} {"current_steps": 8246, "total_steps": 9134, "loss": 0.8037, "learning_rate": 1.1570044086158e-06, "epoch": 0.9027066969539397, "percentage": 90.28, "elapsed_time": "6 days, 7:02:56", "remaining_time": "16:15:58", "throughput": 2738.86, "total_tokens": 1489328288} {"current_steps": 8247, "total_steps": 9134, "loss": 0.516, "learning_rate": 1.15442024170489e-06, "epoch": 0.9028161690248775, "percentage": 90.29, "elapsed_time": "6 days, 7:03:59", "remaining_time": "16:14:52", "throughput": 2738.87, "total_tokens": 1489507488} {"current_steps": 8248, "total_steps": 9134, "loss": 0.8438, "learning_rate": 1.1518388956804793e-06, "epoch": 0.9029256410958154, "percentage": 90.3, "elapsed_time": "6 days, 7:05:04", "remaining_time": "16:13:46", "throughput": 2738.89, "total_tokens": 1489695200} {"current_steps": 8249, "total_steps": 9134, "loss": 0.9425, "learning_rate": 1.149260370847935e-06, "epoch": 0.9030351131667533, "percentage": 90.31, "elapsed_time": "6 days, 7:06:08", "remaining_time": "16:12:40", "throughput": 2738.87, "total_tokens": 1489855360} {"current_steps": 8250, "total_steps": 9134, "loss": 0.7014, "learning_rate": 1.1466846675122988e-06, "epoch": 0.9031445852376913, "percentage": 90.32, "elapsed_time": "6 days, 7:07:02", "remaining_time": "16:11:32", "throughput": 2738.81, "total_tokens": 1489975872} {"current_steps": 8251, "total_steps": 9134, "loss": 0.942, "learning_rate": 1.1441117859782636e-06, "epoch": 0.9032540573086292, "percentage": 90.33, "elapsed_time": "6 days, 7:08:07", "remaining_time": "16:10:26", "throughput": 2738.83, "total_tokens": 1490164032} {"current_steps": 8252, "total_steps": 9134, "loss": 0.7039, "learning_rate": 1.1415417265501993e-06, "epoch": 0.903363529379567, "percentage": 90.34, "elapsed_time": "6 days, 7:09:13", "remaining_time": "16:09:20", "throughput": 2738.81, "total_tokens": 1490330688} {"current_steps": 8253, "total_steps": 9134, "loss": 0.8314, "learning_rate": 1.138974489532138e-06, "epoch": 0.9034730014505049, "percentage": 90.35, "elapsed_time": "6 days, 7:10:19", "remaining_time": "16:08:14", "throughput": 2738.84, "total_tokens": 1490529824} {"current_steps": 8254, "total_steps": 9134, "loss": 0.7096, "learning_rate": 1.1364100752277812e-06, "epoch": 0.9035824735214428, "percentage": 90.37, "elapsed_time": "6 days, 7:11:24", "remaining_time": "16:07:08", "throughput": 2738.87, "total_tokens": 1490724256} {"current_steps": 8255, "total_steps": 9134, "loss": 1.0336, "learning_rate": 1.1338484839404944e-06, "epoch": 0.9036919455923808, "percentage": 90.38, "elapsed_time": "6 days, 7:12:29", "remaining_time": "16:06:02", "throughput": 2738.85, "total_tokens": 1490889792} {"current_steps": 8256, "total_steps": 9134, "loss": 0.6998, "learning_rate": 1.131289715973305e-06, "epoch": 0.9038014176633187, "percentage": 90.39, "elapsed_time": "6 days, 7:13:34", "remaining_time": "16:04:56", "throughput": 2738.83, "total_tokens": 1491058016} {"current_steps": 8257, "total_steps": 9134, "loss": 0.9641, "learning_rate": 1.1287337716289149e-06, "epoch": 0.9039108897342566, "percentage": 90.4, "elapsed_time": "6 days, 7:14:39", "remaining_time": "16:03:50", "throughput": 2738.84, "total_tokens": 1491242816} {"current_steps": 8258, "total_steps": 9134, "loss": 0.9602, "learning_rate": 1.1261806512096878e-06, "epoch": 0.9040203618051944, "percentage": 90.41, "elapsed_time": "6 days, 7:15:45", "remaining_time": "16:02:44", "throughput": 2738.86, "total_tokens": 1491435904} {"current_steps": 8259, "total_steps": 9134, "loss": 1.0269, "learning_rate": 1.1236303550176463e-06, "epoch": 0.9041298338761323, "percentage": 90.42, "elapsed_time": "6 days, 7:16:49", "remaining_time": "16:01:38", "throughput": 2738.84, "total_tokens": 1491595616} {"current_steps": 8260, "total_steps": 9134, "loss": 0.933, "learning_rate": 1.1210828833544907e-06, "epoch": 0.9042393059470702, "percentage": 90.43, "elapsed_time": "6 days, 7:17:54", "remaining_time": "16:00:32", "throughput": 2738.85, "total_tokens": 1491778624} {"current_steps": 8261, "total_steps": 9134, "loss": 0.777, "learning_rate": 1.1185382365215853e-06, "epoch": 0.9043487780180082, "percentage": 90.44, "elapsed_time": "6 days, 7:19:01", "remaining_time": "15:59:26", "throughput": 2738.86, "total_tokens": 1491972160} {"current_steps": 8262, "total_steps": 9134, "loss": 1.0945, "learning_rate": 1.1159964148199475e-06, "epoch": 0.9044582500889461, "percentage": 90.45, "elapsed_time": "6 days, 7:20:08", "remaining_time": "15:58:20", "throughput": 2738.91, "total_tokens": 1492178912} {"current_steps": 8263, "total_steps": 9134, "loss": 0.9078, "learning_rate": 1.1134574185502816e-06, "epoch": 0.904567722159884, "percentage": 90.46, "elapsed_time": "6 days, 7:21:15", "remaining_time": "15:57:15", "throughput": 2738.96, "total_tokens": 1492392160} {"current_steps": 8264, "total_steps": 9134, "loss": 0.7378, "learning_rate": 1.1109212480129334e-06, "epoch": 0.9046771942308218, "percentage": 90.48, "elapsed_time": "6 days, 7:22:18", "remaining_time": "15:56:08", "throughput": 2738.98, "total_tokens": 1492574944} {"current_steps": 8265, "total_steps": 9134, "loss": 0.7589, "learning_rate": 1.1083879035079349e-06, "epoch": 0.9047866663017597, "percentage": 90.49, "elapsed_time": "6 days, 7:23:22", "remaining_time": "15:55:02", "throughput": 2739.0, "total_tokens": 1492760864} {"current_steps": 8266, "total_steps": 9134, "loss": 0.9072, "learning_rate": 1.105857385334977e-06, "epoch": 0.9048961383726977, "percentage": 90.5, "elapsed_time": "6 days, 7:24:20", "remaining_time": "15:53:55", "throughput": 2738.99, "total_tokens": 1492913632} {"current_steps": 8267, "total_steps": 9134, "loss": 0.9772, "learning_rate": 1.1033296937934061e-06, "epoch": 0.9050056104436356, "percentage": 90.51, "elapsed_time": "6 days, 7:25:25", "remaining_time": "15:52:49", "throughput": 2739.02, "total_tokens": 1493112096} {"current_steps": 8268, "total_steps": 9134, "loss": 0.8122, "learning_rate": 1.1008048291822588e-06, "epoch": 0.9051150825145735, "percentage": 90.52, "elapsed_time": "6 days, 7:26:24", "remaining_time": "15:51:43", "throughput": 2738.98, "total_tokens": 1493247168} {"current_steps": 8269, "total_steps": 9134, "loss": 0.8768, "learning_rate": 1.0982827918002065e-06, "epoch": 0.9052245545855113, "percentage": 90.53, "elapsed_time": "6 days, 7:27:31", "remaining_time": "15:50:37", "throughput": 2739.01, "total_tokens": 1493450560} {"current_steps": 8270, "total_steps": 9134, "loss": 1.0532, "learning_rate": 1.0957635819456135e-06, "epoch": 0.9053340266564492, "percentage": 90.54, "elapsed_time": "6 days, 7:28:35", "remaining_time": "15:49:31", "throughput": 2739.01, "total_tokens": 1493625280} {"current_steps": 8271, "total_steps": 9134, "loss": 0.8289, "learning_rate": 1.0932471999164835e-06, "epoch": 0.9054434987273872, "percentage": 90.55, "elapsed_time": "6 days, 7:29:40", "remaining_time": "15:48:25", "throughput": 2739.06, "total_tokens": 1493830688} {"current_steps": 8272, "total_steps": 9134, "loss": 1.2016, "learning_rate": 1.0907336460105166e-06, "epoch": 0.9055529707983251, "percentage": 90.56, "elapsed_time": "6 days, 7:30:46", "remaining_time": "15:47:19", "throughput": 2739.13, "total_tokens": 1494045728} {"current_steps": 8273, "total_steps": 9134, "loss": 0.9235, "learning_rate": 1.088222920525045e-06, "epoch": 0.905662442869263, "percentage": 90.57, "elapsed_time": "6 days, 7:31:50", "remaining_time": "15:46:13", "throughput": 2739.09, "total_tokens": 1494203200} {"current_steps": 8274, "total_steps": 9134, "loss": 1.0415, "learning_rate": 1.0857150237570946e-06, "epoch": 0.9057719149402009, "percentage": 90.58, "elapsed_time": "6 days, 7:32:56", "remaining_time": "15:45:07", "throughput": 2739.09, "total_tokens": 1494382848} {"current_steps": 8275, "total_steps": 9134, "loss": 0.9335, "learning_rate": 1.0832099560033394e-06, "epoch": 0.9058813870111387, "percentage": 90.6, "elapsed_time": "6 days, 7:34:04", "remaining_time": "15:44:01", "throughput": 2739.12, "total_tokens": 1494586240} {"current_steps": 8276, "total_steps": 9134, "loss": 0.8872, "learning_rate": 1.0807077175601255e-06, "epoch": 0.9059908590820767, "percentage": 90.61, "elapsed_time": "6 days, 7:35:09", "remaining_time": "15:42:55", "throughput": 2739.15, "total_tokens": 1494782464} {"current_steps": 8277, "total_steps": 9134, "loss": 0.7234, "learning_rate": 1.0782083087234608e-06, "epoch": 0.9061003311530146, "percentage": 90.62, "elapsed_time": "6 days, 7:36:14", "remaining_time": "15:41:49", "throughput": 2739.17, "total_tokens": 1494966816} {"current_steps": 8278, "total_steps": 9134, "loss": 0.7995, "learning_rate": 1.0757117297890224e-06, "epoch": 0.9062098032239525, "percentage": 90.63, "elapsed_time": "6 days, 7:37:20", "remaining_time": "15:40:43", "throughput": 2739.2, "total_tokens": 1495166624} {"current_steps": 8279, "total_steps": 9134, "loss": 1.1398, "learning_rate": 1.073217981052152e-06, "epoch": 0.9063192752948904, "percentage": 90.64, "elapsed_time": "6 days, 7:38:24", "remaining_time": "15:39:37", "throughput": 2739.2, "total_tokens": 1495342688} {"current_steps": 8280, "total_steps": 9134, "loss": 0.8177, "learning_rate": 1.0707270628078552e-06, "epoch": 0.9064287473658283, "percentage": 90.65, "elapsed_time": "6 days, 7:39:28", "remaining_time": "15:38:31", "throughput": 2739.24, "total_tokens": 1495539584} {"current_steps": 8281, "total_steps": 9134, "loss": 1.036, "learning_rate": 1.0682389753508021e-06, "epoch": 0.9065382194367662, "percentage": 90.66, "elapsed_time": "6 days, 7:40:28", "remaining_time": "15:37:24", "throughput": 2739.21, "total_tokens": 1495686080} {"current_steps": 8282, "total_steps": 9134, "loss": 1.1312, "learning_rate": 1.065753718975329e-06, "epoch": 0.9066476915077041, "percentage": 90.67, "elapsed_time": "6 days, 7:41:33", "remaining_time": "15:36:18", "throughput": 2739.22, "total_tokens": 1495872000} {"current_steps": 8283, "total_steps": 9134, "loss": 0.8706, "learning_rate": 1.0632712939754347e-06, "epoch": 0.906757163578642, "percentage": 90.68, "elapsed_time": "6 days, 7:42:34", "remaining_time": "15:35:12", "throughput": 2739.18, "total_tokens": 1496014912} {"current_steps": 8284, "total_steps": 9134, "loss": 0.9748, "learning_rate": 1.0607917006447865e-06, "epoch": 0.9068666356495799, "percentage": 90.69, "elapsed_time": "6 days, 7:43:38", "remaining_time": "15:34:06", "throughput": 2739.2, "total_tokens": 1496203520} {"current_steps": 8285, "total_steps": 9134, "loss": 1.209, "learning_rate": 1.0583149392767195e-06, "epoch": 0.9069761077205178, "percentage": 90.71, "elapsed_time": "6 days, 7:44:46", "remaining_time": "15:33:00", "throughput": 2739.24, "total_tokens": 1496410272} {"current_steps": 8286, "total_steps": 9134, "loss": 1.0296, "learning_rate": 1.0558410101642213e-06, "epoch": 0.9070855797914557, "percentage": 90.72, "elapsed_time": "6 days, 7:45:51", "remaining_time": "15:31:54", "throughput": 2739.27, "total_tokens": 1496605600} {"current_steps": 8287, "total_steps": 9134, "loss": 0.95, "learning_rate": 1.0533699135999608e-06, "epoch": 0.9071950518623936, "percentage": 90.73, "elapsed_time": "6 days, 7:46:54", "remaining_time": "15:30:48", "throughput": 2739.27, "total_tokens": 1496776736} {"current_steps": 8288, "total_steps": 9134, "loss": 0.8804, "learning_rate": 1.0509016498762625e-06, "epoch": 0.9073045239333315, "percentage": 90.74, "elapsed_time": "6 days, 7:47:58", "remaining_time": "15:29:41", "throughput": 2739.3, "total_tokens": 1496968480} {"current_steps": 8289, "total_steps": 9134, "loss": 0.6753, "learning_rate": 1.0484362192851149e-06, "epoch": 0.9074139960042694, "percentage": 90.75, "elapsed_time": "6 days, 7:49:01", "remaining_time": "15:28:35", "throughput": 2739.32, "total_tokens": 1497154848} {"current_steps": 8290, "total_steps": 9134, "loss": 0.8413, "learning_rate": 1.0459736221181766e-06, "epoch": 0.9075234680752073, "percentage": 90.76, "elapsed_time": "6 days, 7:50:06", "remaining_time": "15:27:29", "throughput": 2739.34, "total_tokens": 1497342336} {"current_steps": 8291, "total_steps": 9134, "loss": 0.847, "learning_rate": 1.0435138586667641e-06, "epoch": 0.9076329401461453, "percentage": 90.77, "elapsed_time": "6 days, 7:51:07", "remaining_time": "15:26:23", "throughput": 2739.34, "total_tokens": 1497511008} {"current_steps": 8292, "total_steps": 9134, "loss": 0.8252, "learning_rate": 1.0410569292218676e-06, "epoch": 0.9077424122170831, "percentage": 90.78, "elapsed_time": "6 days, 7:52:08", "remaining_time": "15:25:16", "throughput": 2739.33, "total_tokens": 1497671616} {"current_steps": 8293, "total_steps": 9134, "loss": 0.8048, "learning_rate": 1.038602834074129e-06, "epoch": 0.907851884288021, "percentage": 90.79, "elapsed_time": "6 days, 7:53:14", "remaining_time": "15:24:10", "throughput": 2739.34, "total_tokens": 1497853280} {"current_steps": 8294, "total_steps": 9134, "loss": 0.9138, "learning_rate": 1.0361515735138772e-06, "epoch": 0.9079613563589589, "percentage": 90.8, "elapsed_time": "6 days, 7:54:18", "remaining_time": "15:23:04", "throughput": 2739.36, "total_tokens": 1498044800} {"current_steps": 8295, "total_steps": 9134, "loss": 0.7592, "learning_rate": 1.0337031478310749e-06, "epoch": 0.9080708284298968, "percentage": 90.81, "elapsed_time": "6 days, 7:55:21", "remaining_time": "15:21:58", "throughput": 2739.37, "total_tokens": 1498220416} {"current_steps": 8296, "total_steps": 9134, "loss": 0.7531, "learning_rate": 1.0312575573153792e-06, "epoch": 0.9081803005008348, "percentage": 90.83, "elapsed_time": "6 days, 7:56:24", "remaining_time": "15:20:52", "throughput": 2739.35, "total_tokens": 1498384608} {"current_steps": 8297, "total_steps": 9134, "loss": 0.8312, "learning_rate": 1.0288148022560923e-06, "epoch": 0.9082897725717727, "percentage": 90.84, "elapsed_time": "6 days, 7:57:32", "remaining_time": "15:19:46", "throughput": 2739.37, "total_tokens": 1498575680} {"current_steps": 8298, "total_steps": 9134, "loss": 0.7952, "learning_rate": 1.026374882942191e-06, "epoch": 0.9083992446427105, "percentage": 90.85, "elapsed_time": "6 days, 7:58:39", "remaining_time": "15:18:40", "throughput": 2739.37, "total_tokens": 1498764736} {"current_steps": 8299, "total_steps": 9134, "loss": 1.1108, "learning_rate": 1.0239377996623112e-06, "epoch": 0.9085087167136484, "percentage": 90.86, "elapsed_time": "6 days, 7:59:46", "remaining_time": "15:17:34", "throughput": 2739.37, "total_tokens": 1498947968} {"current_steps": 8300, "total_steps": 9134, "loss": 0.9321, "learning_rate": 1.02150355270475e-06, "epoch": 0.9086181887845863, "percentage": 90.87, "elapsed_time": "6 days, 8:00:50", "remaining_time": "15:16:28", "throughput": 2739.4, "total_tokens": 1499139040} {"current_steps": 8301, "total_steps": 9134, "loss": 0.8652, "learning_rate": 1.0190721423574884e-06, "epoch": 0.9087276608555243, "percentage": 90.88, "elapsed_time": "6 days, 8:01:52", "remaining_time": "15:15:22", "throughput": 2739.41, "total_tokens": 1499316224} {"current_steps": 8302, "total_steps": 9134, "loss": 0.9271, "learning_rate": 1.0166435689081404e-06, "epoch": 0.9088371329264622, "percentage": 90.89, "elapsed_time": "6 days, 8:02:55", "remaining_time": "15:14:16", "throughput": 2739.43, "total_tokens": 1499499680} {"current_steps": 8303, "total_steps": 9134, "loss": 0.8369, "learning_rate": 1.0142178326440155e-06, "epoch": 0.9089466049974, "percentage": 90.9, "elapsed_time": "6 days, 8:03:56", "remaining_time": "15:13:09", "throughput": 2739.42, "total_tokens": 1499658272} {"current_steps": 8304, "total_steps": 9134, "loss": 0.9242, "learning_rate": 1.0117949338520645e-06, "epoch": 0.9090560770683379, "percentage": 90.91, "elapsed_time": "6 days, 8:04:57", "remaining_time": "15:12:03", "throughput": 2739.4, "total_tokens": 1499815520} {"current_steps": 8305, "total_steps": 9134, "loss": 0.6883, "learning_rate": 1.009374872818919e-06, "epoch": 0.9091655491392758, "percentage": 90.92, "elapsed_time": "6 days, 8:05:59", "remaining_time": "15:10:57", "throughput": 2739.35, "total_tokens": 1499959104} {"current_steps": 8306, "total_steps": 9134, "loss": 0.9726, "learning_rate": 1.0069576498308587e-06, "epoch": 0.9092750212102138, "percentage": 90.93, "elapsed_time": "6 days, 8:07:05", "remaining_time": "15:09:51", "throughput": 2739.4, "total_tokens": 1500167648} {"current_steps": 8307, "total_steps": 9134, "loss": 1.0508, "learning_rate": 1.0045432651738434e-06, "epoch": 0.9093844932811517, "percentage": 90.95, "elapsed_time": "6 days, 8:08:03", "remaining_time": "15:08:44", "throughput": 2739.37, "total_tokens": 1500309216} {"current_steps": 8308, "total_steps": 9134, "loss": 0.693, "learning_rate": 1.0021317191334895e-06, "epoch": 0.9094939653520896, "percentage": 90.96, "elapsed_time": "6 days, 8:09:07", "remaining_time": "15:07:38", "throughput": 2739.38, "total_tokens": 1500491328} {"current_steps": 8309, "total_steps": 9134, "loss": 0.8125, "learning_rate": 9.99723011995074e-07, "epoch": 0.9096034374230274, "percentage": 90.97, "elapsed_time": "6 days, 8:10:06", "remaining_time": "15:06:31", "throughput": 2739.36, "total_tokens": 1500638496} {"current_steps": 8310, "total_steps": 9134, "loss": 0.9299, "learning_rate": 9.973171440435524e-07, "epoch": 0.9097129094939653, "percentage": 90.98, "elapsed_time": "6 days, 8:11:07", "remaining_time": "15:05:25", "throughput": 2739.37, "total_tokens": 1500813888} {"current_steps": 8311, "total_steps": 9134, "loss": 0.9402, "learning_rate": 9.949141155635194e-07, "epoch": 0.9098223815649032, "percentage": 90.99, "elapsed_time": "6 days, 8:12:11", "remaining_time": "15:04:19", "throughput": 2739.37, "total_tokens": 1500988608} {"current_steps": 8312, "total_steps": 9134, "loss": 0.9988, "learning_rate": 9.925139268392614e-07, "epoch": 0.9099318536358412, "percentage": 91.0, "elapsed_time": "6 days, 8:13:16", "remaining_time": "15:03:13", "throughput": 2739.39, "total_tokens": 1501179008} {"current_steps": 8313, "total_steps": 9134, "loss": 0.9574, "learning_rate": 9.901165781547096e-07, "epoch": 0.9100413257067791, "percentage": 91.01, "elapsed_time": "6 days, 8:14:21", "remaining_time": "15:02:07", "throughput": 2739.42, "total_tokens": 1501369184} {"current_steps": 8314, "total_steps": 9134, "loss": 1.0071, "learning_rate": 9.877220697934674e-07, "epoch": 0.910150797777717, "percentage": 91.02, "elapsed_time": "6 days, 8:15:25", "remaining_time": "15:01:01", "throughput": 2739.45, "total_tokens": 1501565632} {"current_steps": 8315, "total_steps": 9134, "loss": 1.0336, "learning_rate": 9.853304020388005e-07, "epoch": 0.9102602698486548, "percentage": 91.03, "elapsed_time": "6 days, 8:16:32", "remaining_time": "14:59:55", "throughput": 2739.47, "total_tokens": 1501753792} {"current_steps": 8316, "total_steps": 9134, "loss": 0.8269, "learning_rate": 9.829415751736404e-07, "epoch": 0.9103697419195927, "percentage": 91.04, "elapsed_time": "6 days, 8:17:38", "remaining_time": "14:58:49", "throughput": 2739.5, "total_tokens": 1501953376} {"current_steps": 8317, "total_steps": 9134, "loss": 1.1037, "learning_rate": 9.805555894805778e-07, "epoch": 0.9104792139905307, "percentage": 91.06, "elapsed_time": "6 days, 8:18:46", "remaining_time": "14:57:43", "throughput": 2739.53, "total_tokens": 1502156768} {"current_steps": 8318, "total_steps": 9134, "loss": 0.8832, "learning_rate": 9.781724452418733e-07, "epoch": 0.9105886860614686, "percentage": 91.07, "elapsed_time": "6 days, 8:19:48", "remaining_time": "14:56:37", "throughput": 2739.56, "total_tokens": 1502339552} {"current_steps": 8319, "total_steps": 9134, "loss": 0.8312, "learning_rate": 9.757921427394457e-07, "epoch": 0.9106981581324065, "percentage": 91.08, "elapsed_time": "6 days, 8:20:49", "remaining_time": "14:55:30", "throughput": 2739.53, "total_tokens": 1502492320} {"current_steps": 8320, "total_steps": 9134, "loss": 0.7666, "learning_rate": 9.73414682254878e-07, "epoch": 0.9108076302033443, "percentage": 91.09, "elapsed_time": "6 days, 8:21:54", "remaining_time": "14:54:24", "throughput": 2739.55, "total_tokens": 1502681376} {"current_steps": 8321, "total_steps": 9134, "loss": 0.8382, "learning_rate": 9.710400640694228e-07, "epoch": 0.9109171022742822, "percentage": 91.1, "elapsed_time": "6 days, 8:23:01", "remaining_time": "14:53:18", "throughput": 2739.52, "total_tokens": 1502850944} {"current_steps": 8322, "total_steps": 9134, "loss": 0.7403, "learning_rate": 9.686682884639948e-07, "epoch": 0.9110265743452202, "percentage": 91.11, "elapsed_time": "6 days, 8:24:08", "remaining_time": "14:52:13", "throughput": 2739.48, "total_tokens": 1503009984} {"current_steps": 8323, "total_steps": 9134, "loss": 0.7701, "learning_rate": 9.662993557191691e-07, "epoch": 0.9111360464161581, "percentage": 91.12, "elapsed_time": "6 days, 8:25:11", "remaining_time": "14:51:06", "throughput": 2739.5, "total_tokens": 1503198368} {"current_steps": 8324, "total_steps": 9134, "loss": 0.942, "learning_rate": 9.639332661151856e-07, "epoch": 0.911245518487096, "percentage": 91.13, "elapsed_time": "6 days, 8:26:15", "remaining_time": "14:50:00", "throughput": 2739.51, "total_tokens": 1503374880} {"current_steps": 8325, "total_steps": 9134, "loss": 0.7965, "learning_rate": 9.615700199319455e-07, "epoch": 0.9113549905580339, "percentage": 91.14, "elapsed_time": "6 days, 8:27:22", "remaining_time": "14:48:54", "throughput": 2739.54, "total_tokens": 1503576256} {"current_steps": 8326, "total_steps": 9134, "loss": 0.8966, "learning_rate": 9.592096174490195e-07, "epoch": 0.9114644626289717, "percentage": 91.15, "elapsed_time": "6 days, 8:28:25", "remaining_time": "14:47:48", "throughput": 2739.53, "total_tokens": 1503744256} {"current_steps": 8327, "total_steps": 9134, "loss": 0.8747, "learning_rate": 9.56852058945637e-07, "epoch": 0.9115739346999097, "percentage": 91.16, "elapsed_time": "6 days, 8:29:27", "remaining_time": "14:46:42", "throughput": 2739.55, "total_tokens": 1503922784} {"current_steps": 8328, "total_steps": 9134, "loss": 0.9247, "learning_rate": 9.544973447006888e-07, "epoch": 0.9116834067708476, "percentage": 91.18, "elapsed_time": "6 days, 8:30:29", "remaining_time": "14:45:36", "throughput": 2739.52, "total_tokens": 1504076896} {"current_steps": 8329, "total_steps": 9134, "loss": 1.1011, "learning_rate": 9.521454749927411e-07, "epoch": 0.9117928788417855, "percentage": 91.19, "elapsed_time": "6 days, 8:31:34", "remaining_time": "14:44:30", "throughput": 2739.56, "total_tokens": 1504278048} {"current_steps": 8330, "total_steps": 9134, "loss": 0.8944, "learning_rate": 9.497964501000128e-07, "epoch": 0.9119023509127234, "percentage": 91.2, "elapsed_time": "6 days, 8:32:41", "remaining_time": "14:43:24", "throughput": 2739.6, "total_tokens": 1504480320} {"current_steps": 8331, "total_steps": 9134, "loss": 1.0168, "learning_rate": 9.474502703003901e-07, "epoch": 0.9120118229836613, "percentage": 91.21, "elapsed_time": "6 days, 8:33:42", "remaining_time": "14:42:17", "throughput": 2739.59, "total_tokens": 1504642944} {"current_steps": 8332, "total_steps": 9134, "loss": 1.0183, "learning_rate": 9.451069358714177e-07, "epoch": 0.9121212950545992, "percentage": 91.22, "elapsed_time": "6 days, 8:34:46", "remaining_time": "14:41:11", "throughput": 2739.59, "total_tokens": 1504822368} {"current_steps": 8333, "total_steps": 9134, "loss": 0.8239, "learning_rate": 9.427664470903097e-07, "epoch": 0.9122307671255371, "percentage": 91.23, "elapsed_time": "6 days, 8:35:51", "remaining_time": "14:40:05", "throughput": 2739.62, "total_tokens": 1505012320} {"current_steps": 8334, "total_steps": 9134, "loss": 1.2347, "learning_rate": 9.40428804233942e-07, "epoch": 0.912340239196475, "percentage": 91.24, "elapsed_time": "6 days, 8:36:53", "remaining_time": "14:38:59", "throughput": 2739.63, "total_tokens": 1505191072} {"current_steps": 8335, "total_steps": 9134, "loss": 0.6422, "learning_rate": 9.380940075788491e-07, "epoch": 0.9124497112674129, "percentage": 91.25, "elapsed_time": "6 days, 8:38:00", "remaining_time": "14:37:53", "throughput": 2739.65, "total_tokens": 1505385952} {"current_steps": 8336, "total_steps": 9134, "loss": 1.0457, "learning_rate": 9.357620574012432e-07, "epoch": 0.9125591833383508, "percentage": 91.26, "elapsed_time": "6 days, 8:39:02", "remaining_time": "14:36:47", "throughput": 2739.64, "total_tokens": 1505547680} {"current_steps": 8337, "total_steps": 9134, "loss": 0.9652, "learning_rate": 9.33432953976976e-07, "epoch": 0.9126686554092887, "percentage": 91.27, "elapsed_time": "6 days, 8:40:04", "remaining_time": "14:35:41", "throughput": 2739.63, "total_tokens": 1505712992} {"current_steps": 8338, "total_steps": 9134, "loss": 0.9688, "learning_rate": 9.311066975815852e-07, "epoch": 0.9127781274802266, "percentage": 91.29, "elapsed_time": "6 days, 8:41:11", "remaining_time": "14:34:35", "throughput": 2739.68, "total_tokens": 1505925344} {"current_steps": 8339, "total_steps": 9134, "loss": 0.7433, "learning_rate": 9.28783288490262e-07, "epoch": 0.9128875995511645, "percentage": 91.3, "elapsed_time": "6 days, 8:42:15", "remaining_time": "14:33:29", "throughput": 2739.72, "total_tokens": 1506120672} {"current_steps": 8340, "total_steps": 9134, "loss": 1.1451, "learning_rate": 9.264627269778586e-07, "epoch": 0.9129970716221024, "percentage": 91.31, "elapsed_time": "6 days, 8:43:17", "remaining_time": "14:32:22", "throughput": 2739.69, "total_tokens": 1506277920} {"current_steps": 8341, "total_steps": 9134, "loss": 0.9105, "learning_rate": 9.241450133188944e-07, "epoch": 0.9131065436930403, "percentage": 91.32, "elapsed_time": "6 days, 8:44:20", "remaining_time": "14:31:16", "throughput": 2739.7, "total_tokens": 1506451968} {"current_steps": 8342, "total_steps": 9134, "loss": 0.8518, "learning_rate": 9.218301477875474e-07, "epoch": 0.9132160157639783, "percentage": 91.33, "elapsed_time": "6 days, 8:45:22", "remaining_time": "14:30:10", "throughput": 2739.7, "total_tokens": 1506626016} {"current_steps": 8343, "total_steps": 9134, "loss": 0.8852, "learning_rate": 9.195181306576678e-07, "epoch": 0.9133254878349161, "percentage": 91.34, "elapsed_time": "6 days, 8:46:26", "remaining_time": "14:29:04", "throughput": 2739.7, "total_tokens": 1506797824} {"current_steps": 8344, "total_steps": 9134, "loss": 0.8781, "learning_rate": 9.172089622027563e-07, "epoch": 0.913434959905854, "percentage": 91.35, "elapsed_time": "6 days, 8:47:31", "remaining_time": "14:27:58", "throughput": 2739.75, "total_tokens": 1507004352} {"current_steps": 8345, "total_steps": 9134, "loss": 0.9618, "learning_rate": 9.149026426959889e-07, "epoch": 0.9135444319767919, "percentage": 91.36, "elapsed_time": "6 days, 8:48:34", "remaining_time": "14:26:52", "throughput": 2739.77, "total_tokens": 1507185568} {"current_steps": 8346, "total_steps": 9134, "loss": 0.8454, "learning_rate": 9.125991724101918e-07, "epoch": 0.9136539040477298, "percentage": 91.37, "elapsed_time": "6 days, 8:49:38", "remaining_time": "14:25:45", "throughput": 2739.76, "total_tokens": 1507356256} {"current_steps": 8347, "total_steps": 9134, "loss": 0.9125, "learning_rate": 9.102985516178692e-07, "epoch": 0.9137633761186678, "percentage": 91.38, "elapsed_time": "6 days, 8:50:45", "remaining_time": "14:24:40", "throughput": 2739.8, "total_tokens": 1507563456} {"current_steps": 8348, "total_steps": 9134, "loss": 1.083, "learning_rate": 9.080007805911728e-07, "epoch": 0.9138728481896057, "percentage": 91.39, "elapsed_time": "6 days, 8:51:53", "remaining_time": "14:23:34", "throughput": 2739.86, "total_tokens": 1507779392} {"current_steps": 8349, "total_steps": 9134, "loss": 1.0887, "learning_rate": 9.057058596019325e-07, "epoch": 0.9139823202605435, "percentage": 91.41, "elapsed_time": "6 days, 8:53:00", "remaining_time": "14:22:28", "throughput": 2739.84, "total_tokens": 1507956128} {"current_steps": 8350, "total_steps": 9134, "loss": 0.9039, "learning_rate": 9.034137889216255e-07, "epoch": 0.9140917923314814, "percentage": 91.42, "elapsed_time": "6 days, 8:54:03", "remaining_time": "14:21:22", "throughput": 2739.84, "total_tokens": 1508125472} {"current_steps": 8351, "total_steps": 9134, "loss": 0.9551, "learning_rate": 9.011245688214015e-07, "epoch": 0.9142012644024193, "percentage": 91.43, "elapsed_time": "6 days, 8:55:08", "remaining_time": "14:20:16", "throughput": 2739.82, "total_tokens": 1508293696} {"current_steps": 8352, "total_steps": 9134, "loss": 0.9495, "learning_rate": 8.988381995720746e-07, "epoch": 0.9143107364733573, "percentage": 91.44, "elapsed_time": "6 days, 8:56:15", "remaining_time": "14:19:10", "throughput": 2739.84, "total_tokens": 1508488800} {"current_steps": 8353, "total_steps": 9134, "loss": 0.8581, "learning_rate": 8.965546814441117e-07, "epoch": 0.9144202085442952, "percentage": 91.45, "elapsed_time": "6 days, 8:57:21", "remaining_time": "14:18:04", "throughput": 2739.84, "total_tokens": 1508669120} {"current_steps": 8354, "total_steps": 9134, "loss": 0.8787, "learning_rate": 8.942740147076551e-07, "epoch": 0.914529680615233, "percentage": 91.46, "elapsed_time": "6 days, 8:58:23", "remaining_time": "14:16:58", "throughput": 2739.8, "total_tokens": 1508819200} {"current_steps": 8355, "total_steps": 9134, "loss": 1.0021, "learning_rate": 8.919961996324999e-07, "epoch": 0.9146391526861709, "percentage": 91.47, "elapsed_time": "6 days, 8:59:26", "remaining_time": "14:15:52", "throughput": 2739.82, "total_tokens": 1509002656} {"current_steps": 8356, "total_steps": 9134, "loss": 0.7413, "learning_rate": 8.897212364881058e-07, "epoch": 0.9147486247571088, "percentage": 91.48, "elapsed_time": "6 days, 9:00:28", "remaining_time": "14:14:45", "throughput": 2739.84, "total_tokens": 1509179616} {"current_steps": 8357, "total_steps": 9134, "loss": 1.1203, "learning_rate": 8.87449125543599e-07, "epoch": 0.9148580968280468, "percentage": 91.49, "elapsed_time": "6 days, 9:01:36", "remaining_time": "14:13:40", "throughput": 2739.87, "total_tokens": 1509385920} {"current_steps": 8358, "total_steps": 9134, "loss": 0.9004, "learning_rate": 8.851798670677674e-07, "epoch": 0.9149675688989847, "percentage": 91.5, "elapsed_time": "6 days, 9:02:37", "remaining_time": "14:12:33", "throughput": 2739.87, "total_tokens": 1509549216} {"current_steps": 8359, "total_steps": 9134, "loss": 0.8603, "learning_rate": 8.829134613290574e-07, "epoch": 0.9150770409699226, "percentage": 91.52, "elapsed_time": "6 days, 9:03:40", "remaining_time": "14:11:27", "throughput": 2739.87, "total_tokens": 1509726624} {"current_steps": 8360, "total_steps": 9134, "loss": 0.8909, "learning_rate": 8.806499085955794e-07, "epoch": 0.9151865130408604, "percentage": 91.53, "elapsed_time": "6 days, 9:04:43", "remaining_time": "14:10:21", "throughput": 2739.88, "total_tokens": 1509904480} {"current_steps": 8361, "total_steps": 9134, "loss": 0.8662, "learning_rate": 8.783892091351053e-07, "epoch": 0.9152959851117983, "percentage": 91.54, "elapsed_time": "6 days, 9:05:45", "remaining_time": "14:09:15", "throughput": 2739.83, "total_tokens": 1510045152} {"current_steps": 8362, "total_steps": 9134, "loss": 0.9722, "learning_rate": 8.761313632150797e-07, "epoch": 0.9154054571827362, "percentage": 91.55, "elapsed_time": "6 days, 9:06:49", "remaining_time": "14:08:09", "throughput": 2739.84, "total_tokens": 1510227936} {"current_steps": 8363, "total_steps": 9134, "loss": 0.9622, "learning_rate": 8.738763711025971e-07, "epoch": 0.9155149292536742, "percentage": 91.56, "elapsed_time": "6 days, 9:07:54", "remaining_time": "14:07:02", "throughput": 2739.83, "total_tokens": 1510399968} {"current_steps": 8364, "total_steps": 9134, "loss": 0.576, "learning_rate": 8.716242330644164e-07, "epoch": 0.9156244013246121, "percentage": 91.57, "elapsed_time": "6 days, 9:08:57", "remaining_time": "14:05:56", "throughput": 2739.88, "total_tokens": 1510596192} {"current_steps": 8365, "total_steps": 9134, "loss": 0.9965, "learning_rate": 8.693749493669662e-07, "epoch": 0.91573387339555, "percentage": 91.58, "elapsed_time": "6 days, 9:10:02", "remaining_time": "14:04:50", "throughput": 2739.9, "total_tokens": 1510784800} {"current_steps": 8366, "total_steps": 9134, "loss": 0.8559, "learning_rate": 8.671285202763252e-07, "epoch": 0.9158433454664878, "percentage": 91.59, "elapsed_time": "6 days, 9:11:03", "remaining_time": "14:03:44", "throughput": 2739.87, "total_tokens": 1510939584} {"current_steps": 8367, "total_steps": 9134, "loss": 0.8519, "learning_rate": 8.648849460582503e-07, "epoch": 0.9159528175374257, "percentage": 91.6, "elapsed_time": "6 days, 9:12:03", "remaining_time": "14:02:37", "throughput": 2739.83, "total_tokens": 1511079808} {"current_steps": 8368, "total_steps": 9134, "loss": 1.038, "learning_rate": 8.626442269781432e-07, "epoch": 0.9160622896083637, "percentage": 91.61, "elapsed_time": "6 days, 9:13:08", "remaining_time": "14:01:31", "throughput": 2739.87, "total_tokens": 1511282976} {"current_steps": 8369, "total_steps": 9134, "loss": 0.8502, "learning_rate": 8.604063633010862e-07, "epoch": 0.9161717616793016, "percentage": 91.62, "elapsed_time": "6 days, 9:14:14", "remaining_time": "14:00:26", "throughput": 2739.9, "total_tokens": 1511478304} {"current_steps": 8370, "total_steps": 9134, "loss": 0.8015, "learning_rate": 8.581713552918064e-07, "epoch": 0.9162812337502395, "percentage": 91.64, "elapsed_time": "6 days, 9:15:16", "remaining_time": "13:59:19", "throughput": 2739.9, "total_tokens": 1511651456} {"current_steps": 8371, "total_steps": 9134, "loss": 1.0392, "learning_rate": 8.559392032147034e-07, "epoch": 0.9163907058211773, "percentage": 91.65, "elapsed_time": "6 days, 9:16:22", "remaining_time": "13:58:13", "throughput": 2739.87, "total_tokens": 1511812512} {"current_steps": 8372, "total_steps": 9134, "loss": 0.8304, "learning_rate": 8.537099073338384e-07, "epoch": 0.9165001778921152, "percentage": 91.66, "elapsed_time": "6 days, 9:17:26", "remaining_time": "13:57:07", "throughput": 2739.88, "total_tokens": 1511992384} {"current_steps": 8373, "total_steps": 9134, "loss": 1.1033, "learning_rate": 8.514834679129336e-07, "epoch": 0.9166096499630532, "percentage": 91.67, "elapsed_time": "6 days, 9:18:34", "remaining_time": "13:56:02", "throughput": 2739.87, "total_tokens": 1512172480} {"current_steps": 8374, "total_steps": 9134, "loss": 0.6975, "learning_rate": 8.492598852153672e-07, "epoch": 0.9167191220339911, "percentage": 91.68, "elapsed_time": "6 days, 9:19:38", "remaining_time": "13:54:55", "throughput": 2739.86, "total_tokens": 1512342272} {"current_steps": 8375, "total_steps": 9134, "loss": 1.029, "learning_rate": 8.470391595041871e-07, "epoch": 0.916828594104929, "percentage": 91.69, "elapsed_time": "6 days, 9:20:44", "remaining_time": "13:53:50", "throughput": 2739.89, "total_tokens": 1512541632} {"current_steps": 8376, "total_steps": 9134, "loss": 0.9035, "learning_rate": 8.448212910421055e-07, "epoch": 0.9169380661758669, "percentage": 91.7, "elapsed_time": "6 days, 9:21:50", "remaining_time": "13:52:44", "throughput": 2739.92, "total_tokens": 1512737856} {"current_steps": 8377, "total_steps": 9134, "loss": 0.9798, "learning_rate": 8.426062800914846e-07, "epoch": 0.9170475382468047, "percentage": 91.71, "elapsed_time": "6 days, 9:22:55", "remaining_time": "13:51:38", "throughput": 2739.96, "total_tokens": 1512936096} {"current_steps": 8378, "total_steps": 9134, "loss": 0.8594, "learning_rate": 8.40394126914365e-07, "epoch": 0.9171570103177427, "percentage": 91.72, "elapsed_time": "6 days, 9:24:00", "remaining_time": "13:50:32", "throughput": 2739.93, "total_tokens": 1513101632} {"current_steps": 8379, "total_steps": 9134, "loss": 0.9631, "learning_rate": 8.381848317724289e-07, "epoch": 0.9172664823886806, "percentage": 91.73, "elapsed_time": "6 days, 9:25:03", "remaining_time": "13:49:25", "throughput": 2739.93, "total_tokens": 1513272544} {"current_steps": 8380, "total_steps": 9134, "loss": 0.9114, "learning_rate": 8.359783949270394e-07, "epoch": 0.9173759544596185, "percentage": 91.75, "elapsed_time": "6 days, 9:26:10", "remaining_time": "13:48:20", "throughput": 2739.92, "total_tokens": 1513452416} {"current_steps": 8381, "total_steps": 9134, "loss": 0.5996, "learning_rate": 8.337748166392129e-07, "epoch": 0.9174854265305564, "percentage": 91.76, "elapsed_time": "6 days, 9:27:11", "remaining_time": "13:47:13", "throughput": 2739.92, "total_tokens": 1513616160} {"current_steps": 8382, "total_steps": 9134, "loss": 0.9963, "learning_rate": 8.315740971696295e-07, "epoch": 0.9175948986014943, "percentage": 91.77, "elapsed_time": "6 days, 9:28:18", "remaining_time": "13:46:07", "throughput": 2739.93, "total_tokens": 1513805216} {"current_steps": 8383, "total_steps": 9134, "loss": 0.8812, "learning_rate": 8.293762367786257e-07, "epoch": 0.9177043706724322, "percentage": 91.78, "elapsed_time": "6 days, 9:29:20", "remaining_time": "13:45:01", "throughput": 2739.94, "total_tokens": 1513984416} {"current_steps": 8384, "total_steps": 9134, "loss": 0.717, "learning_rate": 8.271812357262043e-07, "epoch": 0.9178138427433701, "percentage": 91.79, "elapsed_time": "6 days, 9:30:21", "remaining_time": "13:43:55", "throughput": 2739.93, "total_tokens": 1514143232} {"current_steps": 8385, "total_steps": 9134, "loss": 0.7321, "learning_rate": 8.249890942720384e-07, "epoch": 0.917923314814308, "percentage": 91.8, "elapsed_time": "6 days, 9:31:25", "remaining_time": "13:42:49", "throughput": 2739.92, "total_tokens": 1514313024} {"current_steps": 8386, "total_steps": 9134, "loss": 0.8186, "learning_rate": 8.227998126754427e-07, "epoch": 0.9180327868852459, "percentage": 91.81, "elapsed_time": "6 days, 9:32:30", "remaining_time": "13:41:43", "throughput": 2739.95, "total_tokens": 1514509248} {"current_steps": 8387, "total_steps": 9134, "loss": 0.908, "learning_rate": 8.206133911954156e-07, "epoch": 0.9181422589561838, "percentage": 91.82, "elapsed_time": "6 days, 9:33:35", "remaining_time": "13:40:37", "throughput": 2739.94, "total_tokens": 1514681952} {"current_steps": 8388, "total_steps": 9134, "loss": 1.1958, "learning_rate": 8.184298300905946e-07, "epoch": 0.9182517310271217, "percentage": 91.83, "elapsed_time": "6 days, 9:34:42", "remaining_time": "13:39:31", "throughput": 2740.0, "total_tokens": 1514897440} {"current_steps": 8389, "total_steps": 9134, "loss": 0.9813, "learning_rate": 8.162491296193009e-07, "epoch": 0.9183612030980596, "percentage": 91.84, "elapsed_time": "6 days, 9:35:46", "remaining_time": "13:38:25", "throughput": 2740.02, "total_tokens": 1515083136} {"current_steps": 8390, "total_steps": 9134, "loss": 0.8221, "learning_rate": 8.140712900395031e-07, "epoch": 0.9184706751689975, "percentage": 91.85, "elapsed_time": "6 days, 9:36:47", "remaining_time": "13:37:19", "throughput": 2740.0, "total_tokens": 1515242848} {"current_steps": 8391, "total_steps": 9134, "loss": 0.781, "learning_rate": 8.118963116088369e-07, "epoch": 0.9185801472399354, "percentage": 91.87, "elapsed_time": "6 days, 9:37:49", "remaining_time": "13:36:12", "throughput": 2740.0, "total_tokens": 1515410624} {"current_steps": 8392, "total_steps": 9134, "loss": 0.9616, "learning_rate": 8.097241945845962e-07, "epoch": 0.9186896193108733, "percentage": 91.88, "elapsed_time": "6 days, 9:38:52", "remaining_time": "13:35:06", "throughput": 2740.01, "total_tokens": 1515586464} {"current_steps": 8393, "total_steps": 9134, "loss": 0.9637, "learning_rate": 8.075549392237369e-07, "epoch": 0.9187990913818113, "percentage": 91.89, "elapsed_time": "6 days, 9:39:54", "remaining_time": "13:34:00", "throughput": 2739.98, "total_tokens": 1515743488} {"current_steps": 8394, "total_steps": 9134, "loss": 0.7242, "learning_rate": 8.053885457828869e-07, "epoch": 0.9189085634527491, "percentage": 91.9, "elapsed_time": "6 days, 9:40:59", "remaining_time": "13:32:54", "throughput": 2740.01, "total_tokens": 1515936576} {"current_steps": 8395, "total_steps": 9134, "loss": 0.6952, "learning_rate": 8.032250145183134e-07, "epoch": 0.919018035523687, "percentage": 91.91, "elapsed_time": "6 days, 9:42:07", "remaining_time": "13:31:48", "throughput": 2740.03, "total_tokens": 1516131232} {"current_steps": 8396, "total_steps": 9134, "loss": 0.7914, "learning_rate": 8.010643456859645e-07, "epoch": 0.9191275075946249, "percentage": 91.92, "elapsed_time": "6 days, 9:43:13", "remaining_time": "13:30:42", "throughput": 2740.06, "total_tokens": 1516335296} {"current_steps": 8397, "total_steps": 9134, "loss": 0.8502, "learning_rate": 7.989065395414468e-07, "epoch": 0.9192369796655628, "percentage": 91.93, "elapsed_time": "6 days, 9:44:17", "remaining_time": "13:29:36", "throughput": 2740.09, "total_tokens": 1516523456} {"current_steps": 8398, "total_steps": 9134, "loss": 0.6692, "learning_rate": 7.967515963400202e-07, "epoch": 0.9193464517365008, "percentage": 91.94, "elapsed_time": "6 days, 9:45:21", "remaining_time": "13:28:30", "throughput": 2740.09, "total_tokens": 1516700416} {"current_steps": 8399, "total_steps": 9134, "loss": 1.1064, "learning_rate": 7.945995163366083e-07, "epoch": 0.9194559238074387, "percentage": 91.95, "elapsed_time": "6 days, 9:46:24", "remaining_time": "13:27:24", "throughput": 2740.08, "total_tokens": 1516869088} {"current_steps": 8400, "total_steps": 9134, "loss": 0.7076, "learning_rate": 7.924502997858018e-07, "epoch": 0.9195653958783765, "percentage": 91.96, "elapsed_time": "6 days, 9:47:27", "remaining_time": "13:26:18", "throughput": 2740.05, "total_tokens": 1517019616} {"current_steps": 8401, "total_steps": 9134, "loss": 1.1123, "learning_rate": 7.903039469418506e-07, "epoch": 0.9196748679493144, "percentage": 91.98, "elapsed_time": "6 days, 9:48:34", "remaining_time": "13:25:12", "throughput": 2740.08, "total_tokens": 1517222112} {"current_steps": 8402, "total_steps": 9134, "loss": 0.7529, "learning_rate": 7.881604580586593e-07, "epoch": 0.9197843400202523, "percentage": 91.99, "elapsed_time": "6 days, 9:49:36", "remaining_time": "13:24:06", "throughput": 2740.09, "total_tokens": 1517400640} {"current_steps": 8403, "total_steps": 9134, "loss": 1.0415, "learning_rate": 7.860198333897978e-07, "epoch": 0.9198938120911903, "percentage": 92.0, "elapsed_time": "6 days, 9:50:40", "remaining_time": "13:23:00", "throughput": 2740.1, "total_tokens": 1517576704} {"current_steps": 8404, "total_steps": 9134, "loss": 0.8858, "learning_rate": 7.838820731885021e-07, "epoch": 0.9200032841621282, "percentage": 92.01, "elapsed_time": "6 days, 9:51:44", "remaining_time": "13:21:53", "throughput": 2740.09, "total_tokens": 1517748064} {"current_steps": 8405, "total_steps": 9134, "loss": 1.0054, "learning_rate": 7.817471777076673e-07, "epoch": 0.920112756233066, "percentage": 92.02, "elapsed_time": "6 days, 9:52:51", "remaining_time": "13:20:48", "throughput": 2740.16, "total_tokens": 1517969376} {"current_steps": 8406, "total_steps": 9134, "loss": 0.9971, "learning_rate": 7.796151471998414e-07, "epoch": 0.9202222283040039, "percentage": 92.03, "elapsed_time": "6 days, 9:53:53", "remaining_time": "13:19:41", "throughput": 2740.17, "total_tokens": 1518148352} {"current_steps": 8407, "total_steps": 9134, "loss": 1.0098, "learning_rate": 7.77485981917242e-07, "epoch": 0.9203317003749418, "percentage": 92.04, "elapsed_time": "6 days, 9:54:58", "remaining_time": "13:18:35", "throughput": 2740.2, "total_tokens": 1518339424} {"current_steps": 8408, "total_steps": 9134, "loss": 0.908, "learning_rate": 7.753596821117426e-07, "epoch": 0.9204411724458798, "percentage": 92.05, "elapsed_time": "6 days, 9:56:05", "remaining_time": "13:17:30", "throughput": 2740.21, "total_tokens": 1518530272} {"current_steps": 8409, "total_steps": 9134, "loss": 0.8615, "learning_rate": 7.732362480348892e-07, "epoch": 0.9205506445168177, "percentage": 92.06, "elapsed_time": "6 days, 9:57:09", "remaining_time": "13:16:24", "throughput": 2740.22, "total_tokens": 1518710816} {"current_steps": 8410, "total_steps": 9134, "loss": 0.7845, "learning_rate": 7.7111567993787e-07, "epoch": 0.9206601165877556, "percentage": 92.07, "elapsed_time": "6 days, 9:58:08", "remaining_time": "13:15:17", "throughput": 2740.21, "total_tokens": 1518867616} {"current_steps": 8411, "total_steps": 9134, "loss": 0.999, "learning_rate": 7.689979780715534e-07, "epoch": 0.9207695886586934, "percentage": 92.08, "elapsed_time": "6 days, 9:59:09", "remaining_time": "13:14:11", "throughput": 2740.19, "total_tokens": 1519025984} {"current_steps": 8412, "total_steps": 9134, "loss": 0.8872, "learning_rate": 7.668831426864448e-07, "epoch": 0.9208790607296313, "percentage": 92.1, "elapsed_time": "6 days, 10:00:15", "remaining_time": "13:13:05", "throughput": 2740.23, "total_tokens": 1519221984} {"current_steps": 8413, "total_steps": 9134, "loss": 0.7102, "learning_rate": 7.647711740327412e-07, "epoch": 0.9209885328005692, "percentage": 92.11, "elapsed_time": "6 days, 10:01:18", "remaining_time": "13:11:59", "throughput": 2740.22, "total_tokens": 1519394464} {"current_steps": 8414, "total_steps": 9134, "loss": 0.9296, "learning_rate": 7.626620723602762e-07, "epoch": 0.9210980048715072, "percentage": 92.12, "elapsed_time": "6 days, 10:02:24", "remaining_time": "13:10:53", "throughput": 2740.24, "total_tokens": 1519583520} {"current_steps": 8415, "total_steps": 9134, "loss": 1.0464, "learning_rate": 7.605558379185556e-07, "epoch": 0.9212074769424451, "percentage": 92.13, "elapsed_time": "6 days, 10:03:29", "remaining_time": "13:09:47", "throughput": 2740.2, "total_tokens": 1519741888} {"current_steps": 8416, "total_steps": 9134, "loss": 0.9576, "learning_rate": 7.584524709567386e-07, "epoch": 0.921316949013383, "percentage": 92.14, "elapsed_time": "6 days, 10:04:31", "remaining_time": "13:08:41", "throughput": 2740.23, "total_tokens": 1519928032} {"current_steps": 8417, "total_steps": 9134, "loss": 0.9107, "learning_rate": 7.563519717236511e-07, "epoch": 0.9214264210843208, "percentage": 92.15, "elapsed_time": "6 days, 10:05:36", "remaining_time": "13:07:35", "throughput": 2740.26, "total_tokens": 1520122912} {"current_steps": 8418, "total_steps": 9134, "loss": 0.7846, "learning_rate": 7.54254340467786e-07, "epoch": 0.9215358931552587, "percentage": 92.16, "elapsed_time": "6 days, 10:06:37", "remaining_time": "13:06:28", "throughput": 2740.25, "total_tokens": 1520287552} {"current_steps": 8419, "total_steps": 9134, "loss": 1.1156, "learning_rate": 7.521595774372752e-07, "epoch": 0.9216453652261967, "percentage": 92.17, "elapsed_time": "6 days, 10:07:42", "remaining_time": "13:05:22", "throughput": 2740.26, "total_tokens": 1520464960} {"current_steps": 8420, "total_steps": 9134, "loss": 0.7549, "learning_rate": 7.500676828799402e-07, "epoch": 0.9217548372971346, "percentage": 92.18, "elapsed_time": "6 days, 10:08:46", "remaining_time": "13:04:16", "throughput": 2740.22, "total_tokens": 1520622208} {"current_steps": 8421, "total_steps": 9134, "loss": 1.1153, "learning_rate": 7.479786570432329e-07, "epoch": 0.9218643093680725, "percentage": 92.19, "elapsed_time": "6 days, 10:09:50", "remaining_time": "13:03:10", "throughput": 2740.26, "total_tokens": 1520815744} {"current_steps": 8422, "total_steps": 9134, "loss": 0.8271, "learning_rate": 7.458925001742917e-07, "epoch": 0.9219737814390103, "percentage": 92.2, "elapsed_time": "6 days, 10:10:57", "remaining_time": "13:02:04", "throughput": 2740.25, "total_tokens": 1520996288} {"current_steps": 8423, "total_steps": 9134, "loss": 0.7357, "learning_rate": 7.438092125199025e-07, "epoch": 0.9220832535099482, "percentage": 92.22, "elapsed_time": "6 days, 10:12:04", "remaining_time": "13:00:58", "throughput": 2740.26, "total_tokens": 1521183776} {"current_steps": 8424, "total_steps": 9134, "loss": 1.0724, "learning_rate": 7.417287943265128e-07, "epoch": 0.9221927255808862, "percentage": 92.23, "elapsed_time": "6 days, 10:13:10", "remaining_time": "12:59:53", "throughput": 2740.25, "total_tokens": 1521362528} {"current_steps": 8425, "total_steps": 9134, "loss": 0.6984, "learning_rate": 7.39651245840231e-07, "epoch": 0.9223021976518241, "percentage": 92.24, "elapsed_time": "6 days, 10:14:16", "remaining_time": "12:58:47", "throughput": 2740.25, "total_tokens": 1521540832} {"current_steps": 8426, "total_steps": 9134, "loss": 0.9409, "learning_rate": 7.375765673068275e-07, "epoch": 0.922411669722762, "percentage": 92.25, "elapsed_time": "6 days, 10:15:21", "remaining_time": "12:57:41", "throughput": 2740.27, "total_tokens": 1521728544} {"current_steps": 8427, "total_steps": 9134, "loss": 0.7307, "learning_rate": 7.355047589717418e-07, "epoch": 0.9225211417936999, "percentage": 92.26, "elapsed_time": "6 days, 10:16:27", "remaining_time": "12:56:35", "throughput": 2740.27, "total_tokens": 1521912896} {"current_steps": 8428, "total_steps": 9134, "loss": 1.0393, "learning_rate": 7.334358210800473e-07, "epoch": 0.9226306138646377, "percentage": 92.27, "elapsed_time": "6 days, 10:17:32", "remaining_time": "12:55:29", "throughput": 2740.31, "total_tokens": 1522110240} {"current_steps": 8429, "total_steps": 9134, "loss": 0.7603, "learning_rate": 7.313697538765124e-07, "epoch": 0.9227400859355757, "percentage": 92.28, "elapsed_time": "6 days, 10:18:36", "remaining_time": "12:54:23", "throughput": 2740.29, "total_tokens": 1522277120} {"current_steps": 8430, "total_steps": 9134, "loss": 0.7412, "learning_rate": 7.293065576055386e-07, "epoch": 0.9228495580065136, "percentage": 92.29, "elapsed_time": "6 days, 10:19:39", "remaining_time": "12:53:17", "throughput": 2740.31, "total_tokens": 1522459456} {"current_steps": 8431, "total_steps": 9134, "loss": 0.9742, "learning_rate": 7.272462325112056e-07, "epoch": 0.9229590300774515, "percentage": 92.3, "elapsed_time": "6 days, 10:20:46", "remaining_time": "12:52:11", "throughput": 2740.32, "total_tokens": 1522648736} {"current_steps": 8432, "total_steps": 9134, "loss": 0.8604, "learning_rate": 7.25188778837238e-07, "epoch": 0.9230685021483894, "percentage": 92.31, "elapsed_time": "6 days, 10:21:45", "remaining_time": "12:51:04", "throughput": 2740.31, "total_tokens": 1522807328} {"current_steps": 8433, "total_steps": 9134, "loss": 0.9193, "learning_rate": 7.231341968270328e-07, "epoch": 0.9231779742193273, "percentage": 92.33, "elapsed_time": "6 days, 10:22:50", "remaining_time": "12:49:58", "throughput": 2740.36, "total_tokens": 1523008704} {"current_steps": 8434, "total_steps": 9134, "loss": 0.863, "learning_rate": 7.210824867236427e-07, "epoch": 0.9232874462902652, "percentage": 92.34, "elapsed_time": "6 days, 10:23:57", "remaining_time": "12:48:53", "throughput": 2740.41, "total_tokens": 1523223744} {"current_steps": 8435, "total_steps": 9134, "loss": 1.314, "learning_rate": 7.190336487697791e-07, "epoch": 0.9233969183612031, "percentage": 92.35, "elapsed_time": "6 days, 10:25:04", "remaining_time": "12:47:47", "throughput": 2740.48, "total_tokens": 1523444608} {"current_steps": 8436, "total_steps": 9134, "loss": 0.7338, "learning_rate": 7.169876832078204e-07, "epoch": 0.923506390432141, "percentage": 92.36, "elapsed_time": "6 days, 10:26:09", "remaining_time": "12:46:41", "throughput": 2740.52, "total_tokens": 1523643296} {"current_steps": 8437, "total_steps": 9134, "loss": 0.623, "learning_rate": 7.14944590279798e-07, "epoch": 0.9236158625030789, "percentage": 92.37, "elapsed_time": "6 days, 10:27:09", "remaining_time": "12:45:34", "throughput": 2740.53, "total_tokens": 1523815552} {"current_steps": 8438, "total_steps": 9134, "loss": 0.7945, "learning_rate": 7.129043702274018e-07, "epoch": 0.9237253345740168, "percentage": 92.38, "elapsed_time": "6 days, 10:28:16", "remaining_time": "12:44:29", "throughput": 2740.59, "total_tokens": 1524033056} {"current_steps": 8439, "total_steps": 9134, "loss": 0.8372, "learning_rate": 7.108670232919946e-07, "epoch": 0.9238348066449547, "percentage": 92.39, "elapsed_time": "6 days, 10:29:18", "remaining_time": "12:43:22", "throughput": 2740.58, "total_tokens": 1524196352} {"current_steps": 8440, "total_steps": 9134, "loss": 0.873, "learning_rate": 7.088325497145832e-07, "epoch": 0.9239442787158926, "percentage": 92.4, "elapsed_time": "6 days, 10:30:22", "remaining_time": "12:42:16", "throughput": 2740.56, "total_tokens": 1524360096} {"current_steps": 8441, "total_steps": 9134, "loss": 0.9152, "learning_rate": 7.068009497358446e-07, "epoch": 0.9240537507868305, "percentage": 92.41, "elapsed_time": "6 days, 10:31:28", "remaining_time": "12:41:10", "throughput": 2740.57, "total_tokens": 1524548256} {"current_steps": 8442, "total_steps": 9134, "loss": 0.917, "learning_rate": 7.047722235961119e-07, "epoch": 0.9241632228577684, "percentage": 92.42, "elapsed_time": "6 days, 10:32:33", "remaining_time": "12:40:04", "throughput": 2740.6, "total_tokens": 1524739328} {"current_steps": 8443, "total_steps": 9134, "loss": 0.882, "learning_rate": 7.027463715353789e-07, "epoch": 0.9242726949287063, "percentage": 92.43, "elapsed_time": "6 days, 10:33:34", "remaining_time": "12:38:58", "throughput": 2740.6, "total_tokens": 1524908224} {"current_steps": 8444, "total_steps": 9134, "loss": 0.672, "learning_rate": 7.007233937933067e-07, "epoch": 0.9243821669996443, "percentage": 92.45, "elapsed_time": "6 days, 10:34:36", "remaining_time": "12:37:52", "throughput": 2740.59, "total_tokens": 1525072640} {"current_steps": 8445, "total_steps": 9134, "loss": 0.8003, "learning_rate": 6.987032906091983e-07, "epoch": 0.9244916390705821, "percentage": 92.46, "elapsed_time": "6 days, 10:35:41", "remaining_time": "12:36:46", "throughput": 2740.59, "total_tokens": 1525254976} {"current_steps": 8446, "total_steps": 9134, "loss": 1.0907, "learning_rate": 6.966860622220378e-07, "epoch": 0.92460111114152, "percentage": 92.47, "elapsed_time": "6 days, 10:36:48", "remaining_time": "12:35:40", "throughput": 2740.61, "total_tokens": 1525446272} {"current_steps": 8447, "total_steps": 9134, "loss": 0.9342, "learning_rate": 6.946717088704563e-07, "epoch": 0.9247105832124579, "percentage": 92.48, "elapsed_time": "6 days, 10:37:54", "remaining_time": "12:34:34", "throughput": 2740.66, "total_tokens": 1525654144} {"current_steps": 8448, "total_steps": 9134, "loss": 0.7745, "learning_rate": 6.926602307927494e-07, "epoch": 0.9248200552833958, "percentage": 92.49, "elapsed_time": "6 days, 10:38:57", "remaining_time": "12:33:28", "throughput": 2740.63, "total_tokens": 1525812960} {"current_steps": 8449, "total_steps": 9134, "loss": 0.825, "learning_rate": 6.906516282268682e-07, "epoch": 0.9249295273543338, "percentage": 92.5, "elapsed_time": "6 days, 10:39:59", "remaining_time": "12:32:22", "throughput": 2740.6, "total_tokens": 1525965056} {"current_steps": 8450, "total_steps": 9134, "loss": 0.8161, "learning_rate": 6.88645901410423e-07, "epoch": 0.9250389994252717, "percentage": 92.51, "elapsed_time": "6 days, 10:41:04", "remaining_time": "12:31:16", "throughput": 2740.65, "total_tokens": 1526169568} {"current_steps": 8451, "total_steps": 9134, "loss": 0.7019, "learning_rate": 6.866430505807014e-07, "epoch": 0.9251484714962095, "percentage": 92.52, "elapsed_time": "6 days, 10:42:08", "remaining_time": "12:30:10", "throughput": 2740.64, "total_tokens": 1526341152} {"current_steps": 8452, "total_steps": 9134, "loss": 0.6988, "learning_rate": 6.846430759746198e-07, "epoch": 0.9252579435671474, "percentage": 92.53, "elapsed_time": "6 days, 10:43:11", "remaining_time": "12:29:04", "throughput": 2740.64, "total_tokens": 1526513856} {"current_steps": 8453, "total_steps": 9134, "loss": 0.5826, "learning_rate": 6.826459778287858e-07, "epoch": 0.9253674156380853, "percentage": 92.54, "elapsed_time": "6 days, 10:44:14", "remaining_time": "12:27:58", "throughput": 2740.64, "total_tokens": 1526686784} {"current_steps": 8454, "total_steps": 9134, "loss": 1.0091, "learning_rate": 6.806517563794385e-07, "epoch": 0.9254768877090233, "percentage": 92.56, "elapsed_time": "6 days, 10:45:18", "remaining_time": "12:26:51", "throughput": 2740.66, "total_tokens": 1526872256} {"current_steps": 8455, "total_steps": 9134, "loss": 0.7468, "learning_rate": 6.786604118625029e-07, "epoch": 0.9255863597799612, "percentage": 92.57, "elapsed_time": "6 days, 10:46:18", "remaining_time": "12:25:45", "throughput": 2740.64, "total_tokens": 1527026592} {"current_steps": 8456, "total_steps": 9134, "loss": 0.8087, "learning_rate": 6.766719445135434e-07, "epoch": 0.925695831850899, "percentage": 92.58, "elapsed_time": "6 days, 10:47:23", "remaining_time": "12:24:39", "throughput": 2740.65, "total_tokens": 1527206240} {"current_steps": 8457, "total_steps": 9134, "loss": 0.9421, "learning_rate": 6.746863545677967e-07, "epoch": 0.9258053039218369, "percentage": 92.59, "elapsed_time": "6 days, 10:48:24", "remaining_time": "12:23:33", "throughput": 2740.6, "total_tokens": 1527348032} {"current_steps": 8458, "total_steps": 9134, "loss": 0.7819, "learning_rate": 6.727036422601529e-07, "epoch": 0.9259147759927748, "percentage": 92.6, "elapsed_time": "6 days, 10:49:27", "remaining_time": "12:22:27", "throughput": 2740.61, "total_tokens": 1527527232} {"current_steps": 8459, "total_steps": 9134, "loss": 0.8923, "learning_rate": 6.707238078251576e-07, "epoch": 0.9260242480637128, "percentage": 92.61, "elapsed_time": "6 days, 10:50:33", "remaining_time": "12:21:21", "throughput": 2740.62, "total_tokens": 1527710688} {"current_steps": 8460, "total_steps": 9134, "loss": 0.9081, "learning_rate": 6.687468514970319e-07, "epoch": 0.9261337201346507, "percentage": 92.62, "elapsed_time": "6 days, 10:51:35", "remaining_time": "12:20:15", "throughput": 2740.63, "total_tokens": 1527886080} {"current_steps": 8461, "total_steps": 9134, "loss": 0.7566, "learning_rate": 6.667727735096357e-07, "epoch": 0.9262431922055886, "percentage": 92.63, "elapsed_time": "6 days, 10:52:38", "remaining_time": "12:19:08", "throughput": 2740.63, "total_tokens": 1528058784} {"current_steps": 8462, "total_steps": 9134, "loss": 0.8383, "learning_rate": 6.648015740965074e-07, "epoch": 0.9263526642765264, "percentage": 92.64, "elapsed_time": "6 days, 10:53:40", "remaining_time": "12:18:02", "throughput": 2740.66, "total_tokens": 1528244928} {"current_steps": 8463, "total_steps": 9134, "loss": 0.7559, "learning_rate": 6.628332534908272e-07, "epoch": 0.9264621363474643, "percentage": 92.65, "elapsed_time": "6 days, 10:54:39", "remaining_time": "12:16:56", "throughput": 2740.64, "total_tokens": 1528400832} {"current_steps": 8464, "total_steps": 9134, "loss": 1.1642, "learning_rate": 6.608678119254502e-07, "epoch": 0.9265716084184022, "percentage": 92.66, "elapsed_time": "6 days, 10:55:45", "remaining_time": "12:15:50", "throughput": 2740.7, "total_tokens": 1528612960} {"current_steps": 8465, "total_steps": 9134, "loss": 0.7349, "learning_rate": 6.589052496328824e-07, "epoch": 0.9266810804893402, "percentage": 92.68, "elapsed_time": "6 days, 10:56:47", "remaining_time": "12:14:44", "throughput": 2740.68, "total_tokens": 1528769760} {"current_steps": 8466, "total_steps": 9134, "loss": 0.8504, "learning_rate": 6.569455668452934e-07, "epoch": 0.9267905525602781, "percentage": 92.69, "elapsed_time": "6 days, 10:57:53", "remaining_time": "12:13:38", "throughput": 2740.71, "total_tokens": 1528971360} {"current_steps": 8467, "total_steps": 9134, "loss": 0.8098, "learning_rate": 6.549887637945063e-07, "epoch": 0.926900024631216, "percentage": 92.7, "elapsed_time": "6 days, 10:58:58", "remaining_time": "12:12:32", "throughput": 2740.74, "total_tokens": 1529166240} {"current_steps": 8468, "total_steps": 9134, "loss": 0.7526, "learning_rate": 6.530348407120052e-07, "epoch": 0.9270094967021538, "percentage": 92.71, "elapsed_time": "6 days, 11:00:03", "remaining_time": "12:11:26", "throughput": 2740.73, "total_tokens": 1529336032} {"current_steps": 8469, "total_steps": 9134, "loss": 0.8906, "learning_rate": 6.510837978289414e-07, "epoch": 0.9271189687730917, "percentage": 92.72, "elapsed_time": "6 days, 11:01:09", "remaining_time": "12:10:20", "throughput": 2740.77, "total_tokens": 1529540544} {"current_steps": 8470, "total_steps": 9134, "loss": 0.9147, "learning_rate": 6.491356353761191e-07, "epoch": 0.9272284408440297, "percentage": 92.73, "elapsed_time": "6 days, 11:02:16", "remaining_time": "12:09:14", "throughput": 2740.83, "total_tokens": 1529755136} {"current_steps": 8471, "total_steps": 9134, "loss": 0.8517, "learning_rate": 6.471903535839985e-07, "epoch": 0.9273379129149676, "percentage": 92.74, "elapsed_time": "6 days, 11:03:21", "remaining_time": "12:08:08", "throughput": 2740.82, "total_tokens": 1529933664} {"current_steps": 8472, "total_steps": 9134, "loss": 0.821, "learning_rate": 6.452479526827065e-07, "epoch": 0.9274473849859055, "percentage": 92.75, "elapsed_time": "6 days, 11:04:24", "remaining_time": "12:07:02", "throughput": 2740.82, "total_tokens": 1530105472} {"current_steps": 8473, "total_steps": 9134, "loss": 0.9283, "learning_rate": 6.433084329020233e-07, "epoch": 0.9275568570568433, "percentage": 92.76, "elapsed_time": "6 days, 11:05:28", "remaining_time": "12:05:56", "throughput": 2740.83, "total_tokens": 1530281312} {"current_steps": 8474, "total_steps": 9134, "loss": 0.7355, "learning_rate": 6.413717944713876e-07, "epoch": 0.9276663291277812, "percentage": 92.77, "elapsed_time": "6 days, 11:06:22", "remaining_time": "12:04:49", "throughput": 2740.78, "total_tokens": 1530406080} {"current_steps": 8475, "total_steps": 9134, "loss": 0.6925, "learning_rate": 6.39438037619905e-07, "epoch": 0.9277758011987192, "percentage": 92.79, "elapsed_time": "6 days, 11:07:26", "remaining_time": "12:03:43", "throughput": 2740.77, "total_tokens": 1530575424} {"current_steps": 8476, "total_steps": 9134, "loss": 0.7625, "learning_rate": 6.375071625763285e-07, "epoch": 0.9278852732696571, "percentage": 92.8, "elapsed_time": "6 days, 11:08:28", "remaining_time": "12:02:37", "throughput": 2740.75, "total_tokens": 1530733344} {"current_steps": 8477, "total_steps": 9134, "loss": 1.1852, "learning_rate": 6.355791695690866e-07, "epoch": 0.927994745340595, "percentage": 92.81, "elapsed_time": "6 days, 11:09:31", "remaining_time": "12:01:31", "throughput": 2740.76, "total_tokens": 1530910976} {"current_steps": 8478, "total_steps": 9134, "loss": 0.8084, "learning_rate": 6.336540588262496e-07, "epoch": 0.9281042174115329, "percentage": 92.82, "elapsed_time": "6 days, 11:10:34", "remaining_time": "12:00:25", "throughput": 2740.79, "total_tokens": 1531099136} {"current_steps": 8479, "total_steps": 9134, "loss": 0.793, "learning_rate": 6.317318305755604e-07, "epoch": 0.9282136894824707, "percentage": 92.83, "elapsed_time": "6 days, 11:11:38", "remaining_time": "11:59:19", "throughput": 2740.81, "total_tokens": 1531284384} {"current_steps": 8480, "total_steps": 9134, "loss": 0.9664, "learning_rate": 6.298124850444093e-07, "epoch": 0.9283231615534087, "percentage": 92.84, "elapsed_time": "6 days, 11:12:45", "remaining_time": "11:58:13", "throughput": 2740.81, "total_tokens": 1531469856} {"current_steps": 8481, "total_steps": 9134, "loss": 0.8822, "learning_rate": 6.278960224598507e-07, "epoch": 0.9284326336243466, "percentage": 92.85, "elapsed_time": "6 days, 11:13:49", "remaining_time": "11:57:07", "throughput": 2740.82, "total_tokens": 1531652640} {"current_steps": 8482, "total_steps": 9134, "loss": 0.8781, "learning_rate": 6.259824430486061e-07, "epoch": 0.9285421056952845, "percentage": 92.86, "elapsed_time": "6 days, 11:14:53", "remaining_time": "11:56:01", "throughput": 2740.85, "total_tokens": 1531842368} {"current_steps": 8483, "total_steps": 9134, "loss": 0.8605, "learning_rate": 6.240717470370361e-07, "epoch": 0.9286515777662224, "percentage": 92.87, "elapsed_time": "6 days, 11:16:00", "remaining_time": "11:54:55", "throughput": 2740.89, "total_tokens": 1532052032} {"current_steps": 8484, "total_steps": 9134, "loss": 0.8176, "learning_rate": 6.221639346511876e-07, "epoch": 0.9287610498371603, "percentage": 92.88, "elapsed_time": "6 days, 11:17:04", "remaining_time": "11:53:49", "throughput": 2740.89, "total_tokens": 1532221376} {"current_steps": 8485, "total_steps": 9134, "loss": 0.8043, "learning_rate": 6.202590061167385e-07, "epoch": 0.9288705219080982, "percentage": 92.89, "elapsed_time": "6 days, 11:18:11", "remaining_time": "11:52:43", "throughput": 2740.92, "total_tokens": 1532422304} {"current_steps": 8486, "total_steps": 9134, "loss": 0.8283, "learning_rate": 6.183569616590446e-07, "epoch": 0.9289799939790361, "percentage": 92.91, "elapsed_time": "6 days, 11:19:16", "remaining_time": "11:51:37", "throughput": 2740.98, "total_tokens": 1532637120} {"current_steps": 8487, "total_steps": 9134, "loss": 0.7343, "learning_rate": 6.164578015031092e-07, "epoch": 0.929089466049974, "percentage": 92.92, "elapsed_time": "6 days, 11:20:18", "remaining_time": "11:50:31", "throughput": 2740.97, "total_tokens": 1532801984} {"current_steps": 8488, "total_steps": 9134, "loss": 1.006, "learning_rate": 6.145615258736054e-07, "epoch": 0.9291989381209119, "percentage": 92.93, "elapsed_time": "6 days, 11:21:24", "remaining_time": "11:49:25", "throughput": 2740.99, "total_tokens": 1532994848} {"current_steps": 8489, "total_steps": 9134, "loss": 1.0277, "learning_rate": 6.126681349948565e-07, "epoch": 0.9293084101918498, "percentage": 92.94, "elapsed_time": "6 days, 11:22:29", "remaining_time": "11:48:19", "throughput": 2741.02, "total_tokens": 1533185024} {"current_steps": 8490, "total_steps": 9134, "loss": 1.0418, "learning_rate": 6.107776290908418e-07, "epoch": 0.9294178822627877, "percentage": 92.95, "elapsed_time": "6 days, 11:23:31", "remaining_time": "11:47:13", "throughput": 2741.03, "total_tokens": 1533360864} {"current_steps": 8491, "total_steps": 9134, "loss": 0.7971, "learning_rate": 6.088900083852184e-07, "epoch": 0.9295273543337256, "percentage": 92.96, "elapsed_time": "6 days, 11:24:35", "remaining_time": "11:46:07", "throughput": 2741.04, "total_tokens": 1533542976} {"current_steps": 8492, "total_steps": 9134, "loss": 1.0393, "learning_rate": 6.070052731012688e-07, "epoch": 0.9296368264046635, "percentage": 92.97, "elapsed_time": "6 days, 11:25:39", "remaining_time": "11:45:01", "throughput": 2741.03, "total_tokens": 1533717248} {"current_steps": 8493, "total_steps": 9134, "loss": 0.9276, "learning_rate": 6.051234234619729e-07, "epoch": 0.9297462984756014, "percentage": 92.98, "elapsed_time": "6 days, 11:26:46", "remaining_time": "11:43:55", "throughput": 2741.07, "total_tokens": 1533922208} {"current_steps": 8494, "total_steps": 9134, "loss": 0.6549, "learning_rate": 6.032444596899333e-07, "epoch": 0.9298557705465393, "percentage": 92.99, "elapsed_time": "6 days, 11:27:49", "remaining_time": "11:42:49", "throughput": 2741.05, "total_tokens": 1534081696} {"current_steps": 8495, "total_steps": 9134, "loss": 0.8835, "learning_rate": 6.013683820074418e-07, "epoch": 0.9299652426174773, "percentage": 93.0, "elapsed_time": "6 days, 11:28:51", "remaining_time": "11:41:43", "throughput": 2741.04, "total_tokens": 1534246784} {"current_steps": 8496, "total_steps": 9134, "loss": 0.7314, "learning_rate": 5.99495190636426e-07, "epoch": 0.9300747146884151, "percentage": 93.02, "elapsed_time": "6 days, 11:29:55", "remaining_time": "11:40:37", "throughput": 2741.03, "total_tokens": 1534415904} {"current_steps": 8497, "total_steps": 9134, "loss": 0.7582, "learning_rate": 5.976248857984812e-07, "epoch": 0.930184186759353, "percentage": 93.03, "elapsed_time": "6 days, 11:31:02", "remaining_time": "11:39:31", "throughput": 2741.06, "total_tokens": 1534620192} {"current_steps": 8498, "total_steps": 9134, "loss": 0.7716, "learning_rate": 5.957574677148664e-07, "epoch": 0.9302936588302909, "percentage": 93.04, "elapsed_time": "6 days, 11:32:06", "remaining_time": "11:38:25", "throughput": 2741.07, "total_tokens": 1534799616} {"current_steps": 8499, "total_steps": 9134, "loss": 0.7782, "learning_rate": 5.938929366064882e-07, "epoch": 0.9304031309012288, "percentage": 93.05, "elapsed_time": "6 days, 11:33:11", "remaining_time": "11:37:19", "throughput": 2741.07, "total_tokens": 1534978816} {"current_steps": 8500, "total_steps": 9134, "loss": 0.8257, "learning_rate": 5.920312926939203e-07, "epoch": 0.9305126029721668, "percentage": 93.06, "elapsed_time": "6 days, 11:34:17", "remaining_time": "11:36:13", "throughput": 2741.13, "total_tokens": 1535190048} {"current_steps": 8501, "total_steps": 9134, "loss": 0.7596, "learning_rate": 5.901725361973864e-07, "epoch": 0.9306220750431047, "percentage": 93.07, "elapsed_time": "6 days, 11:35:22", "remaining_time": "11:35:07", "throughput": 2741.17, "total_tokens": 1535391648} {"current_steps": 8502, "total_steps": 9134, "loss": 1.1427, "learning_rate": 5.883166673367829e-07, "epoch": 0.9307315471140425, "percentage": 93.08, "elapsed_time": "6 days, 11:36:26", "remaining_time": "11:34:01", "throughput": 2741.19, "total_tokens": 1535575104} {"current_steps": 8503, "total_steps": 9134, "loss": 0.8961, "learning_rate": 5.864636863316453e-07, "epoch": 0.9308410191849804, "percentage": 93.09, "elapsed_time": "6 days, 11:37:30", "remaining_time": "11:32:55", "throughput": 2741.22, "total_tokens": 1535766400} {"current_steps": 8504, "total_steps": 9134, "loss": 0.9153, "learning_rate": 5.84613593401187e-07, "epoch": 0.9309504912559183, "percentage": 93.1, "elapsed_time": "6 days, 11:38:36", "remaining_time": "11:31:49", "throughput": 2741.21, "total_tokens": 1535944928} {"current_steps": 8505, "total_steps": 9134, "loss": 1.0147, "learning_rate": 5.827663887642665e-07, "epoch": 0.9310599633268563, "percentage": 93.11, "elapsed_time": "6 days, 11:39:41", "remaining_time": "11:30:43", "throughput": 2741.21, "total_tokens": 1536123232} {"current_steps": 8506, "total_steps": 9134, "loss": 0.9718, "learning_rate": 5.809220726394032e-07, "epoch": 0.9311694353977942, "percentage": 93.12, "elapsed_time": "6 days, 11:40:44", "remaining_time": "11:29:37", "throughput": 2741.22, "total_tokens": 1536305120} {"current_steps": 8507, "total_steps": 9134, "loss": 0.7181, "learning_rate": 5.790806452447756e-07, "epoch": 0.931278907468732, "percentage": 93.14, "elapsed_time": "6 days, 11:41:49", "remaining_time": "11:28:31", "throughput": 2741.24, "total_tokens": 1536491040} {"current_steps": 8508, "total_steps": 9134, "loss": 0.7907, "learning_rate": 5.772421067982259e-07, "epoch": 0.9313883795396699, "percentage": 93.15, "elapsed_time": "6 days, 11:42:53", "remaining_time": "11:27:25", "throughput": 2741.27, "total_tokens": 1536681216} {"current_steps": 8509, "total_steps": 9134, "loss": 0.9292, "learning_rate": 5.754064575172441e-07, "epoch": 0.9314978516106078, "percentage": 93.16, "elapsed_time": "6 days, 11:43:57", "remaining_time": "11:26:19", "throughput": 2741.3, "total_tokens": 1536875648} {"current_steps": 8510, "total_steps": 9134, "loss": 1.0131, "learning_rate": 5.735736976189871e-07, "epoch": 0.9316073236815458, "percentage": 93.17, "elapsed_time": "6 days, 11:45:03", "remaining_time": "11:25:13", "throughput": 2741.3, "total_tokens": 1537057984} {"current_steps": 8511, "total_steps": 9134, "loss": 0.7645, "learning_rate": 5.717438273202674e-07, "epoch": 0.9317167957524837, "percentage": 93.18, "elapsed_time": "6 days, 11:46:10", "remaining_time": "11:24:08", "throughput": 2741.31, "total_tokens": 1537246816} {"current_steps": 8512, "total_steps": 9134, "loss": 0.909, "learning_rate": 5.699168468375538e-07, "epoch": 0.9318262678234216, "percentage": 93.19, "elapsed_time": "6 days, 11:47:12", "remaining_time": "11:23:01", "throughput": 2741.3, "total_tokens": 1537409440} {"current_steps": 8513, "total_steps": 9134, "loss": 0.8172, "learning_rate": 5.680927563869731e-07, "epoch": 0.9319357398943594, "percentage": 93.2, "elapsed_time": "6 days, 11:48:16", "remaining_time": "11:21:55", "throughput": 2741.3, "total_tokens": 1537586400} {"current_steps": 8514, "total_steps": 9134, "loss": 1.0101, "learning_rate": 5.662715561843141e-07, "epoch": 0.9320452119652973, "percentage": 93.21, "elapsed_time": "6 days, 11:49:21", "remaining_time": "11:20:49", "throughput": 2741.34, "total_tokens": 1537789120} {"current_steps": 8515, "total_steps": 9134, "loss": 0.8299, "learning_rate": 5.644532464450237e-07, "epoch": 0.9321546840362352, "percentage": 93.22, "elapsed_time": "6 days, 11:50:23", "remaining_time": "11:19:43", "throughput": 2741.33, "total_tokens": 1537951744} {"current_steps": 8516, "total_steps": 9134, "loss": 0.9206, "learning_rate": 5.626378273841965e-07, "epoch": 0.9322641561071732, "percentage": 93.23, "elapsed_time": "6 days, 11:51:31", "remaining_time": "11:18:37", "throughput": 2741.37, "total_tokens": 1538158048} {"current_steps": 8517, "total_steps": 9134, "loss": 0.7052, "learning_rate": 5.608252992166024e-07, "epoch": 0.9323736281781111, "percentage": 93.25, "elapsed_time": "6 days, 11:52:38", "remaining_time": "11:17:32", "throughput": 2741.43, "total_tokens": 1538376000} {"current_steps": 8518, "total_steps": 9134, "loss": 1.1166, "learning_rate": 5.590156621566506e-07, "epoch": 0.932483100249049, "percentage": 93.26, "elapsed_time": "6 days, 11:53:42", "remaining_time": "11:16:26", "throughput": 2741.47, "total_tokens": 1538572224} {"current_steps": 8519, "total_steps": 9134, "loss": 0.6626, "learning_rate": 5.572089164184253e-07, "epoch": 0.9325925723199868, "percentage": 93.27, "elapsed_time": "6 days, 11:54:49", "remaining_time": "11:15:20", "throughput": 2741.49, "total_tokens": 1538771136} {"current_steps": 8520, "total_steps": 9134, "loss": 0.9293, "learning_rate": 5.554050622156609e-07, "epoch": 0.9327020443909247, "percentage": 93.28, "elapsed_time": "6 days, 11:55:47", "remaining_time": "11:14:13", "throughput": 2741.45, "total_tokens": 1538905088} {"current_steps": 8521, "total_steps": 9134, "loss": 0.8047, "learning_rate": 5.536040997617453e-07, "epoch": 0.9328115164618627, "percentage": 93.29, "elapsed_time": "6 days, 11:56:49", "remaining_time": "11:13:07", "throughput": 2741.45, "total_tokens": 1539074208} {"current_steps": 8522, "total_steps": 9134, "loss": 0.875, "learning_rate": 5.518060292697302e-07, "epoch": 0.9329209885328006, "percentage": 93.3, "elapsed_time": "6 days, 11:57:54", "remaining_time": "11:12:01", "throughput": 2741.47, "total_tokens": 1539268192} {"current_steps": 8523, "total_steps": 9134, "loss": 0.8767, "learning_rate": 5.50010850952326e-07, "epoch": 0.9330304606037385, "percentage": 93.31, "elapsed_time": "6 days, 11:58:53", "remaining_time": "11:10:55", "throughput": 2741.45, "total_tokens": 1539418272} {"current_steps": 8524, "total_steps": 9134, "loss": 0.8176, "learning_rate": 5.482185650218991e-07, "epoch": 0.9331399326746763, "percentage": 93.32, "elapsed_time": "6 days, 12:00:00", "remaining_time": "11:09:49", "throughput": 2741.49, "total_tokens": 1539624128} {"current_steps": 8525, "total_steps": 9134, "loss": 1.0462, "learning_rate": 5.464291716904684e-07, "epoch": 0.9332494047456142, "percentage": 93.33, "elapsed_time": "6 days, 12:01:00", "remaining_time": "11:08:43", "throughput": 2741.5, "total_tokens": 1539795712} {"current_steps": 8526, "total_steps": 9134, "loss": 0.8196, "learning_rate": 5.446426711697233e-07, "epoch": 0.9333588768165522, "percentage": 93.34, "elapsed_time": "6 days, 12:02:07", "remaining_time": "11:07:37", "throughput": 2741.52, "total_tokens": 1539988800} {"current_steps": 8527, "total_steps": 9134, "loss": 0.7238, "learning_rate": 5.428590636709973e-07, "epoch": 0.9334683488874901, "percentage": 93.35, "elapsed_time": "6 days, 12:03:11", "remaining_time": "11:06:31", "throughput": 2741.55, "total_tokens": 1540177184} {"current_steps": 8528, "total_steps": 9134, "loss": 0.9734, "learning_rate": 5.41078349405294e-07, "epoch": 0.933577820958428, "percentage": 93.37, "elapsed_time": "6 days, 12:04:18", "remaining_time": "11:05:25", "throughput": 2741.58, "total_tokens": 1540381472} {"current_steps": 8529, "total_steps": 9134, "loss": 0.7023, "learning_rate": 5.393005285832586e-07, "epoch": 0.9336872930293659, "percentage": 93.38, "elapsed_time": "6 days, 12:05:23", "remaining_time": "11:04:19", "throughput": 2741.6, "total_tokens": 1540566048} {"current_steps": 8530, "total_steps": 9134, "loss": 0.7538, "learning_rate": 5.375256014152119e-07, "epoch": 0.9337967651003037, "percentage": 93.39, "elapsed_time": "6 days, 12:06:29", "remaining_time": "11:03:13", "throughput": 2741.6, "total_tokens": 1540751968} {"current_steps": 8531, "total_steps": 9134, "loss": 0.9848, "learning_rate": 5.35753568111122e-07, "epoch": 0.9339062371712417, "percentage": 93.4, "elapsed_time": "6 days, 12:07:36", "remaining_time": "11:02:08", "throughput": 2741.59, "total_tokens": 1540927360} {"current_steps": 8532, "total_steps": 9134, "loss": 1.1922, "learning_rate": 5.339844288806156e-07, "epoch": 0.9340157092421796, "percentage": 93.41, "elapsed_time": "6 days, 12:08:42", "remaining_time": "11:01:02", "throughput": 2741.62, "total_tokens": 1541126496} {"current_steps": 8533, "total_steps": 9134, "loss": 0.8993, "learning_rate": 5.322181839329865e-07, "epoch": 0.9341251813131175, "percentage": 93.42, "elapsed_time": "6 days, 12:09:48", "remaining_time": "10:59:56", "throughput": 2741.63, "total_tokens": 1541313984} {"current_steps": 8534, "total_steps": 9134, "loss": 0.8487, "learning_rate": 5.304548334771648e-07, "epoch": 0.9342346533840554, "percentage": 93.43, "elapsed_time": "6 days, 12:10:55", "remaining_time": "10:58:50", "throughput": 2741.59, "total_tokens": 1541473920} {"current_steps": 8535, "total_steps": 9134, "loss": 0.9311, "learning_rate": 5.28694377721764e-07, "epoch": 0.9343441254549933, "percentage": 93.44, "elapsed_time": "6 days, 12:12:01", "remaining_time": "10:57:44", "throughput": 2741.6, "total_tokens": 1541658720} {"current_steps": 8536, "total_steps": 9134, "loss": 0.9159, "learning_rate": 5.269368168750316e-07, "epoch": 0.9344535975259312, "percentage": 93.45, "elapsed_time": "6 days, 12:13:04", "remaining_time": "10:56:38", "throughput": 2741.57, "total_tokens": 1541818880} {"current_steps": 8537, "total_steps": 9134, "loss": 0.876, "learning_rate": 5.251821511448928e-07, "epoch": 0.9345630695968691, "percentage": 93.46, "elapsed_time": "6 days, 12:14:08", "remaining_time": "10:55:32", "throughput": 2741.57, "total_tokens": 1541990464} {"current_steps": 8538, "total_steps": 9134, "loss": 0.6961, "learning_rate": 5.234303807389151e-07, "epoch": 0.934672541667807, "percentage": 93.47, "elapsed_time": "6 days, 12:15:11", "remaining_time": "10:54:26", "throughput": 2741.55, "total_tokens": 1542149728} {"current_steps": 8539, "total_steps": 9134, "loss": 0.8403, "learning_rate": 5.216815058643353e-07, "epoch": 0.9347820137387449, "percentage": 93.49, "elapsed_time": "6 days, 12:16:15", "remaining_time": "10:53:20", "throughput": 2741.55, "total_tokens": 1542329152} {"current_steps": 8540, "total_steps": 9134, "loss": 0.6809, "learning_rate": 5.199355267280382e-07, "epoch": 0.9348914858096828, "percentage": 93.5, "elapsed_time": "6 days, 12:17:17", "remaining_time": "10:52:14", "throughput": 2741.53, "total_tokens": 1542488416} {"current_steps": 8541, "total_steps": 9134, "loss": 0.9135, "learning_rate": 5.181924435365693e-07, "epoch": 0.9350009578806207, "percentage": 93.51, "elapsed_time": "6 days, 12:18:20", "remaining_time": "10:51:08", "throughput": 2741.57, "total_tokens": 1542682176} {"current_steps": 8542, "total_steps": 9134, "loss": 0.9344, "learning_rate": 5.164522564961332e-07, "epoch": 0.9351104299515586, "percentage": 93.52, "elapsed_time": "6 days, 12:19:28", "remaining_time": "10:50:02", "throughput": 2741.58, "total_tokens": 1542872352} {"current_steps": 8543, "total_steps": 9134, "loss": 0.8241, "learning_rate": 5.147149658125877e-07, "epoch": 0.9352199020224965, "percentage": 93.53, "elapsed_time": "6 days, 12:20:29", "remaining_time": "10:48:56", "throughput": 2741.55, "total_tokens": 1543026240} {"current_steps": 8544, "total_steps": 9134, "loss": 0.9263, "learning_rate": 5.129805716914571e-07, "epoch": 0.9353293740934344, "percentage": 93.54, "elapsed_time": "6 days, 12:21:37", "remaining_time": "10:47:50", "throughput": 2741.59, "total_tokens": 1543232544} {"current_steps": 8545, "total_steps": 9134, "loss": 1.0197, "learning_rate": 5.112490743379133e-07, "epoch": 0.9354388461643723, "percentage": 93.55, "elapsed_time": "6 days, 12:22:40", "remaining_time": "10:46:44", "throughput": 2741.6, "total_tokens": 1543410624} {"current_steps": 8546, "total_steps": 9134, "loss": 0.863, "learning_rate": 5.095204739567899e-07, "epoch": 0.9355483182353103, "percentage": 93.56, "elapsed_time": "6 days, 12:23:45", "remaining_time": "10:45:38", "throughput": 2741.66, "total_tokens": 1543624544} {"current_steps": 8547, "total_steps": 9134, "loss": 0.8846, "learning_rate": 5.07794770752576e-07, "epoch": 0.9356577903062481, "percentage": 93.57, "elapsed_time": "6 days, 12:24:51", "remaining_time": "10:44:32", "throughput": 2741.7, "total_tokens": 1543827712} {"current_steps": 8548, "total_steps": 9134, "loss": 1.1799, "learning_rate": 5.060719649294194e-07, "epoch": 0.935767262377186, "percentage": 93.58, "elapsed_time": "6 days, 12:25:56", "remaining_time": "10:43:26", "throughput": 2741.68, "total_tokens": 1543996160} {"current_steps": 8549, "total_steps": 9134, "loss": 0.8553, "learning_rate": 5.043520566911264e-07, "epoch": 0.9358767344481239, "percentage": 93.6, "elapsed_time": "6 days, 12:27:03", "remaining_time": "10:42:20", "throughput": 2741.72, "total_tokens": 1544201344} {"current_steps": 8550, "total_steps": 9134, "loss": 0.9294, "learning_rate": 5.026350462411567e-07, "epoch": 0.9359862065190618, "percentage": 93.61, "elapsed_time": "6 days, 12:28:08", "remaining_time": "10:41:14", "throughput": 2741.76, "total_tokens": 1544402720} {"current_steps": 8551, "total_steps": 9134, "loss": 0.9125, "learning_rate": 5.009209337826254e-07, "epoch": 0.9360956785899998, "percentage": 93.62, "elapsed_time": "6 days, 12:29:12", "remaining_time": "10:40:08", "throughput": 2741.79, "total_tokens": 1544595584} {"current_steps": 8552, "total_steps": 9134, "loss": 0.7121, "learning_rate": 4.992097195183176e-07, "epoch": 0.9362051506609377, "percentage": 93.63, "elapsed_time": "6 days, 12:30:15", "remaining_time": "10:39:02", "throughput": 2741.77, "total_tokens": 1544752832} {"current_steps": 8553, "total_steps": 9134, "loss": 0.7835, "learning_rate": 4.975014036506631e-07, "epoch": 0.9363146227318755, "percentage": 93.64, "elapsed_time": "6 days, 12:31:17", "remaining_time": "10:37:56", "throughput": 2741.75, "total_tokens": 1544917696} {"current_steps": 8554, "total_steps": 9134, "loss": 0.9602, "learning_rate": 4.957959863817502e-07, "epoch": 0.9364240948028134, "percentage": 93.65, "elapsed_time": "6 days, 12:32:20", "remaining_time": "10:36:50", "throughput": 2741.77, "total_tokens": 1545098240} {"current_steps": 8555, "total_steps": 9134, "loss": 0.9899, "learning_rate": 4.940934679133286e-07, "epoch": 0.9365335668737513, "percentage": 93.66, "elapsed_time": "6 days, 12:33:27", "remaining_time": "10:35:44", "throughput": 2741.82, "total_tokens": 1545311712} {"current_steps": 8556, "total_steps": 9134, "loss": 0.8513, "learning_rate": 4.923938484468038e-07, "epoch": 0.9366430389446893, "percentage": 93.67, "elapsed_time": "6 days, 12:34:32", "remaining_time": "10:34:38", "throughput": 2741.85, "total_tokens": 1545507936} {"current_steps": 8557, "total_steps": 9134, "loss": 0.8305, "learning_rate": 4.906971281832346e-07, "epoch": 0.9367525110156272, "percentage": 93.68, "elapsed_time": "6 days, 12:35:34", "remaining_time": "10:33:32", "throughput": 2741.85, "total_tokens": 1545675712} {"current_steps": 8558, "total_steps": 9134, "loss": 0.723, "learning_rate": 4.890033073233408e-07, "epoch": 0.936861983086565, "percentage": 93.69, "elapsed_time": "6 days, 12:36:38", "remaining_time": "10:32:26", "throughput": 2741.83, "total_tokens": 1545842368} {"current_steps": 8559, "total_steps": 9134, "loss": 0.882, "learning_rate": 4.87312386067501e-07, "epoch": 0.9369714551575029, "percentage": 93.7, "elapsed_time": "6 days, 12:37:45", "remaining_time": "10:31:20", "throughput": 2741.85, "total_tokens": 1546033888} {"current_steps": 8560, "total_steps": 9134, "loss": 1.0436, "learning_rate": 4.856243646157415e-07, "epoch": 0.9370809272284408, "percentage": 93.72, "elapsed_time": "6 days, 12:38:51", "remaining_time": "10:30:15", "throughput": 2741.88, "total_tokens": 1546230784} {"current_steps": 8561, "total_steps": 9134, "loss": 1.016, "learning_rate": 4.83939243167758e-07, "epoch": 0.9371903992993788, "percentage": 93.73, "elapsed_time": "6 days, 12:39:57", "remaining_time": "10:29:09", "throughput": 2741.88, "total_tokens": 1546413120} {"current_steps": 8562, "total_steps": 9134, "loss": 0.7022, "learning_rate": 4.822570219228967e-07, "epoch": 0.9372998713703167, "percentage": 93.74, "elapsed_time": "6 days, 12:41:00", "remaining_time": "10:28:03", "throughput": 2741.86, "total_tokens": 1546574400} {"current_steps": 8563, "total_steps": 9134, "loss": 0.9933, "learning_rate": 4.805777010801593e-07, "epoch": 0.9374093434412546, "percentage": 93.75, "elapsed_time": "6 days, 12:42:03", "remaining_time": "10:26:57", "throughput": 2741.85, "total_tokens": 1546740832} {"current_steps": 8564, "total_steps": 9134, "loss": 0.7225, "learning_rate": 4.789012808382065e-07, "epoch": 0.9375188155121924, "percentage": 93.76, "elapsed_time": "6 days, 12:43:07", "remaining_time": "10:25:51", "throughput": 2741.83, "total_tokens": 1546906144} {"current_steps": 8565, "total_steps": 9134, "loss": 0.9981, "learning_rate": 4.772277613953546e-07, "epoch": 0.9376282875831303, "percentage": 93.77, "elapsed_time": "6 days, 12:44:10", "remaining_time": "10:24:44", "throughput": 2741.84, "total_tokens": 1547086912} {"current_steps": 8566, "total_steps": 9134, "loss": 0.8358, "learning_rate": 4.7555714294958144e-07, "epoch": 0.9377377596540682, "percentage": 93.78, "elapsed_time": "6 days, 12:45:17", "remaining_time": "10:23:39", "throughput": 2741.83, "total_tokens": 1547263424} {"current_steps": 8567, "total_steps": 9134, "loss": 0.8621, "learning_rate": 4.738894256985121e-07, "epoch": 0.9378472317250062, "percentage": 93.79, "elapsed_time": "6 days, 12:46:23", "remaining_time": "10:22:33", "throughput": 2741.81, "total_tokens": 1547436128} {"current_steps": 8568, "total_steps": 9134, "loss": 0.7605, "learning_rate": 4.722246098394417e-07, "epoch": 0.9379567037959441, "percentage": 93.8, "elapsed_time": "6 days, 12:47:31", "remaining_time": "10:21:27", "throughput": 2741.83, "total_tokens": 1547629888} {"current_steps": 8569, "total_steps": 9134, "loss": 0.8189, "learning_rate": 4.705626955693071e-07, "epoch": 0.938066175866882, "percentage": 93.81, "elapsed_time": "6 days, 12:48:34", "remaining_time": "10:20:21", "throughput": 2741.85, "total_tokens": 1547815584} {"current_steps": 8570, "total_steps": 9134, "loss": 0.6934, "learning_rate": 4.689036830847177e-07, "epoch": 0.9381756479378198, "percentage": 93.83, "elapsed_time": "6 days, 12:49:38", "remaining_time": "10:19:15", "throughput": 2741.82, "total_tokens": 1547976640} {"current_steps": 8571, "total_steps": 9134, "loss": 0.8402, "learning_rate": 4.67247572581922e-07, "epoch": 0.9382851200087577, "percentage": 93.84, "elapsed_time": "6 days, 12:50:42", "remaining_time": "10:18:09", "throughput": 2741.8, "total_tokens": 1548135680} {"current_steps": 8572, "total_steps": 9134, "loss": 0.7004, "learning_rate": 4.655943642568411e-07, "epoch": 0.9383945920796957, "percentage": 93.85, "elapsed_time": "6 days, 12:51:43", "remaining_time": "10:17:03", "throughput": 2741.8, "total_tokens": 1548304352} {"current_steps": 8573, "total_steps": 9134, "loss": 1.0581, "learning_rate": 4.639440583050464e-07, "epoch": 0.9385040641506336, "percentage": 93.86, "elapsed_time": "6 days, 12:52:50", "remaining_time": "10:15:57", "throughput": 2741.83, "total_tokens": 1548506624} {"current_steps": 8574, "total_steps": 9134, "loss": 1.0687, "learning_rate": 4.622966549217622e-07, "epoch": 0.9386135362215715, "percentage": 93.87, "elapsed_time": "6 days, 12:53:54", "remaining_time": "10:14:51", "throughput": 2741.83, "total_tokens": 1548682688} {"current_steps": 8575, "total_steps": 9134, "loss": 0.7917, "learning_rate": 4.606521543018799e-07, "epoch": 0.9387230082925093, "percentage": 93.88, "elapsed_time": "6 days, 12:54:58", "remaining_time": "10:13:45", "throughput": 2741.87, "total_tokens": 1548874208} {"current_steps": 8576, "total_steps": 9134, "loss": 0.8699, "learning_rate": 4.5901055663993274e-07, "epoch": 0.9388324803634472, "percentage": 93.89, "elapsed_time": "6 days, 12:56:03", "remaining_time": "10:12:39", "throughput": 2741.86, "total_tokens": 1549049600} {"current_steps": 8577, "total_steps": 9134, "loss": 0.8874, "learning_rate": 4.573718621301265e-07, "epoch": 0.9389419524343852, "percentage": 93.9, "elapsed_time": "6 days, 12:57:07", "remaining_time": "10:11:33", "throughput": 2741.9, "total_tokens": 1549249632} {"current_steps": 8578, "total_steps": 9134, "loss": 0.9138, "learning_rate": 4.557360709663061e-07, "epoch": 0.9390514245053231, "percentage": 93.91, "elapsed_time": "6 days, 12:58:15", "remaining_time": "10:10:27", "throughput": 2741.89, "total_tokens": 1549429280} {"current_steps": 8579, "total_steps": 9134, "loss": 1.1141, "learning_rate": 4.5410318334199175e-07, "epoch": 0.939160896576261, "percentage": 93.92, "elapsed_time": "6 days, 12:59:21", "remaining_time": "10:09:21", "throughput": 2741.88, "total_tokens": 1549606912} {"current_steps": 8580, "total_steps": 9134, "loss": 0.7208, "learning_rate": 4.524731994503456e-07, "epoch": 0.9392703686471989, "percentage": 93.93, "elapsed_time": "6 days, 13:00:27", "remaining_time": "10:08:16", "throughput": 2741.93, "total_tokens": 1549812544} {"current_steps": 8581, "total_steps": 9134, "loss": 0.669, "learning_rate": 4.50846119484194e-07, "epoch": 0.9393798407181367, "percentage": 93.95, "elapsed_time": "6 days, 13:01:34", "remaining_time": "10:07:10", "throughput": 2741.96, "total_tokens": 1550011456} {"current_steps": 8582, "total_steps": 9134, "loss": 0.7336, "learning_rate": 4.4922194363601343e-07, "epoch": 0.9394893127890747, "percentage": 93.96, "elapsed_time": "6 days, 13:02:41", "remaining_time": "10:06:04", "throughput": 2741.98, "total_tokens": 1550208128} {"current_steps": 8583, "total_steps": 9134, "loss": 0.7707, "learning_rate": 4.476006720979475e-07, "epoch": 0.9395987848600126, "percentage": 93.97, "elapsed_time": "6 days, 13:03:44", "remaining_time": "10:04:58", "throughput": 2741.98, "total_tokens": 1550384864} {"current_steps": 8584, "total_steps": 9134, "loss": 0.8883, "learning_rate": 4.459823050617845e-07, "epoch": 0.9397082569309505, "percentage": 93.98, "elapsed_time": "6 days, 13:04:48", "remaining_time": "10:03:52", "throughput": 2741.98, "total_tokens": 1550559584} {"current_steps": 8585, "total_steps": 9134, "loss": 0.9643, "learning_rate": 4.44366842718974e-07, "epoch": 0.9398177290018884, "percentage": 93.99, "elapsed_time": "6 days, 13:05:48", "remaining_time": "10:02:46", "throughput": 2741.94, "total_tokens": 1550698912} {"current_steps": 8586, "total_steps": 9134, "loss": 0.6882, "learning_rate": 4.4275428526062425e-07, "epoch": 0.9399272010728263, "percentage": 94.0, "elapsed_time": "6 days, 13:06:54", "remaining_time": "10:01:40", "throughput": 2741.95, "total_tokens": 1550888192} {"current_steps": 8587, "total_steps": 9134, "loss": 0.926, "learning_rate": 4.411446328774993e-07, "epoch": 0.9400366731437642, "percentage": 94.01, "elapsed_time": "6 days, 13:08:00", "remaining_time": "10:00:34", "throughput": 2741.96, "total_tokens": 1551073888} {"current_steps": 8588, "total_steps": 9134, "loss": 0.7265, "learning_rate": 4.3953788576001353e-07, "epoch": 0.9401461452147021, "percentage": 94.02, "elapsed_time": "6 days, 13:09:05", "remaining_time": "9:59:28", "throughput": 2741.96, "total_tokens": 1551250624} {"current_steps": 8589, "total_steps": 9134, "loss": 0.7611, "learning_rate": 4.3793404409824546e-07, "epoch": 0.94025561728564, "percentage": 94.03, "elapsed_time": "6 days, 13:10:11", "remaining_time": "9:58:22", "throughput": 2741.99, "total_tokens": 1551449088} {"current_steps": 8590, "total_steps": 9134, "loss": 0.8881, "learning_rate": 4.3633310808192385e-07, "epoch": 0.9403650893565779, "percentage": 94.04, "elapsed_time": "6 days, 13:11:14", "remaining_time": "9:57:16", "throughput": 2741.98, "total_tokens": 1551615072} {"current_steps": 8591, "total_steps": 9134, "loss": 0.757, "learning_rate": 4.347350779004389e-07, "epoch": 0.9404745614275158, "percentage": 94.06, "elapsed_time": "6 days, 13:12:18", "remaining_time": "9:56:10", "throughput": 2742.01, "total_tokens": 1551807936} {"current_steps": 8592, "total_steps": 9134, "loss": 0.6877, "learning_rate": 4.331399537428338e-07, "epoch": 0.9405840334984537, "percentage": 94.07, "elapsed_time": "6 days, 13:13:22", "remaining_time": "9:55:04", "throughput": 2742.02, "total_tokens": 1551994080} {"current_steps": 8593, "total_steps": 9134, "loss": 0.9182, "learning_rate": 4.3154773579780483e-07, "epoch": 0.9406935055693916, "percentage": 94.08, "elapsed_time": "6 days, 13:14:24", "remaining_time": "9:53:58", "throughput": 2742.0, "total_tokens": 1552151328} {"current_steps": 8594, "total_steps": 9134, "loss": 0.8199, "learning_rate": 4.2995842425371524e-07, "epoch": 0.9408029776403295, "percentage": 94.09, "elapsed_time": "6 days, 13:15:30", "remaining_time": "9:52:52", "throughput": 2742.0, "total_tokens": 1552328512} {"current_steps": 8595, "total_steps": 9134, "loss": 0.8618, "learning_rate": 4.283720192985757e-07, "epoch": 0.9409124497112674, "percentage": 94.1, "elapsed_time": "6 days, 13:16:33", "remaining_time": "9:51:46", "throughput": 2741.99, "total_tokens": 1552496064} {"current_steps": 8596, "total_steps": 9134, "loss": 1.074, "learning_rate": 4.267885211200501e-07, "epoch": 0.9410219217822053, "percentage": 94.11, "elapsed_time": "6 days, 13:17:37", "remaining_time": "9:50:40", "throughput": 2742.03, "total_tokens": 1552695424} {"current_steps": 8597, "total_steps": 9134, "loss": 0.919, "learning_rate": 4.25207929905469e-07, "epoch": 0.9411313938531433, "percentage": 94.12, "elapsed_time": "6 days, 13:18:42", "remaining_time": "9:49:34", "throughput": 2742.04, "total_tokens": 1552878880} {"current_steps": 8598, "total_steps": 9134, "loss": 0.6893, "learning_rate": 4.236302458418051e-07, "epoch": 0.9412408659240811, "percentage": 94.13, "elapsed_time": "6 days, 13:19:48", "remaining_time": "9:48:28", "throughput": 2742.05, "total_tokens": 1553065248} {"current_steps": 8599, "total_steps": 9134, "loss": 0.8205, "learning_rate": 4.2205546911570913e-07, "epoch": 0.941350337995019, "percentage": 94.14, "elapsed_time": "6 days, 13:20:48", "remaining_time": "9:47:22", "throughput": 2742.04, "total_tokens": 1553225408} {"current_steps": 8600, "total_steps": 9134, "loss": 0.8021, "learning_rate": 4.2048359991345986e-07, "epoch": 0.9414598100659569, "percentage": 94.15, "elapsed_time": "6 days, 13:21:52", "remaining_time": "9:46:16", "throughput": 2742.06, "total_tokens": 1553411552} {"current_steps": 8601, "total_steps": 9134, "loss": 0.8877, "learning_rate": 4.1891463842101685e-07, "epoch": 0.9415692821368948, "percentage": 94.16, "elapsed_time": "6 days, 13:22:57", "remaining_time": "9:45:10", "throughput": 2742.05, "total_tokens": 1553583584} {"current_steps": 8602, "total_steps": 9134, "loss": 0.7356, "learning_rate": 4.173485848239761e-07, "epoch": 0.9416787542078328, "percentage": 94.18, "elapsed_time": "6 days, 13:24:03", "remaining_time": "9:44:04", "throughput": 2742.11, "total_tokens": 1553795712} {"current_steps": 8603, "total_steps": 9134, "loss": 0.8512, "learning_rate": 4.157854393076088e-07, "epoch": 0.9417882262787707, "percentage": 94.19, "elapsed_time": "6 days, 13:25:06", "remaining_time": "9:42:58", "throughput": 2742.09, "total_tokens": 1553959456} {"current_steps": 8604, "total_steps": 9134, "loss": 0.5796, "learning_rate": 4.1422520205682547e-07, "epoch": 0.9418976983497085, "percentage": 94.2, "elapsed_time": "6 days, 13:26:07", "remaining_time": "9:41:52", "throughput": 2742.1, "total_tokens": 1554131488} {"current_steps": 8605, "total_steps": 9134, "loss": 0.7157, "learning_rate": 4.126678732562006e-07, "epoch": 0.9420071704206464, "percentage": 94.21, "elapsed_time": "6 days, 13:27:07", "remaining_time": "9:40:46", "throughput": 2742.05, "total_tokens": 1554267904} {"current_steps": 8606, "total_steps": 9134, "loss": 0.794, "learning_rate": 4.1111345308996185e-07, "epoch": 0.9421166424915843, "percentage": 94.22, "elapsed_time": "6 days, 13:28:13", "remaining_time": "9:39:40", "throughput": 2742.04, "total_tokens": 1554447328} {"current_steps": 8607, "total_steps": 9134, "loss": 0.7521, "learning_rate": 4.095619417419955e-07, "epoch": 0.9422261145625223, "percentage": 94.23, "elapsed_time": "6 days, 13:29:14", "remaining_time": "9:38:34", "throughput": 2742.02, "total_tokens": 1554598528} {"current_steps": 8608, "total_steps": 9134, "loss": 1.0468, "learning_rate": 4.080133393958463e-07, "epoch": 0.9423355866334602, "percentage": 94.24, "elapsed_time": "6 days, 13:30:21", "remaining_time": "9:37:28", "throughput": 2742.05, "total_tokens": 1554799232} {"current_steps": 8609, "total_steps": 9134, "loss": 1.1265, "learning_rate": 4.0646764623470113e-07, "epoch": 0.942445058704398, "percentage": 94.25, "elapsed_time": "6 days, 13:31:26", "remaining_time": "9:36:22", "throughput": 2742.07, "total_tokens": 1554991872} {"current_steps": 8610, "total_steps": 9134, "loss": 0.9153, "learning_rate": 4.049248624414248e-07, "epoch": 0.9425545307753359, "percentage": 94.26, "elapsed_time": "6 days, 13:32:28", "remaining_time": "9:35:16", "throughput": 2742.05, "total_tokens": 1555152032} {"current_steps": 8611, "total_steps": 9134, "loss": 1.1393, "learning_rate": 4.0338498819851577e-07, "epoch": 0.9426640028462738, "percentage": 94.27, "elapsed_time": "6 days, 13:33:34", "remaining_time": "9:34:10", "throughput": 2742.08, "total_tokens": 1555347360} {"current_steps": 8612, "total_steps": 9134, "loss": 0.9882, "learning_rate": 4.018480236881422e-07, "epoch": 0.9427734749172118, "percentage": 94.29, "elapsed_time": "6 days, 13:34:39", "remaining_time": "9:33:04", "throughput": 2742.12, "total_tokens": 1555545152} {"current_steps": 8613, "total_steps": 9134, "loss": 0.7905, "learning_rate": 4.003139690921254e-07, "epoch": 0.9428829469881497, "percentage": 94.3, "elapsed_time": "6 days, 13:35:39", "remaining_time": "9:31:58", "throughput": 2742.1, "total_tokens": 1555699040} {"current_steps": 8614, "total_steps": 9134, "loss": 1.1261, "learning_rate": 3.987828245919367e-07, "epoch": 0.9429924190590876, "percentage": 94.31, "elapsed_time": "6 days, 13:36:44", "remaining_time": "9:30:52", "throughput": 2742.11, "total_tokens": 1555886528} {"current_steps": 8615, "total_steps": 9134, "loss": 0.9953, "learning_rate": 3.972545903687119e-07, "epoch": 0.9431018911300254, "percentage": 94.32, "elapsed_time": "6 days, 13:37:50", "remaining_time": "9:29:46", "throughput": 2742.11, "total_tokens": 1556065952} {"current_steps": 8616, "total_steps": 9134, "loss": 0.6505, "learning_rate": 3.9572926660323695e-07, "epoch": 0.9432113632009633, "percentage": 94.33, "elapsed_time": "6 days, 13:38:50", "remaining_time": "9:28:40", "throughput": 2742.07, "total_tokens": 1556208416} {"current_steps": 8617, "total_steps": 9134, "loss": 0.8938, "learning_rate": 3.9420685347595634e-07, "epoch": 0.9433208352719012, "percentage": 94.34, "elapsed_time": "6 days, 13:39:58", "remaining_time": "9:27:34", "throughput": 2742.1, "total_tokens": 1556410464} {"current_steps": 8618, "total_steps": 9134, "loss": 0.8711, "learning_rate": 3.926873511669621e-07, "epoch": 0.9434303073428392, "percentage": 94.35, "elapsed_time": "6 days, 13:40:58", "remaining_time": "9:26:28", "throughput": 2742.07, "total_tokens": 1556560992} {"current_steps": 8619, "total_steps": 9134, "loss": 0.7365, "learning_rate": 3.91170759856016e-07, "epoch": 0.9435397794137771, "percentage": 94.36, "elapsed_time": "6 days, 13:42:03", "remaining_time": "9:25:22", "throughput": 2742.07, "total_tokens": 1556734368} {"current_steps": 8620, "total_steps": 9134, "loss": 0.8661, "learning_rate": 3.896570797225246e-07, "epoch": 0.943649251484715, "percentage": 94.37, "elapsed_time": "6 days, 13:43:04", "remaining_time": "9:24:16", "throughput": 2742.06, "total_tokens": 1556896320} {"current_steps": 8621, "total_steps": 9134, "loss": 0.8052, "learning_rate": 3.88146310945553e-07, "epoch": 0.9437587235556528, "percentage": 94.38, "elapsed_time": "6 days, 13:44:03", "remaining_time": "9:23:10", "throughput": 2742.01, "total_tokens": 1557033856} {"current_steps": 8622, "total_steps": 9134, "loss": 0.8734, "learning_rate": 3.86638453703822e-07, "epoch": 0.9438681956265907, "percentage": 94.39, "elapsed_time": "6 days, 13:45:10", "remaining_time": "9:22:04", "throughput": 2742.03, "total_tokens": 1557225376} {"current_steps": 8623, "total_steps": 9134, "loss": 1.0547, "learning_rate": 3.8513350817571124e-07, "epoch": 0.9439776676975287, "percentage": 94.41, "elapsed_time": "6 days, 13:46:15", "remaining_time": "9:20:58", "throughput": 2742.06, "total_tokens": 1557420928} {"current_steps": 8624, "total_steps": 9134, "loss": 0.8674, "learning_rate": 3.836314745392505e-07, "epoch": 0.9440871397684666, "percentage": 94.42, "elapsed_time": "6 days, 13:47:22", "remaining_time": "9:19:52", "throughput": 2742.09, "total_tokens": 1557622528} {"current_steps": 8625, "total_steps": 9134, "loss": 0.9329, "learning_rate": 3.8213235297212823e-07, "epoch": 0.9441966118394045, "percentage": 94.43, "elapsed_time": "6 days, 13:48:25", "remaining_time": "9:18:46", "throughput": 2742.12, "total_tokens": 1557815168} {"current_steps": 8626, "total_steps": 9134, "loss": 0.7863, "learning_rate": 3.806361436516831e-07, "epoch": 0.9443060839103423, "percentage": 94.44, "elapsed_time": "6 days, 13:49:29", "remaining_time": "9:17:40", "throughput": 2742.14, "total_tokens": 1558003104} {"current_steps": 8627, "total_steps": 9134, "loss": 0.768, "learning_rate": 3.7914284675492075e-07, "epoch": 0.9444155559812802, "percentage": 94.45, "elapsed_time": "6 days, 13:50:31", "remaining_time": "9:16:34", "throughput": 2742.13, "total_tokens": 1558161696} {"current_steps": 8628, "total_steps": 9134, "loss": 0.8753, "learning_rate": 3.7765246245849426e-07, "epoch": 0.9445250280522182, "percentage": 94.46, "elapsed_time": "6 days, 13:51:38", "remaining_time": "9:15:28", "throughput": 2742.18, "total_tokens": 1558373600} {"current_steps": 8629, "total_steps": 9134, "loss": 0.8266, "learning_rate": 3.761649909387099e-07, "epoch": 0.9446345001231561, "percentage": 94.47, "elapsed_time": "6 days, 13:52:44", "remaining_time": "9:14:22", "throughput": 2742.16, "total_tokens": 1558547872} {"current_steps": 8630, "total_steps": 9134, "loss": 0.837, "learning_rate": 3.746804323715353e-07, "epoch": 0.944743972194094, "percentage": 94.48, "elapsed_time": "6 days, 13:53:47", "remaining_time": "9:13:16", "throughput": 2742.15, "total_tokens": 1558713856} {"current_steps": 8631, "total_steps": 9134, "loss": 1.302, "learning_rate": 3.731987869325881e-07, "epoch": 0.9448534442650319, "percentage": 94.49, "elapsed_time": "6 days, 13:54:54", "remaining_time": "9:12:10", "throughput": 2742.16, "total_tokens": 1558902240} {"current_steps": 8632, "total_steps": 9134, "loss": 0.6936, "learning_rate": 3.7172005479714777e-07, "epoch": 0.9449629163359697, "percentage": 94.5, "elapsed_time": "6 days, 13:55:58", "remaining_time": "9:11:04", "throughput": 2742.14, "total_tokens": 1559067552} {"current_steps": 8633, "total_steps": 9134, "loss": 0.9548, "learning_rate": 3.7024423614014094e-07, "epoch": 0.9450723884069077, "percentage": 94.51, "elapsed_time": "6 days, 13:57:05", "remaining_time": "9:09:59", "throughput": 2742.16, "total_tokens": 1559262880} {"current_steps": 8634, "total_steps": 9134, "loss": 1.3285, "learning_rate": 3.6877133113616123e-07, "epoch": 0.9451818604778456, "percentage": 94.53, "elapsed_time": "6 days, 13:58:09", "remaining_time": "9:08:53", "throughput": 2742.18, "total_tokens": 1559447456} {"current_steps": 8635, "total_steps": 9134, "loss": 0.8459, "learning_rate": 3.673013399594444e-07, "epoch": 0.9452913325487835, "percentage": 94.54, "elapsed_time": "6 days, 13:59:11", "remaining_time": "9:07:47", "throughput": 2742.2, "total_tokens": 1559633376} {"current_steps": 8636, "total_steps": 9134, "loss": 0.929, "learning_rate": 3.658342627838873e-07, "epoch": 0.9454008046197214, "percentage": 94.55, "elapsed_time": "6 days, 14:00:13", "remaining_time": "9:06:40", "throughput": 2742.17, "total_tokens": 1559782336} {"current_steps": 8637, "total_steps": 9134, "loss": 0.9585, "learning_rate": 3.643700997830457e-07, "epoch": 0.9455102766906593, "percentage": 94.56, "elapsed_time": "6 days, 14:01:15", "remaining_time": "9:05:34", "throughput": 2742.16, "total_tokens": 1559946080} {"current_steps": 8638, "total_steps": 9134, "loss": 1.0131, "learning_rate": 3.6290885113012816e-07, "epoch": 0.9456197487615972, "percentage": 94.57, "elapsed_time": "6 days, 14:02:16", "remaining_time": "9:04:28", "throughput": 2742.13, "total_tokens": 1560093920} {"current_steps": 8639, "total_steps": 9134, "loss": 0.8744, "learning_rate": 3.614505169979909e-07, "epoch": 0.9457292208325351, "percentage": 94.58, "elapsed_time": "6 days, 14:03:20", "remaining_time": "9:03:22", "throughput": 2742.14, "total_tokens": 1560278272} {"current_steps": 8640, "total_steps": 9134, "loss": 0.8874, "learning_rate": 3.5999509755915985e-07, "epoch": 0.945838692903473, "percentage": 94.59, "elapsed_time": "6 days, 14:04:23", "remaining_time": "9:02:16", "throughput": 2742.16, "total_tokens": 1560461728} {"current_steps": 8641, "total_steps": 9134, "loss": 0.7381, "learning_rate": 3.585425929858055e-07, "epoch": 0.9459481649744109, "percentage": 94.6, "elapsed_time": "6 days, 14:05:28", "remaining_time": "9:01:10", "throughput": 2742.16, "total_tokens": 1560644960} {"current_steps": 8642, "total_steps": 9134, "loss": 0.732, "learning_rate": 3.570930034497516e-07, "epoch": 0.9460576370453488, "percentage": 94.61, "elapsed_time": "6 days, 14:06:36", "remaining_time": "9:00:05", "throughput": 2742.19, "total_tokens": 1560846784} {"current_steps": 8643, "total_steps": 9134, "loss": 0.7702, "learning_rate": 3.556463291224915e-07, "epoch": 0.9461671091162867, "percentage": 94.62, "elapsed_time": "6 days, 14:07:36", "remaining_time": "8:58:58", "throughput": 2742.19, "total_tokens": 1561011872} {"current_steps": 8644, "total_steps": 9134, "loss": 1.0645, "learning_rate": 3.54202570175155e-07, "epoch": 0.9462765811872246, "percentage": 94.64, "elapsed_time": "6 days, 14:08:43", "remaining_time": "8:57:53", "throughput": 2742.22, "total_tokens": 1561211904} {"current_steps": 8645, "total_steps": 9134, "loss": 0.6722, "learning_rate": 3.527617267785416e-07, "epoch": 0.9463860532581625, "percentage": 94.65, "elapsed_time": "6 days, 14:09:45", "remaining_time": "8:56:47", "throughput": 2742.21, "total_tokens": 1561375200} {"current_steps": 8646, "total_steps": 9134, "loss": 0.9221, "learning_rate": 3.513237991030982e-07, "epoch": 0.9464955253291004, "percentage": 94.66, "elapsed_time": "6 days, 14:10:46", "remaining_time": "8:55:40", "throughput": 2742.2, "total_tokens": 1561535136} {"current_steps": 8647, "total_steps": 9134, "loss": 1.0339, "learning_rate": 3.498887873189277e-07, "epoch": 0.9466049974000383, "percentage": 94.67, "elapsed_time": "6 days, 14:11:53", "remaining_time": "8:54:35", "throughput": 2742.22, "total_tokens": 1561729792} {"current_steps": 8648, "total_steps": 9134, "loss": 0.7969, "learning_rate": 3.484566915957943e-07, "epoch": 0.9467144694709763, "percentage": 94.68, "elapsed_time": "6 days, 14:12:58", "remaining_time": "8:53:29", "throughput": 2742.25, "total_tokens": 1561928256} {"current_steps": 8649, "total_steps": 9134, "loss": 0.9274, "learning_rate": 3.470275121031041e-07, "epoch": 0.9468239415419141, "percentage": 94.69, "elapsed_time": "6 days, 14:14:03", "remaining_time": "8:52:23", "throughput": 2742.22, "total_tokens": 1562086848} {"current_steps": 8650, "total_steps": 9134, "loss": 0.988, "learning_rate": 3.4560124900993305e-07, "epoch": 0.946933413612852, "percentage": 94.7, "elapsed_time": "6 days, 14:15:09", "remaining_time": "8:51:17", "throughput": 2742.25, "total_tokens": 1562287552} {"current_steps": 8651, "total_steps": 9134, "loss": 0.9888, "learning_rate": 3.441779024850017e-07, "epoch": 0.9470428856837899, "percentage": 94.71, "elapsed_time": "6 days, 14:16:13", "remaining_time": "8:50:11", "throughput": 2742.26, "total_tokens": 1562464960} {"current_steps": 8652, "total_steps": 9134, "loss": 0.7119, "learning_rate": 3.4275747269669203e-07, "epoch": 0.9471523577547278, "percentage": 94.72, "elapsed_time": "6 days, 14:17:13", "remaining_time": "8:49:05", "throughput": 2742.24, "total_tokens": 1562619520} {"current_steps": 8653, "total_steps": 9134, "loss": 1.0552, "learning_rate": 3.4133995981303624e-07, "epoch": 0.9472618298256658, "percentage": 94.73, "elapsed_time": "6 days, 14:18:20", "remaining_time": "8:47:59", "throughput": 2742.3, "total_tokens": 1562840832} {"current_steps": 8654, "total_steps": 9134, "loss": 1.2645, "learning_rate": 3.3992536400172246e-07, "epoch": 0.9473713018966037, "percentage": 94.74, "elapsed_time": "6 days, 14:19:23", "remaining_time": "8:46:53", "throughput": 2742.32, "total_tokens": 1563020256} {"current_steps": 8655, "total_steps": 9134, "loss": 0.7241, "learning_rate": 3.3851368543009745e-07, "epoch": 0.9474807739675415, "percentage": 94.76, "elapsed_time": "6 days, 14:20:29", "remaining_time": "8:45:47", "throughput": 2742.31, "total_tokens": 1563197888} {"current_steps": 8656, "total_steps": 9134, "loss": 0.8746, "learning_rate": 3.3710492426515804e-07, "epoch": 0.9475902460384794, "percentage": 94.77, "elapsed_time": "6 days, 14:21:34", "remaining_time": "8:44:41", "throughput": 2742.31, "total_tokens": 1563376192} {"current_steps": 8657, "total_steps": 9134, "loss": 0.7682, "learning_rate": 3.3569908067355993e-07, "epoch": 0.9476997181094173, "percentage": 94.78, "elapsed_time": "6 days, 14:22:39", "remaining_time": "8:43:35", "throughput": 2742.32, "total_tokens": 1563557184} {"current_steps": 8658, "total_steps": 9134, "loss": 0.7507, "learning_rate": 3.3429615482160893e-07, "epoch": 0.9478091901803553, "percentage": 94.79, "elapsed_time": "6 days, 14:23:42", "remaining_time": "8:42:29", "throughput": 2742.33, "total_tokens": 1563735488} {"current_steps": 8659, "total_steps": 9134, "loss": 0.7345, "learning_rate": 3.328961468752695e-07, "epoch": 0.9479186622512932, "percentage": 94.8, "elapsed_time": "6 days, 14:24:47", "remaining_time": "8:41:23", "throughput": 2742.32, "total_tokens": 1563909536} {"current_steps": 8660, "total_steps": 9134, "loss": 0.8257, "learning_rate": 3.3149905700016193e-07, "epoch": 0.948028134322231, "percentage": 94.81, "elapsed_time": "6 days, 14:25:52", "remaining_time": "8:40:17", "throughput": 2742.32, "total_tokens": 1564088288} {"current_steps": 8661, "total_steps": 9134, "loss": 1.1699, "learning_rate": 3.301048853615568e-07, "epoch": 0.9481376063931689, "percentage": 94.82, "elapsed_time": "6 days, 14:26:59", "remaining_time": "8:39:12", "throughput": 2742.33, "total_tokens": 1564279808} {"current_steps": 8662, "total_steps": 9134, "loss": 0.6865, "learning_rate": 3.2871363212438613e-07, "epoch": 0.9482470784641068, "percentage": 94.83, "elapsed_time": "6 days, 14:28:05", "remaining_time": "8:38:06", "throughput": 2742.35, "total_tokens": 1564473120} {"current_steps": 8663, "total_steps": 9134, "loss": 1.1145, "learning_rate": 3.2732529745322647e-07, "epoch": 0.9483565505350448, "percentage": 94.84, "elapsed_time": "6 days, 14:29:09", "remaining_time": "8:37:00", "throughput": 2742.37, "total_tokens": 1564659488} {"current_steps": 8664, "total_steps": 9134, "loss": 1.0402, "learning_rate": 3.2593988151231603e-07, "epoch": 0.9484660226059827, "percentage": 94.85, "elapsed_time": "6 days, 14:30:14", "remaining_time": "8:35:54", "throughput": 2742.41, "total_tokens": 1564862208} {"current_steps": 8665, "total_steps": 9134, "loss": 0.8883, "learning_rate": 3.245573844655514e-07, "epoch": 0.9485754946769206, "percentage": 94.87, "elapsed_time": "6 days, 14:31:22", "remaining_time": "8:34:48", "throughput": 2742.42, "total_tokens": 1565052384} {"current_steps": 8666, "total_steps": 9134, "loss": 0.752, "learning_rate": 3.231778064764768e-07, "epoch": 0.9486849667478584, "percentage": 94.88, "elapsed_time": "6 days, 14:32:24", "remaining_time": "8:33:42", "throughput": 2742.41, "total_tokens": 1565214336} {"current_steps": 8667, "total_steps": 9134, "loss": 0.8407, "learning_rate": 3.2180114770829495e-07, "epoch": 0.9487944388187963, "percentage": 94.89, "elapsed_time": "6 days, 14:33:30", "remaining_time": "8:32:36", "throughput": 2742.42, "total_tokens": 1565400928} {"current_steps": 8668, "total_steps": 9134, "loss": 0.8355, "learning_rate": 3.204274083238562e-07, "epoch": 0.9489039108897342, "percentage": 94.9, "elapsed_time": "6 days, 14:34:29", "remaining_time": "8:31:30", "throughput": 2742.38, "total_tokens": 1565542496} {"current_steps": 8669, "total_steps": 9134, "loss": 0.932, "learning_rate": 3.1905658848567774e-07, "epoch": 0.9490133829606722, "percentage": 94.91, "elapsed_time": "6 days, 14:35:34", "remaining_time": "8:30:24", "throughput": 2742.39, "total_tokens": 1565724384} {"current_steps": 8670, "total_steps": 9134, "loss": 0.983, "learning_rate": 3.1768868835592434e-07, "epoch": 0.9491228550316101, "percentage": 94.92, "elapsed_time": "6 days, 14:36:42", "remaining_time": "8:29:18", "throughput": 2742.42, "total_tokens": 1565927776} {"current_steps": 8671, "total_steps": 9134, "loss": 0.7766, "learning_rate": 3.1632370809641376e-07, "epoch": 0.949232327102548, "percentage": 94.93, "elapsed_time": "6 days, 14:37:43", "remaining_time": "8:28:12", "throughput": 2742.42, "total_tokens": 1566093984} {"current_steps": 8672, "total_steps": 9134, "loss": 0.8213, "learning_rate": 3.149616478686196e-07, "epoch": 0.9493417991734858, "percentage": 94.94, "elapsed_time": "6 days, 14:38:46", "remaining_time": "8:27:06", "throughput": 2742.4, "total_tokens": 1566259744} {"current_steps": 8673, "total_steps": 9134, "loss": 0.9684, "learning_rate": 3.1360250783367406e-07, "epoch": 0.9494512712444237, "percentage": 94.95, "elapsed_time": "6 days, 14:39:44", "remaining_time": "8:26:00", "throughput": 2742.39, "total_tokens": 1566412512} {"current_steps": 8674, "total_steps": 9134, "loss": 0.7546, "learning_rate": 3.122462881523625e-07, "epoch": 0.9495607433153617, "percentage": 94.96, "elapsed_time": "6 days, 14:40:50", "remaining_time": "8:24:54", "throughput": 2742.41, "total_tokens": 1566602240} {"current_steps": 8675, "total_steps": 9134, "loss": 0.9811, "learning_rate": 3.1089298898511476e-07, "epoch": 0.9496702153862996, "percentage": 94.97, "elapsed_time": "6 days, 14:41:58", "remaining_time": "8:23:48", "throughput": 2742.48, "total_tokens": 1566831616} {"current_steps": 8676, "total_steps": 9134, "loss": 0.9962, "learning_rate": 3.095426104920335e-07, "epoch": 0.9497796874572375, "percentage": 94.99, "elapsed_time": "6 days, 14:43:01", "remaining_time": "8:22:42", "throughput": 2742.47, "total_tokens": 1566999168} {"current_steps": 8677, "total_steps": 9134, "loss": 0.6982, "learning_rate": 3.081951528328575e-07, "epoch": 0.9498891595281753, "percentage": 95.0, "elapsed_time": "6 days, 14:44:04", "remaining_time": "8:21:36", "throughput": 2742.5, "total_tokens": 1567184192} {"current_steps": 8678, "total_steps": 9134, "loss": 0.8442, "learning_rate": 3.0685061616699263e-07, "epoch": 0.9499986315991132, "percentage": 95.01, "elapsed_time": "6 days, 14:45:07", "remaining_time": "8:20:30", "throughput": 2742.49, "total_tokens": 1567353088} {"current_steps": 8679, "total_steps": 9134, "loss": 0.8111, "learning_rate": 3.0550900065349774e-07, "epoch": 0.9501081036700512, "percentage": 95.02, "elapsed_time": "6 days, 14:46:09", "remaining_time": "8:19:24", "throughput": 2742.48, "total_tokens": 1567517056} {"current_steps": 8680, "total_steps": 9134, "loss": 0.8162, "learning_rate": 3.0417030645107924e-07, "epoch": 0.9502175757409891, "percentage": 95.03, "elapsed_time": "6 days, 14:47:11", "remaining_time": "8:18:18", "throughput": 2742.51, "total_tokens": 1567705664} {"current_steps": 8681, "total_steps": 9134, "loss": 0.8566, "learning_rate": 3.028345337181021e-07, "epoch": 0.950327047811927, "percentage": 95.04, "elapsed_time": "6 days, 14:48:12", "remaining_time": "8:17:12", "throughput": 2742.52, "total_tokens": 1567878816} {"current_steps": 8682, "total_steps": 9134, "loss": 0.9804, "learning_rate": 3.015016826125844e-07, "epoch": 0.9504365198828649, "percentage": 95.05, "elapsed_time": "6 days, 14:49:15", "remaining_time": "8:16:06", "throughput": 2742.5, "total_tokens": 1568039872} {"current_steps": 8683, "total_steps": 9134, "loss": 0.7235, "learning_rate": 3.001717532922055e-07, "epoch": 0.9505459919538027, "percentage": 95.06, "elapsed_time": "6 days, 14:50:18", "remaining_time": "8:15:00", "throughput": 2742.5, "total_tokens": 1568210560} {"current_steps": 8684, "total_steps": 9134, "loss": 1.2196, "learning_rate": 2.988447459142868e-07, "epoch": 0.9506554640247407, "percentage": 95.07, "elapsed_time": "6 days, 14:51:25", "remaining_time": "8:13:54", "throughput": 2742.53, "total_tokens": 1568414400} {"current_steps": 8685, "total_steps": 9134, "loss": 0.9516, "learning_rate": 2.975206606358194e-07, "epoch": 0.9507649360956786, "percentage": 95.08, "elapsed_time": "6 days, 14:52:30", "remaining_time": "8:12:48", "throughput": 2742.55, "total_tokens": 1568601888} {"current_steps": 8686, "total_steps": 9134, "loss": 0.6294, "learning_rate": 2.961994976134308e-07, "epoch": 0.9508744081666165, "percentage": 95.1, "elapsed_time": "6 days, 14:53:37", "remaining_time": "8:11:43", "throughput": 2742.57, "total_tokens": 1568796768} {"current_steps": 8687, "total_steps": 9134, "loss": 0.8852, "learning_rate": 2.948812570034154e-07, "epoch": 0.9509838802375544, "percentage": 95.11, "elapsed_time": "6 days, 14:54:42", "remaining_time": "8:10:37", "throughput": 2742.58, "total_tokens": 1568982688} {"current_steps": 8688, "total_steps": 9134, "loss": 0.8671, "learning_rate": 2.9356593896172066e-07, "epoch": 0.9510933523084923, "percentage": 95.12, "elapsed_time": "6 days, 14:55:47", "remaining_time": "8:09:31", "throughput": 2742.56, "total_tokens": 1569148896} {"current_steps": 8689, "total_steps": 9134, "loss": 0.6928, "learning_rate": 2.9225354364394444e-07, "epoch": 0.9512028243794302, "percentage": 95.13, "elapsed_time": "6 days, 14:56:51", "remaining_time": "8:08:25", "throughput": 2742.57, "total_tokens": 1569332352} {"current_steps": 8690, "total_steps": 9134, "loss": 0.7127, "learning_rate": 2.9094407120534295e-07, "epoch": 0.9513122964503681, "percentage": 95.14, "elapsed_time": "6 days, 14:57:55", "remaining_time": "8:07:19", "throughput": 2742.59, "total_tokens": 1569519168} {"current_steps": 8691, "total_steps": 9134, "loss": 1.0312, "learning_rate": 2.896375218008174e-07, "epoch": 0.951421768521306, "percentage": 95.15, "elapsed_time": "6 days, 14:59:01", "remaining_time": "8:06:13", "throughput": 2742.62, "total_tokens": 1569713600} {"current_steps": 8692, "total_steps": 9134, "loss": 0.9164, "learning_rate": 2.883338955849385e-07, "epoch": 0.9515312405922439, "percentage": 95.16, "elapsed_time": "6 days, 15:00:06", "remaining_time": "8:05:07", "throughput": 2742.65, "total_tokens": 1569909152} {"current_steps": 8693, "total_steps": 9134, "loss": 0.7892, "learning_rate": 2.870331927119163e-07, "epoch": 0.9516407126631818, "percentage": 95.17, "elapsed_time": "6 days, 15:01:11", "remaining_time": "8:04:01", "throughput": 2742.67, "total_tokens": 1570100896} {"current_steps": 8694, "total_steps": 9134, "loss": 0.9148, "learning_rate": 2.857354133356277e-07, "epoch": 0.9517501847341197, "percentage": 95.18, "elapsed_time": "6 days, 15:02:15", "remaining_time": "8:02:55", "throughput": 2742.68, "total_tokens": 1570284352} {"current_steps": 8695, "total_steps": 9134, "loss": 0.8886, "learning_rate": 2.8444055760959154e-07, "epoch": 0.9518596568050576, "percentage": 95.19, "elapsed_time": "6 days, 15:03:22", "remaining_time": "8:01:49", "throughput": 2742.71, "total_tokens": 1570481920} {"current_steps": 8696, "total_steps": 9134, "loss": 1.0138, "learning_rate": 2.8314862568699087e-07, "epoch": 0.9519691288759955, "percentage": 95.2, "elapsed_time": "6 days, 15:04:29", "remaining_time": "8:00:44", "throughput": 2742.7, "total_tokens": 1570658208} {"current_steps": 8697, "total_steps": 9134, "loss": 1.0857, "learning_rate": 2.8185961772065616e-07, "epoch": 0.9520786009469334, "percentage": 95.22, "elapsed_time": "6 days, 15:05:36", "remaining_time": "7:59:38", "throughput": 2742.71, "total_tokens": 1570848832} {"current_steps": 8698, "total_steps": 9134, "loss": 0.8204, "learning_rate": 2.8057353386307663e-07, "epoch": 0.9521880730178713, "percentage": 95.23, "elapsed_time": "6 days, 15:06:41", "remaining_time": "7:58:32", "throughput": 2742.69, "total_tokens": 1571013696} {"current_steps": 8699, "total_steps": 9134, "loss": 0.8364, "learning_rate": 2.792903742663916e-07, "epoch": 0.9522975450888093, "percentage": 95.24, "elapsed_time": "6 days, 15:07:47", "remaining_time": "7:57:26", "throughput": 2742.72, "total_tokens": 1571216640} {"current_steps": 8700, "total_steps": 9134, "loss": 1.0535, "learning_rate": 2.7801013908239636e-07, "epoch": 0.9524070171597471, "percentage": 95.25, "elapsed_time": "6 days, 15:08:51", "remaining_time": "7:56:20", "throughput": 2742.75, "total_tokens": 1571405696} {"current_steps": 8701, "total_steps": 9134, "loss": 0.8625, "learning_rate": 2.76732828462542e-07, "epoch": 0.952516489230685, "percentage": 95.26, "elapsed_time": "6 days, 15:09:58", "remaining_time": "7:55:14", "throughput": 2742.75, "total_tokens": 1571594304} {"current_steps": 8702, "total_steps": 9134, "loss": 0.7619, "learning_rate": 2.7545844255793263e-07, "epoch": 0.9526259613016229, "percentage": 95.27, "elapsed_time": "6 days, 15:11:06", "remaining_time": "7:54:09", "throughput": 2742.77, "total_tokens": 1571790976} {"current_steps": 8703, "total_steps": 9134, "loss": 0.7626, "learning_rate": 2.741869815193226e-07, "epoch": 0.9527354333725608, "percentage": 95.28, "elapsed_time": "6 days, 15:12:11", "remaining_time": "7:53:03", "throughput": 2742.73, "total_tokens": 1571943744} {"current_steps": 8704, "total_steps": 9134, "loss": 0.7584, "learning_rate": 2.729184454971251e-07, "epoch": 0.9528449054434988, "percentage": 95.29, "elapsed_time": "6 days, 15:13:17", "remaining_time": "7:51:57", "throughput": 2742.74, "total_tokens": 1572130112} {"current_steps": 8705, "total_steps": 9134, "loss": 0.7514, "learning_rate": 2.71652834641406e-07, "epoch": 0.9529543775144367, "percentage": 95.3, "elapsed_time": "6 days, 15:14:21", "remaining_time": "7:50:51", "throughput": 2742.74, "total_tokens": 1572308864} {"current_steps": 8706, "total_steps": 9134, "loss": 0.6886, "learning_rate": 2.7039014910188455e-07, "epoch": 0.9530638495853745, "percentage": 95.31, "elapsed_time": "6 days, 15:15:24", "remaining_time": "7:49:45", "throughput": 2742.77, "total_tokens": 1572494336} {"current_steps": 8707, "total_steps": 9134, "loss": 0.999, "learning_rate": 2.691303890279301e-07, "epoch": 0.9531733216563124, "percentage": 95.33, "elapsed_time": "6 days, 15:16:27", "remaining_time": "7:48:39", "throughput": 2742.72, "total_tokens": 1572638592} {"current_steps": 8708, "total_steps": 9134, "loss": 1.2156, "learning_rate": 2.678735545685762e-07, "epoch": 0.9532827937272503, "percentage": 95.34, "elapsed_time": "6 days, 15:17:34", "remaining_time": "7:47:33", "throughput": 2742.76, "total_tokens": 1572849376} {"current_steps": 8709, "total_steps": 9134, "loss": 0.9521, "learning_rate": 2.666196458725012e-07, "epoch": 0.9533922657981883, "percentage": 95.35, "elapsed_time": "6 days, 15:18:38", "remaining_time": "7:46:27", "throughput": 2742.74, "total_tokens": 1573016256} {"current_steps": 8710, "total_steps": 9134, "loss": 0.6871, "learning_rate": 2.653686630880392e-07, "epoch": 0.9535017378691262, "percentage": 95.36, "elapsed_time": "6 days, 15:19:43", "remaining_time": "7:45:21", "throughput": 2742.75, "total_tokens": 1573197024} {"current_steps": 8711, "total_steps": 9134, "loss": 0.7378, "learning_rate": 2.641206063631774e-07, "epoch": 0.953611209940064, "percentage": 95.37, "elapsed_time": "6 days, 15:20:50", "remaining_time": "7:44:16", "throughput": 2742.76, "total_tokens": 1573388544} {"current_steps": 8712, "total_steps": 9134, "loss": 0.8983, "learning_rate": 2.628754758455643e-07, "epoch": 0.9537206820110019, "percentage": 95.38, "elapsed_time": "6 days, 15:21:49", "remaining_time": "7:43:09", "throughput": 2742.75, "total_tokens": 1573538848} {"current_steps": 8713, "total_steps": 9134, "loss": 0.9111, "learning_rate": 2.616332716824932e-07, "epoch": 0.9538301540819398, "percentage": 95.39, "elapsed_time": "6 days, 15:22:53", "remaining_time": "7:42:03", "throughput": 2742.72, "total_tokens": 1573701920} {"current_steps": 8714, "total_steps": 9134, "loss": 0.9241, "learning_rate": 2.6039399402091324e-07, "epoch": 0.9539396261528778, "percentage": 95.4, "elapsed_time": "6 days, 15:23:58", "remaining_time": "7:40:58", "throughput": 2742.75, "total_tokens": 1573896128} {"current_steps": 8715, "total_steps": 9134, "loss": 0.8482, "learning_rate": 2.591576430074266e-07, "epoch": 0.9540490982238157, "percentage": 95.41, "elapsed_time": "6 days, 15:25:04", "remaining_time": "7:39:52", "throughput": 2742.77, "total_tokens": 1574088768} {"current_steps": 8716, "total_steps": 9134, "loss": 0.7391, "learning_rate": 2.5792421878829965e-07, "epoch": 0.9541585702947536, "percentage": 95.42, "elapsed_time": "6 days, 15:26:07", "remaining_time": "7:38:46", "throughput": 2742.77, "total_tokens": 1574259008} {"current_steps": 8717, "total_steps": 9134, "loss": 0.7435, "learning_rate": 2.5669372150943505e-07, "epoch": 0.9542680423656914, "percentage": 95.43, "elapsed_time": "6 days, 15:27:11", "remaining_time": "7:37:40", "throughput": 2742.78, "total_tokens": 1574444256} {"current_steps": 8718, "total_steps": 9134, "loss": 1.035, "learning_rate": 2.554661513164053e-07, "epoch": 0.9543775144366293, "percentage": 95.45, "elapsed_time": "6 days, 15:28:15", "remaining_time": "7:36:34", "throughput": 2742.8, "total_tokens": 1574628160} {"current_steps": 8719, "total_steps": 9134, "loss": 0.7947, "learning_rate": 2.5424150835442193e-07, "epoch": 0.9544869865075672, "percentage": 95.46, "elapsed_time": "6 days, 15:29:15", "remaining_time": "7:35:28", "throughput": 2742.79, "total_tokens": 1574789216} {"current_steps": 8720, "total_steps": 9134, "loss": 0.8687, "learning_rate": 2.530197927683664e-07, "epoch": 0.9545964585785052, "percentage": 95.47, "elapsed_time": "6 days, 15:30:18", "remaining_time": "7:34:22", "throughput": 2742.75, "total_tokens": 1574937728} {"current_steps": 8721, "total_steps": 9134, "loss": 1.0996, "learning_rate": 2.5180100470275916e-07, "epoch": 0.9547059306494431, "percentage": 95.48, "elapsed_time": "6 days, 15:31:24", "remaining_time": "7:33:16", "throughput": 2742.73, "total_tokens": 1575109312} {"current_steps": 8722, "total_steps": 9134, "loss": 1.0317, "learning_rate": 2.5058514430178205e-07, "epoch": 0.954815402720381, "percentage": 95.49, "elapsed_time": "6 days, 15:32:29", "remaining_time": "7:32:10", "throughput": 2742.73, "total_tokens": 1575283584} {"current_steps": 8723, "total_steps": 9134, "loss": 0.7477, "learning_rate": 2.4937221170927007e-07, "epoch": 0.9549248747913188, "percentage": 95.5, "elapsed_time": "6 days, 15:33:29", "remaining_time": "7:31:04", "throughput": 2742.7, "total_tokens": 1575429184} {"current_steps": 8724, "total_steps": 9134, "loss": 1.013, "learning_rate": 2.481622070687112e-07, "epoch": 0.9550343468622567, "percentage": 95.51, "elapsed_time": "6 days, 15:34:30", "remaining_time": "7:29:58", "throughput": 2742.72, "total_tokens": 1575613760} {"current_steps": 8725, "total_steps": 9134, "loss": 1.0867, "learning_rate": 2.469551305232465e-07, "epoch": 0.9551438189331947, "percentage": 95.52, "elapsed_time": "6 days, 15:35:33", "remaining_time": "7:28:52", "throughput": 2742.73, "total_tokens": 1575788256} {"current_steps": 8726, "total_steps": 9134, "loss": 0.874, "learning_rate": 2.457509822156673e-07, "epoch": 0.9552532910041326, "percentage": 95.53, "elapsed_time": "6 days, 15:36:35", "remaining_time": "7:27:46", "throughput": 2742.72, "total_tokens": 1575955360} {"current_steps": 8727, "total_steps": 9134, "loss": 0.8812, "learning_rate": 2.445497622884263e-07, "epoch": 0.9553627630750705, "percentage": 95.54, "elapsed_time": "6 days, 15:37:43", "remaining_time": "7:26:40", "throughput": 2742.72, "total_tokens": 1576140608} {"current_steps": 8728, "total_steps": 9134, "loss": 0.8874, "learning_rate": 2.4335147088362377e-07, "epoch": 0.9554722351460083, "percentage": 95.56, "elapsed_time": "6 days, 15:38:49", "remaining_time": "7:25:34", "throughput": 2742.76, "total_tokens": 1576344672} {"current_steps": 8729, "total_steps": 9134, "loss": 0.8185, "learning_rate": 2.421561081430157e-07, "epoch": 0.9555817072169462, "percentage": 95.57, "elapsed_time": "6 days, 15:39:54", "remaining_time": "7:24:28", "throughput": 2742.76, "total_tokens": 1576519392} {"current_steps": 8730, "total_steps": 9134, "loss": 1.0725, "learning_rate": 2.409636742080112e-07, "epoch": 0.9556911792878842, "percentage": 95.58, "elapsed_time": "6 days, 15:40:54", "remaining_time": "7:23:22", "throughput": 2742.72, "total_tokens": 1576664544} {"current_steps": 8731, "total_steps": 9134, "loss": 0.9885, "learning_rate": 2.3977416921967256e-07, "epoch": 0.9558006513588221, "percentage": 95.59, "elapsed_time": "6 days, 15:41:56", "remaining_time": "7:22:16", "throughput": 2742.75, "total_tokens": 1576849120} {"current_steps": 8732, "total_steps": 9134, "loss": 0.9752, "learning_rate": 2.385875933187176e-07, "epoch": 0.95591012342976, "percentage": 95.6, "elapsed_time": "6 days, 15:42:57", "remaining_time": "7:21:10", "throughput": 2742.72, "total_tokens": 1577000096} {"current_steps": 8733, "total_steps": 9134, "loss": 0.8625, "learning_rate": 2.374039466455119e-07, "epoch": 0.9560195955006979, "percentage": 95.61, "elapsed_time": "6 days, 15:44:02", "remaining_time": "7:20:04", "throughput": 2742.71, "total_tokens": 1577177504} {"current_steps": 8734, "total_steps": 9134, "loss": 0.8287, "learning_rate": 2.3622322934008235e-07, "epoch": 0.9561290675716357, "percentage": 95.62, "elapsed_time": "6 days, 15:45:07", "remaining_time": "7:18:58", "throughput": 2742.71, "total_tokens": 1577353344} {"current_steps": 8735, "total_steps": 9134, "loss": 1.0082, "learning_rate": 2.350454415421033e-07, "epoch": 0.9562385396425737, "percentage": 95.63, "elapsed_time": "6 days, 15:46:13", "remaining_time": "7:17:52", "throughput": 2742.72, "total_tokens": 1577537472} {"current_steps": 8736, "total_steps": 9134, "loss": 0.9232, "learning_rate": 2.3387058339090773e-07, "epoch": 0.9563480117135116, "percentage": 95.64, "elapsed_time": "6 days, 15:47:18", "remaining_time": "7:16:47", "throughput": 2742.73, "total_tokens": 1577727200} {"current_steps": 8737, "total_steps": 9134, "loss": 1.0253, "learning_rate": 2.3269865502547894e-07, "epoch": 0.9564574837844495, "percentage": 95.65, "elapsed_time": "6 days, 15:48:26", "remaining_time": "7:15:41", "throughput": 2742.78, "total_tokens": 1577936640} {"current_steps": 8738, "total_steps": 9134, "loss": 0.89, "learning_rate": 2.3152965658445046e-07, "epoch": 0.9565669558553874, "percentage": 95.66, "elapsed_time": "6 days, 15:49:31", "remaining_time": "7:14:35", "throughput": 2742.83, "total_tokens": 1578147872} {"current_steps": 8739, "total_steps": 9134, "loss": 0.8703, "learning_rate": 2.3036358820611448e-07, "epoch": 0.9566764279263253, "percentage": 95.68, "elapsed_time": "6 days, 15:50:35", "remaining_time": "7:13:29", "throughput": 2742.82, "total_tokens": 1578315872} {"current_steps": 8740, "total_steps": 9134, "loss": 1.0554, "learning_rate": 2.2920045002841338e-07, "epoch": 0.9567858999972632, "percentage": 95.69, "elapsed_time": "6 days, 15:51:35", "remaining_time": "7:12:23", "throughput": 2742.8, "total_tokens": 1578467968} {"current_steps": 8741, "total_steps": 9134, "loss": 0.8738, "learning_rate": 2.280402421889455e-07, "epoch": 0.9568953720682011, "percentage": 95.7, "elapsed_time": "6 days, 15:52:38", "remaining_time": "7:11:17", "throughput": 2742.81, "total_tokens": 1578645152} {"current_steps": 8742, "total_steps": 9134, "loss": 0.8372, "learning_rate": 2.2688296482496208e-07, "epoch": 0.957004844139139, "percentage": 95.71, "elapsed_time": "6 days, 15:53:41", "remaining_time": "7:10:11", "throughput": 2742.82, "total_tokens": 1578822560} {"current_steps": 8743, "total_steps": 9134, "loss": 0.7412, "learning_rate": 2.2572861807336477e-07, "epoch": 0.9571143162100769, "percentage": 95.72, "elapsed_time": "6 days, 15:54:43", "remaining_time": "7:09:05", "throughput": 2742.8, "total_tokens": 1578988096} {"current_steps": 8744, "total_steps": 9134, "loss": 1.0477, "learning_rate": 2.2457720207071098e-07, "epoch": 0.9572237882810148, "percentage": 95.73, "elapsed_time": "6 days, 15:55:50", "remaining_time": "7:07:59", "throughput": 2742.81, "total_tokens": 1579175360} {"current_steps": 8745, "total_steps": 9134, "loss": 0.9589, "learning_rate": 2.23428716953214e-07, "epoch": 0.9573332603519527, "percentage": 95.74, "elapsed_time": "6 days, 15:56:53", "remaining_time": "7:06:53", "throughput": 2742.79, "total_tokens": 1579333280} {"current_steps": 8746, "total_steps": 9134, "loss": 0.9437, "learning_rate": 2.2228316285673456e-07, "epoch": 0.9574427324228906, "percentage": 95.75, "elapsed_time": "6 days, 15:57:53", "remaining_time": "7:05:47", "throughput": 2742.76, "total_tokens": 1579485824} {"current_steps": 8747, "total_steps": 9134, "loss": 1.0804, "learning_rate": 2.211405399167893e-07, "epoch": 0.9575522044938285, "percentage": 95.76, "elapsed_time": "6 days, 15:58:55", "remaining_time": "7:04:41", "throughput": 2742.76, "total_tokens": 1579650688} {"current_steps": 8748, "total_steps": 9134, "loss": 1.0293, "learning_rate": 2.2000084826854784e-07, "epoch": 0.9576616765647664, "percentage": 95.77, "elapsed_time": "6 days, 15:59:57", "remaining_time": "7:03:35", "throughput": 2742.75, "total_tokens": 1579818240} {"current_steps": 8749, "total_steps": 9134, "loss": 0.9951, "learning_rate": 2.1886408804683568e-07, "epoch": 0.9577711486357043, "percentage": 95.78, "elapsed_time": "6 days, 16:01:04", "remaining_time": "7:02:29", "throughput": 2742.79, "total_tokens": 1580026336} {"current_steps": 8750, "total_steps": 9134, "loss": 0.8404, "learning_rate": 2.1773025938612856e-07, "epoch": 0.9578806207066423, "percentage": 95.8, "elapsed_time": "6 days, 16:02:07", "remaining_time": "7:01:23", "throughput": 2742.79, "total_tokens": 1580196352} {"current_steps": 8751, "total_steps": 9134, "loss": 0.7377, "learning_rate": 2.1659936242055811e-07, "epoch": 0.9579900927775801, "percentage": 95.81, "elapsed_time": "6 days, 16:03:06", "remaining_time": "7:00:17", "throughput": 2742.75, "total_tokens": 1580331424} {"current_steps": 8752, "total_steps": 9134, "loss": 0.8792, "learning_rate": 2.1547139728390064e-07, "epoch": 0.958099564848518, "percentage": 95.82, "elapsed_time": "6 days, 16:04:07", "remaining_time": "6:59:11", "throughput": 2742.73, "total_tokens": 1580488896} {"current_steps": 8753, "total_steps": 9134, "loss": 1.1186, "learning_rate": 2.143463641095994e-07, "epoch": 0.9582090369194559, "percentage": 95.83, "elapsed_time": "6 days, 16:05:14", "remaining_time": "6:58:05", "throughput": 2742.74, "total_tokens": 1580682208} {"current_steps": 8754, "total_steps": 9134, "loss": 0.9549, "learning_rate": 2.1322426303074238e-07, "epoch": 0.9583185089903938, "percentage": 95.84, "elapsed_time": "6 days, 16:06:18", "remaining_time": "6:56:59", "throughput": 2742.74, "total_tokens": 1580854464} {"current_steps": 8755, "total_steps": 9134, "loss": 0.8644, "learning_rate": 2.1210509418006785e-07, "epoch": 0.9584279810613318, "percentage": 95.85, "elapsed_time": "6 days, 16:07:25", "remaining_time": "6:55:54", "throughput": 2742.77, "total_tokens": 1581057856} {"current_steps": 8756, "total_steps": 9134, "loss": 1.1488, "learning_rate": 2.1098885768997824e-07, "epoch": 0.9585374531322697, "percentage": 95.86, "elapsed_time": "6 days, 16:08:29", "remaining_time": "6:54:48", "throughput": 2742.77, "total_tokens": 1581234816} {"current_steps": 8757, "total_steps": 9134, "loss": 0.8268, "learning_rate": 2.098755536925151e-07, "epoch": 0.9586469252032075, "percentage": 95.87, "elapsed_time": "6 days, 16:09:29", "remaining_time": "6:53:42", "throughput": 2742.75, "total_tokens": 1581386912} {"current_steps": 8758, "total_steps": 9134, "loss": 0.9307, "learning_rate": 2.0876518231938426e-07, "epoch": 0.9587563972741454, "percentage": 95.88, "elapsed_time": "6 days, 16:10:32", "remaining_time": "6:52:36", "throughput": 2742.76, "total_tokens": 1581565664} {"current_steps": 8759, "total_steps": 9134, "loss": 0.6979, "learning_rate": 2.0765774370193892e-07, "epoch": 0.9588658693450833, "percentage": 95.89, "elapsed_time": "6 days, 16:11:38", "remaining_time": "6:51:30", "throughput": 2742.77, "total_tokens": 1581752256} {"current_steps": 8760, "total_steps": 9134, "loss": 0.85, "learning_rate": 2.0655323797119098e-07, "epoch": 0.9589753414160213, "percentage": 95.91, "elapsed_time": "6 days, 16:12:43", "remaining_time": "6:50:24", "throughput": 2742.81, "total_tokens": 1581951616} {"current_steps": 8761, "total_steps": 9134, "loss": 1.1693, "learning_rate": 2.0545166525779147e-07, "epoch": 0.9590848134869592, "percentage": 95.92, "elapsed_time": "6 days, 16:13:49", "remaining_time": "6:49:18", "throughput": 2742.85, "total_tokens": 1582157024} {"current_steps": 8762, "total_steps": 9134, "loss": 0.7726, "learning_rate": 2.0435302569206672e-07, "epoch": 0.959194285557897, "percentage": 95.93, "elapsed_time": "6 days, 16:14:56", "remaining_time": "6:48:12", "throughput": 2742.9, "total_tokens": 1582367136} {"current_steps": 8763, "total_steps": 9134, "loss": 0.9017, "learning_rate": 2.0325731940397386e-07, "epoch": 0.9593037576288349, "percentage": 95.94, "elapsed_time": "6 days, 16:15:54", "remaining_time": "6:47:06", "throughput": 2742.88, "total_tokens": 1582514528} {"current_steps": 8764, "total_steps": 9134, "loss": 0.977, "learning_rate": 2.0216454652313976e-07, "epoch": 0.9594132296997728, "percentage": 95.95, "elapsed_time": "6 days, 16:17:00", "remaining_time": "6:46:00", "throughput": 2742.91, "total_tokens": 1582714560} {"current_steps": 8765, "total_steps": 9134, "loss": 1.1677, "learning_rate": 2.0107470717883326e-07, "epoch": 0.9595227017707108, "percentage": 95.96, "elapsed_time": "6 days, 16:18:03", "remaining_time": "6:44:54", "throughput": 2742.93, "total_tokens": 1582898464} {"current_steps": 8766, "total_steps": 9134, "loss": 0.8775, "learning_rate": 1.9998780149997898e-07, "epoch": 0.9596321738416487, "percentage": 95.97, "elapsed_time": "6 days, 16:19:06", "remaining_time": "6:43:48", "throughput": 2742.94, "total_tokens": 1583079456} {"current_steps": 8767, "total_steps": 9134, "loss": 1.007, "learning_rate": 1.9890382961516295e-07, "epoch": 0.9597416459125866, "percentage": 95.98, "elapsed_time": "6 days, 16:20:13", "remaining_time": "6:42:43", "throughput": 2742.95, "total_tokens": 1583267168} {"current_steps": 8768, "total_steps": 9134, "loss": 0.8749, "learning_rate": 1.9782279165260765e-07, "epoch": 0.9598511179835244, "percentage": 95.99, "elapsed_time": "6 days, 16:21:17", "remaining_time": "6:41:37", "throughput": 2742.98, "total_tokens": 1583458912} {"current_steps": 8769, "total_steps": 9134, "loss": 1.0305, "learning_rate": 1.9674468774020516e-07, "epoch": 0.9599605900544623, "percentage": 96.0, "elapsed_time": "6 days, 16:22:22", "remaining_time": "6:40:31", "throughput": 2743.0, "total_tokens": 1583650208} {"current_steps": 8770, "total_steps": 9134, "loss": 0.9036, "learning_rate": 1.956695180054896e-07, "epoch": 0.9600700621254002, "percentage": 96.01, "elapsed_time": "6 days, 16:23:21", "remaining_time": "6:39:25", "throughput": 2742.99, "total_tokens": 1583807232} {"current_steps": 8771, "total_steps": 9134, "loss": 0.9012, "learning_rate": 1.9459728257565367e-07, "epoch": 0.9601795341963382, "percentage": 96.03, "elapsed_time": "6 days, 16:24:24", "remaining_time": "6:38:19", "throughput": 2742.99, "total_tokens": 1583978368} {"current_steps": 8772, "total_steps": 9134, "loss": 0.8983, "learning_rate": 1.935279815775376e-07, "epoch": 0.9602890062672761, "percentage": 96.04, "elapsed_time": "6 days, 16:25:26", "remaining_time": "6:37:13", "throughput": 2743.01, "total_tokens": 1584161824} {"current_steps": 8773, "total_steps": 9134, "loss": 1.0054, "learning_rate": 1.9246161513764015e-07, "epoch": 0.960398478338214, "percentage": 96.05, "elapsed_time": "6 days, 16:26:32", "remaining_time": "6:36:07", "throughput": 2743.05, "total_tokens": 1584365216} {"current_steps": 8774, "total_steps": 9134, "loss": 0.9221, "learning_rate": 1.9139818338211047e-07, "epoch": 0.9605079504091518, "percentage": 96.06, "elapsed_time": "6 days, 16:27:35", "remaining_time": "6:35:01", "throughput": 2743.05, "total_tokens": 1584538816} {"current_steps": 8775, "total_steps": 9134, "loss": 0.8978, "learning_rate": 1.903376864367451e-07, "epoch": 0.9606174224800897, "percentage": 96.07, "elapsed_time": "6 days, 16:28:38", "remaining_time": "6:33:55", "throughput": 2743.02, "total_tokens": 1584693600} {"current_steps": 8776, "total_steps": 9134, "loss": 0.9562, "learning_rate": 1.892801244270076e-07, "epoch": 0.9607268945510277, "percentage": 96.08, "elapsed_time": "6 days, 16:29:44", "remaining_time": "6:32:49", "throughput": 2743.06, "total_tokens": 1584897664} {"current_steps": 8777, "total_steps": 9134, "loss": 0.802, "learning_rate": 1.8822549747800066e-07, "epoch": 0.9608363666219656, "percentage": 96.09, "elapsed_time": "6 days, 16:30:47", "remaining_time": "6:31:43", "throughput": 2743.07, "total_tokens": 1585075072} {"current_steps": 8778, "total_steps": 9134, "loss": 0.7554, "learning_rate": 1.8717380571448562e-07, "epoch": 0.9609458386929035, "percentage": 96.1, "elapsed_time": "6 days, 16:31:48", "remaining_time": "6:30:37", "throughput": 2743.03, "total_tokens": 1585218656} {"current_steps": 8779, "total_steps": 9134, "loss": 0.8497, "learning_rate": 1.8612504926087405e-07, "epoch": 0.9610553107638413, "percentage": 96.11, "elapsed_time": "6 days, 16:32:54", "remaining_time": "6:29:31", "throughput": 2743.03, "total_tokens": 1585403904} {"current_steps": 8780, "total_steps": 9134, "loss": 0.9242, "learning_rate": 1.8507922824123614e-07, "epoch": 0.9611647828347792, "percentage": 96.12, "elapsed_time": "6 days, 16:33:54", "remaining_time": "6:28:25", "throughput": 2743.03, "total_tokens": 1585567200} {"current_steps": 8781, "total_steps": 9134, "loss": 0.8591, "learning_rate": 1.8403634277928407e-07, "epoch": 0.9612742549057172, "percentage": 96.14, "elapsed_time": "6 days, 16:34:59", "remaining_time": "6:27:19", "throughput": 2743.06, "total_tokens": 1585759168} {"current_steps": 8782, "total_steps": 9134, "loss": 1.0846, "learning_rate": 1.829963929983941e-07, "epoch": 0.9613837269766551, "percentage": 96.15, "elapsed_time": "6 days, 16:36:01", "remaining_time": "6:26:13", "throughput": 2743.05, "total_tokens": 1585928064} {"current_steps": 8783, "total_steps": 9134, "loss": 0.9992, "learning_rate": 1.8195937902158732e-07, "epoch": 0.961493199047593, "percentage": 96.16, "elapsed_time": "6 days, 16:37:04", "remaining_time": "6:25:07", "throughput": 2743.02, "total_tokens": 1586079264} {"current_steps": 8784, "total_steps": 9134, "loss": 0.921, "learning_rate": 1.8092530097154337e-07, "epoch": 0.9616026711185309, "percentage": 96.17, "elapsed_time": "6 days, 16:38:09", "remaining_time": "6:24:02", "throughput": 2743.02, "total_tokens": 1586261376} {"current_steps": 8785, "total_steps": 9134, "loss": 0.9677, "learning_rate": 1.7989415897058938e-07, "epoch": 0.9617121431894687, "percentage": 96.18, "elapsed_time": "6 days, 16:39:15", "remaining_time": "6:22:56", "throughput": 2743.04, "total_tokens": 1586453120} {"current_steps": 8786, "total_steps": 9134, "loss": 0.8934, "learning_rate": 1.7886595314070832e-07, "epoch": 0.9618216152604067, "percentage": 96.19, "elapsed_time": "6 days, 16:40:14", "remaining_time": "6:21:50", "throughput": 2743.03, "total_tokens": 1586608576} {"current_steps": 8787, "total_steps": 9134, "loss": 0.9203, "learning_rate": 1.7784068360353623e-07, "epoch": 0.9619310873313446, "percentage": 96.2, "elapsed_time": "6 days, 16:41:17", "remaining_time": "6:20:44", "throughput": 2743.05, "total_tokens": 1586790912} {"current_steps": 8788, "total_steps": 9134, "loss": 0.7854, "learning_rate": 1.7681835048035944e-07, "epoch": 0.9620405594022825, "percentage": 96.21, "elapsed_time": "6 days, 16:42:22", "remaining_time": "6:19:38", "throughput": 2743.05, "total_tokens": 1586973248} {"current_steps": 8789, "total_steps": 9134, "loss": 0.9243, "learning_rate": 1.7579895389211732e-07, "epoch": 0.9621500314732204, "percentage": 96.22, "elapsed_time": "6 days, 16:43:26", "remaining_time": "6:18:32", "throughput": 2743.05, "total_tokens": 1587143936} {"current_steps": 8790, "total_steps": 9134, "loss": 1.003, "learning_rate": 1.7478249395940227e-07, "epoch": 0.9622595035441583, "percentage": 96.23, "elapsed_time": "6 days, 16:44:27", "remaining_time": "6:17:26", "throughput": 2743.06, "total_tokens": 1587316640} {"current_steps": 8791, "total_steps": 9134, "loss": 1.0206, "learning_rate": 1.7376897080246257e-07, "epoch": 0.9623689756150962, "percentage": 96.24, "elapsed_time": "6 days, 16:45:28", "remaining_time": "6:16:20", "throughput": 2743.04, "total_tokens": 1587473440} {"current_steps": 8792, "total_steps": 9134, "loss": 1.0641, "learning_rate": 1.727583845411912e-07, "epoch": 0.9624784476860341, "percentage": 96.26, "elapsed_time": "6 days, 16:46:33", "remaining_time": "6:15:14", "throughput": 2743.07, "total_tokens": 1587673472} {"current_steps": 8793, "total_steps": 9134, "loss": 0.8737, "learning_rate": 1.717507352951453e-07, "epoch": 0.962587919756972, "percentage": 96.27, "elapsed_time": "6 days, 16:47:37", "remaining_time": "6:14:08", "throughput": 2743.05, "total_tokens": 1587836768} {"current_steps": 8794, "total_steps": 9134, "loss": 0.905, "learning_rate": 1.707460231835184e-07, "epoch": 0.9626973918279099, "percentage": 96.28, "elapsed_time": "6 days, 16:48:42", "remaining_time": "6:13:02", "throughput": 2743.08, "total_tokens": 1588030752} {"current_steps": 8795, "total_steps": 9134, "loss": 0.9741, "learning_rate": 1.6974424832517654e-07, "epoch": 0.9628068638988478, "percentage": 96.29, "elapsed_time": "6 days, 16:49:47", "remaining_time": "6:11:56", "throughput": 2743.06, "total_tokens": 1588196064} {"current_steps": 8796, "total_steps": 9134, "loss": 1.1864, "learning_rate": 1.687454108386194e-07, "epoch": 0.9629163359697858, "percentage": 96.3, "elapsed_time": "6 days, 16:50:52", "remaining_time": "6:10:50", "throughput": 2743.1, "total_tokens": 1588396096} {"current_steps": 8797, "total_steps": 9134, "loss": 0.9868, "learning_rate": 1.6774951084201073e-07, "epoch": 0.9630258080407236, "percentage": 96.31, "elapsed_time": "6 days, 16:51:57", "remaining_time": "6:09:45", "throughput": 2743.1, "total_tokens": 1588575296} {"current_steps": 8798, "total_steps": 9134, "loss": 0.7224, "learning_rate": 1.6675654845316746e-07, "epoch": 0.9631352801116615, "percentage": 96.32, "elapsed_time": "6 days, 16:52:56", "remaining_time": "6:08:39", "throughput": 2743.09, "total_tokens": 1588732768} {"current_steps": 8799, "total_steps": 9134, "loss": 0.8894, "learning_rate": 1.657665237895484e-07, "epoch": 0.9632447521825994, "percentage": 96.33, "elapsed_time": "6 days, 16:53:59", "remaining_time": "6:07:33", "throughput": 2743.08, "total_tokens": 1588898752} {"current_steps": 8800, "total_steps": 9134, "loss": 0.7983, "learning_rate": 1.6477943696827647e-07, "epoch": 0.9633542242535373, "percentage": 96.34, "elapsed_time": "6 days, 16:55:05", "remaining_time": "6:06:27", "throughput": 2743.08, "total_tokens": 1589081312} {"current_steps": 8801, "total_steps": 9134, "loss": 0.5396, "learning_rate": 1.6379528810611666e-07, "epoch": 0.9634636963244753, "percentage": 96.35, "elapsed_time": "6 days, 16:56:11", "remaining_time": "6:05:21", "throughput": 2743.11, "total_tokens": 1589277760} {"current_steps": 8802, "total_steps": 9134, "loss": 0.7957, "learning_rate": 1.6281407731949805e-07, "epoch": 0.9635731683954131, "percentage": 96.37, "elapsed_time": "6 days, 16:57:14", "remaining_time": "6:04:15", "throughput": 2743.12, "total_tokens": 1589457184} {"current_steps": 8803, "total_steps": 9134, "loss": 0.8748, "learning_rate": 1.6183580472449444e-07, "epoch": 0.963682640466351, "percentage": 96.38, "elapsed_time": "6 days, 16:58:21", "remaining_time": "6:03:09", "throughput": 2743.18, "total_tokens": 1589677824} {"current_steps": 8804, "total_steps": 9134, "loss": 0.6863, "learning_rate": 1.6086047043682994e-07, "epoch": 0.9637921125372889, "percentage": 96.39, "elapsed_time": "6 days, 16:59:24", "remaining_time": "6:02:03", "throughput": 2743.21, "total_tokens": 1589867328} {"current_steps": 8805, "total_steps": 9134, "loss": 0.9494, "learning_rate": 1.5988807457189003e-07, "epoch": 0.9639015846082268, "percentage": 96.4, "elapsed_time": "6 days, 17:00:31", "remaining_time": "6:00:58", "throughput": 2743.24, "total_tokens": 1590070720} {"current_steps": 8806, "total_steps": 9134, "loss": 0.9283, "learning_rate": 1.5891861724470214e-07, "epoch": 0.9640110566791648, "percentage": 96.41, "elapsed_time": "6 days, 17:01:34", "remaining_time": "5:59:52", "throughput": 2743.24, "total_tokens": 1590242528} {"current_steps": 8807, "total_steps": 9134, "loss": 0.978, "learning_rate": 1.5795209856995507e-07, "epoch": 0.9641205287501027, "percentage": 96.42, "elapsed_time": "6 days, 17:02:37", "remaining_time": "5:58:46", "throughput": 2743.25, "total_tokens": 1590418592} {"current_steps": 8808, "total_steps": 9134, "loss": 0.9938, "learning_rate": 1.5698851866198516e-07, "epoch": 0.9642300008210405, "percentage": 96.43, "elapsed_time": "6 days, 17:03:42", "remaining_time": "5:57:40", "throughput": 2743.26, "total_tokens": 1590605184} {"current_steps": 8809, "total_steps": 9134, "loss": 1.0023, "learning_rate": 1.5602787763478177e-07, "epoch": 0.9643394728919784, "percentage": 96.44, "elapsed_time": "6 days, 17:04:45", "remaining_time": "5:56:34", "throughput": 2743.25, "total_tokens": 1590773632} {"current_steps": 8810, "total_steps": 9134, "loss": 0.7938, "learning_rate": 1.5507017560198457e-07, "epoch": 0.9644489449629163, "percentage": 96.45, "elapsed_time": "6 days, 17:05:49", "remaining_time": "5:55:28", "throughput": 2743.26, "total_tokens": 1590953280} {"current_steps": 8811, "total_steps": 9134, "loss": 0.8998, "learning_rate": 1.5411541267689178e-07, "epoch": 0.9645584170338543, "percentage": 96.46, "elapsed_time": "6 days, 17:06:52", "remaining_time": "5:54:22", "throughput": 2743.28, "total_tokens": 1591138304} {"current_steps": 8812, "total_steps": 9134, "loss": 0.9486, "learning_rate": 1.531635889724492e-07, "epoch": 0.9646678891047922, "percentage": 96.47, "elapsed_time": "6 days, 17:07:58", "remaining_time": "5:53:16", "throughput": 2743.32, "total_tokens": 1591343488} {"current_steps": 8813, "total_steps": 9134, "loss": 1.0323, "learning_rate": 1.5221470460125565e-07, "epoch": 0.9647773611757301, "percentage": 96.49, "elapsed_time": "6 days, 17:09:02", "remaining_time": "5:52:10", "throughput": 2743.35, "total_tokens": 1591530304} {"current_steps": 8814, "total_steps": 9134, "loss": 1.1449, "learning_rate": 1.512687596755602e-07, "epoch": 0.9648868332466679, "percentage": 96.5, "elapsed_time": "6 days, 17:10:06", "remaining_time": "5:51:04", "throughput": 2743.36, "total_tokens": 1591717568} {"current_steps": 8815, "total_steps": 9134, "loss": 1.0165, "learning_rate": 1.5032575430726782e-07, "epoch": 0.9649963053176058, "percentage": 96.51, "elapsed_time": "6 days, 17:11:12", "remaining_time": "5:49:59", "throughput": 2743.39, "total_tokens": 1591910880} {"current_steps": 8816, "total_steps": 9134, "loss": 0.9565, "learning_rate": 1.4938568860793367e-07, "epoch": 0.9651057773885438, "percentage": 96.52, "elapsed_time": "6 days, 17:12:14", "remaining_time": "5:48:53", "throughput": 2743.41, "total_tokens": 1592096352} {"current_steps": 8817, "total_steps": 9134, "loss": 0.8753, "learning_rate": 1.4844856268876607e-07, "epoch": 0.9652152494594817, "percentage": 96.53, "elapsed_time": "6 days, 17:13:21", "remaining_time": "5:47:47", "throughput": 2743.4, "total_tokens": 1592276224} {"current_steps": 8818, "total_steps": 9134, "loss": 0.9768, "learning_rate": 1.475143766606263e-07, "epoch": 0.9653247215304196, "percentage": 96.54, "elapsed_time": "6 days, 17:14:23", "remaining_time": "5:46:41", "throughput": 2743.38, "total_tokens": 1592430784} {"current_steps": 8819, "total_steps": 9134, "loss": 0.9454, "learning_rate": 1.4658313063402595e-07, "epoch": 0.9654341936013574, "percentage": 96.55, "elapsed_time": "6 days, 17:15:26", "remaining_time": "5:45:35", "throughput": 2743.38, "total_tokens": 1592606848} {"current_steps": 8820, "total_steps": 9134, "loss": 0.9764, "learning_rate": 1.4565482471912971e-07, "epoch": 0.9655436656722953, "percentage": 96.56, "elapsed_time": "6 days, 17:16:27", "remaining_time": "5:44:29", "throughput": 2743.37, "total_tokens": 1592765216} {"current_steps": 8821, "total_steps": 9134, "loss": 0.684, "learning_rate": 1.447294590257553e-07, "epoch": 0.9656531377432332, "percentage": 96.57, "elapsed_time": "6 days, 17:17:34", "remaining_time": "5:43:23", "throughput": 2743.38, "total_tokens": 1592955840} {"current_steps": 8822, "total_steps": 9134, "loss": 0.7183, "learning_rate": 1.438070336633679e-07, "epoch": 0.9657626098141712, "percentage": 96.58, "elapsed_time": "6 days, 17:18:37", "remaining_time": "5:42:17", "throughput": 2743.41, "total_tokens": 1593144896} {"current_steps": 8823, "total_steps": 9134, "loss": 0.9583, "learning_rate": 1.4288754874109134e-07, "epoch": 0.9658720818851091, "percentage": 96.6, "elapsed_time": "6 days, 17:19:42", "remaining_time": "5:41:11", "throughput": 2743.43, "total_tokens": 1593338432} {"current_steps": 8824, "total_steps": 9134, "loss": 1.0413, "learning_rate": 1.419710043677025e-07, "epoch": 0.965981553956047, "percentage": 96.61, "elapsed_time": "6 days, 17:20:47", "remaining_time": "5:40:06", "throughput": 2743.45, "total_tokens": 1593528384} {"current_steps": 8825, "total_steps": 9134, "loss": 1.2107, "learning_rate": 1.410574006516202e-07, "epoch": 0.9660910260269848, "percentage": 96.62, "elapsed_time": "6 days, 17:21:53", "remaining_time": "5:39:00", "throughput": 2743.49, "total_tokens": 1593729312} {"current_steps": 8826, "total_steps": 9134, "loss": 0.8511, "learning_rate": 1.4014673770092746e-07, "epoch": 0.9662004980979227, "percentage": 96.63, "elapsed_time": "6 days, 17:22:57", "remaining_time": "5:37:54", "throughput": 2743.5, "total_tokens": 1593912992} {"current_steps": 8827, "total_steps": 9134, "loss": 0.7478, "learning_rate": 1.3923901562334917e-07, "epoch": 0.9663099701688607, "percentage": 96.64, "elapsed_time": "6 days, 17:23:56", "remaining_time": "5:36:48", "throughput": 2743.46, "total_tokens": 1594051872} {"current_steps": 8828, "total_steps": 9134, "loss": 0.7839, "learning_rate": 1.383342345262717e-07, "epoch": 0.9664194422397986, "percentage": 96.65, "elapsed_time": "6 days, 17:25:03", "remaining_time": "5:35:42", "throughput": 2743.47, "total_tokens": 1594242272} {"current_steps": 8829, "total_steps": 9134, "loss": 0.9916, "learning_rate": 1.3743239451672608e-07, "epoch": 0.9665289143107365, "percentage": 96.66, "elapsed_time": "6 days, 17:26:07", "remaining_time": "5:34:36", "throughput": 2743.49, "total_tokens": 1594425952} {"current_steps": 8830, "total_steps": 9134, "loss": 0.7943, "learning_rate": 1.3653349570139918e-07, "epoch": 0.9666383863816744, "percentage": 96.67, "elapsed_time": "6 days, 17:27:09", "remaining_time": "5:33:30", "throughput": 2743.48, "total_tokens": 1594588576} {"current_steps": 8831, "total_steps": 9134, "loss": 0.6632, "learning_rate": 1.3563753818663093e-07, "epoch": 0.9667478584526122, "percentage": 96.68, "elapsed_time": "6 days, 17:28:14", "remaining_time": "5:32:24", "throughput": 2743.49, "total_tokens": 1594774720} {"current_steps": 8832, "total_steps": 9134, "loss": 0.7547, "learning_rate": 1.3474452207840605e-07, "epoch": 0.9668573305235502, "percentage": 96.69, "elapsed_time": "6 days, 17:29:20", "remaining_time": "5:31:18", "throughput": 2743.5, "total_tokens": 1594959520} {"current_steps": 8833, "total_steps": 9134, "loss": 0.7651, "learning_rate": 1.3385444748237053e-07, "epoch": 0.9669668025944881, "percentage": 96.7, "elapsed_time": "6 days, 17:30:23", "remaining_time": "5:30:13", "throughput": 2743.49, "total_tokens": 1595127296} {"current_steps": 8834, "total_steps": 9134, "loss": 0.8201, "learning_rate": 1.3296731450381795e-07, "epoch": 0.967076274665426, "percentage": 96.72, "elapsed_time": "6 days, 17:31:24", "remaining_time": "5:29:07", "throughput": 2743.45, "total_tokens": 1595276032} {"current_steps": 8835, "total_steps": 9134, "loss": 0.9111, "learning_rate": 1.3208312324769766e-07, "epoch": 0.9671857467363639, "percentage": 96.73, "elapsed_time": "6 days, 17:32:29", "remaining_time": "5:28:01", "throughput": 2743.45, "total_tokens": 1595450080} {"current_steps": 8836, "total_steps": 9134, "loss": 0.8124, "learning_rate": 1.3120187381859826e-07, "epoch": 0.9672952188073017, "percentage": 96.74, "elapsed_time": "6 days, 17:33:31", "remaining_time": "5:26:55", "throughput": 2743.45, "total_tokens": 1595620096} {"current_steps": 8837, "total_steps": 9134, "loss": 0.9544, "learning_rate": 1.303235663207808e-07, "epoch": 0.9674046908782397, "percentage": 96.75, "elapsed_time": "6 days, 17:34:38", "remaining_time": "5:25:49", "throughput": 2743.47, "total_tokens": 1595820352} {"current_steps": 8838, "total_steps": 9134, "loss": 0.6601, "learning_rate": 1.2944820085814268e-07, "epoch": 0.9675141629491776, "percentage": 96.76, "elapsed_time": "6 days, 17:35:40", "remaining_time": "5:24:43", "throughput": 2743.45, "total_tokens": 1595978720} {"current_steps": 8839, "total_steps": 9134, "loss": 0.8659, "learning_rate": 1.2857577753423444e-07, "epoch": 0.9676236350201155, "percentage": 96.77, "elapsed_time": "6 days, 17:36:39", "remaining_time": "5:23:37", "throughput": 2743.43, "total_tokens": 1596122752} {"current_steps": 8840, "total_steps": 9134, "loss": 0.8747, "learning_rate": 1.2770629645226796e-07, "epoch": 0.9677331070910534, "percentage": 96.78, "elapsed_time": "6 days, 17:37:36", "remaining_time": "5:22:31", "throughput": 2743.39, "total_tokens": 1596258496} {"current_steps": 8841, "total_steps": 9134, "loss": 1.0417, "learning_rate": 1.2683975771509982e-07, "epoch": 0.9678425791619913, "percentage": 96.79, "elapsed_time": "6 days, 17:38:38", "remaining_time": "5:21:25", "throughput": 2743.35, "total_tokens": 1596404320} {"current_steps": 8842, "total_steps": 9134, "loss": 0.929, "learning_rate": 1.2597616142523973e-07, "epoch": 0.9679520512329292, "percentage": 96.8, "elapsed_time": "6 days, 17:39:42", "remaining_time": "5:20:19", "throughput": 2743.37, "total_tokens": 1596595168} {"current_steps": 8843, "total_steps": 9134, "loss": 0.9454, "learning_rate": 1.251155076848448e-07, "epoch": 0.9680615233038671, "percentage": 96.81, "elapsed_time": "6 days, 17:40:46", "remaining_time": "5:19:13", "throughput": 2743.38, "total_tokens": 1596775488} {"current_steps": 8844, "total_steps": 9134, "loss": 0.8901, "learning_rate": 1.2425779659573368e-07, "epoch": 0.968170995374805, "percentage": 96.83, "elapsed_time": "6 days, 17:41:53", "remaining_time": "5:18:07", "throughput": 2743.38, "total_tokens": 1596957152} {"current_steps": 8845, "total_steps": 9134, "loss": 0.6821, "learning_rate": 1.2340302825937232e-07, "epoch": 0.9682804674457429, "percentage": 96.84, "elapsed_time": "6 days, 17:42:52", "remaining_time": "5:17:01", "throughput": 2743.34, "total_tokens": 1597095360} {"current_steps": 8846, "total_steps": 9134, "loss": 0.9196, "learning_rate": 1.2255120277687714e-07, "epoch": 0.9683899395166808, "percentage": 96.85, "elapsed_time": "6 days, 17:43:55", "remaining_time": "5:15:55", "throughput": 2743.34, "total_tokens": 1597272320} {"current_steps": 8847, "total_steps": 9134, "loss": 0.964, "learning_rate": 1.2170232024901473e-07, "epoch": 0.9684994115876188, "percentage": 96.86, "elapsed_time": "6 days, 17:44:59", "remaining_time": "5:14:50", "throughput": 2743.32, "total_tokens": 1597433600} {"current_steps": 8848, "total_steps": 9134, "loss": 1.1229, "learning_rate": 1.208563807762103e-07, "epoch": 0.9686088836585566, "percentage": 96.87, "elapsed_time": "6 days, 17:46:06", "remaining_time": "5:13:44", "throughput": 2743.36, "total_tokens": 1597638784} {"current_steps": 8849, "total_steps": 9134, "loss": 0.8259, "learning_rate": 1.2001338445853382e-07, "epoch": 0.9687183557294945, "percentage": 96.88, "elapsed_time": "6 days, 17:47:13", "remaining_time": "5:12:38", "throughput": 2743.4, "total_tokens": 1597847328} {"current_steps": 8850, "total_steps": 9134, "loss": 1.1402, "learning_rate": 1.1917333139571385e-07, "epoch": 0.9688278278004324, "percentage": 96.89, "elapsed_time": "6 days, 17:48:17", "remaining_time": "5:11:32", "throughput": 2743.4, "total_tokens": 1598021152} {"current_steps": 8851, "total_steps": 9134, "loss": 0.7415, "learning_rate": 1.1833622168712366e-07, "epoch": 0.9689372998713703, "percentage": 96.9, "elapsed_time": "6 days, 17:49:19", "remaining_time": "5:10:26", "throughput": 2743.41, "total_tokens": 1598197888} {"current_steps": 8852, "total_steps": 9134, "loss": 1.1279, "learning_rate": 1.1750205543179239e-07, "epoch": 0.9690467719423083, "percentage": 96.91, "elapsed_time": "6 days, 17:50:23", "remaining_time": "5:09:20", "throughput": 2743.4, "total_tokens": 1598365888} {"current_steps": 8853, "total_steps": 9134, "loss": 0.6788, "learning_rate": 1.1667083272840218e-07, "epoch": 0.9691562440132461, "percentage": 96.92, "elapsed_time": "6 days, 17:51:27", "remaining_time": "5:08:14", "throughput": 2743.4, "total_tokens": 1598546880} {"current_steps": 8854, "total_steps": 9134, "loss": 0.7425, "learning_rate": 1.1584255367528274e-07, "epoch": 0.969265716084184, "percentage": 96.93, "elapsed_time": "6 days, 17:52:29", "remaining_time": "5:07:08", "throughput": 2743.4, "total_tokens": 1598715328} {"current_steps": 8855, "total_steps": 9134, "loss": 0.8326, "learning_rate": 1.1501721837041679e-07, "epoch": 0.9693751881551219, "percentage": 96.95, "elapsed_time": "6 days, 17:53:35", "remaining_time": "5:06:03", "throughput": 2743.43, "total_tokens": 1598913568} {"current_steps": 8856, "total_steps": 9134, "loss": 0.915, "learning_rate": 1.141948269114429e-07, "epoch": 0.9694846602260598, "percentage": 96.96, "elapsed_time": "6 days, 17:54:40", "remaining_time": "5:04:57", "throughput": 2743.43, "total_tokens": 1599093216} {"current_steps": 8857, "total_steps": 9134, "loss": 0.6336, "learning_rate": 1.133753793956499e-07, "epoch": 0.9695941322969978, "percentage": 96.97, "elapsed_time": "6 days, 17:55:40", "remaining_time": "5:03:51", "throughput": 2743.42, "total_tokens": 1599248896} {"current_steps": 8858, "total_steps": 9134, "loss": 0.7579, "learning_rate": 1.1255887591997138e-07, "epoch": 0.9697036043679357, "percentage": 96.98, "elapsed_time": "6 days, 17:56:42", "remaining_time": "5:02:45", "throughput": 2743.44, "total_tokens": 1599431456} {"current_steps": 8859, "total_steps": 9134, "loss": 1.0034, "learning_rate": 1.1174531658100229e-07, "epoch": 0.9698130764388735, "percentage": 96.99, "elapsed_time": "6 days, 17:57:49", "remaining_time": "5:01:39", "throughput": 2743.44, "total_tokens": 1599616032} {"current_steps": 8860, "total_steps": 9134, "loss": 0.9299, "learning_rate": 1.1093470147498231e-07, "epoch": 0.9699225485098114, "percentage": 97.0, "elapsed_time": "6 days, 17:58:56", "remaining_time": "5:00:33", "throughput": 2743.47, "total_tokens": 1599818528} {"current_steps": 8861, "total_steps": 9134, "loss": 1.0742, "learning_rate": 1.1012703069780972e-07, "epoch": 0.9700320205807493, "percentage": 97.01, "elapsed_time": "6 days, 17:59:58", "remaining_time": "4:59:27", "throughput": 2743.47, "total_tokens": 1599987872} {"current_steps": 8862, "total_steps": 9134, "loss": 0.9106, "learning_rate": 1.0932230434502755e-07, "epoch": 0.9701414926516873, "percentage": 97.02, "elapsed_time": "6 days, 18:01:02", "remaining_time": "4:58:21", "throughput": 2743.49, "total_tokens": 1600174912} {"current_steps": 8863, "total_steps": 9134, "loss": 0.9124, "learning_rate": 1.0852052251183187e-07, "epoch": 0.9702509647226252, "percentage": 97.03, "elapsed_time": "6 days, 18:02:03", "remaining_time": "4:57:16", "throughput": 2743.45, "total_tokens": 1600316928} {"current_steps": 8864, "total_steps": 9134, "loss": 1.0668, "learning_rate": 1.0772168529307736e-07, "epoch": 0.9703604367935631, "percentage": 97.04, "elapsed_time": "6 days, 18:03:10", "remaining_time": "4:56:10", "throughput": 2743.49, "total_tokens": 1600525248} {"current_steps": 8865, "total_steps": 9134, "loss": 0.8373, "learning_rate": 1.0692579278325788e-07, "epoch": 0.9704699088645009, "percentage": 97.05, "elapsed_time": "6 days, 18:04:14", "remaining_time": "4:55:04", "throughput": 2743.49, "total_tokens": 1600703552} {"current_steps": 8866, "total_steps": 9134, "loss": 0.9818, "learning_rate": 1.061328450765342e-07, "epoch": 0.9705793809354388, "percentage": 97.07, "elapsed_time": "6 days, 18:05:20", "remaining_time": "4:53:58", "throughput": 2743.51, "total_tokens": 1600892384} {"current_steps": 8867, "total_steps": 9134, "loss": 0.9934, "learning_rate": 1.0534284226670077e-07, "epoch": 0.9706888530063768, "percentage": 97.08, "elapsed_time": "6 days, 18:06:24", "remaining_time": "4:52:52", "throughput": 2743.5, "total_tokens": 1601065088} {"current_steps": 8868, "total_steps": 9134, "loss": 0.9454, "learning_rate": 1.045557844472217e-07, "epoch": 0.9707983250773147, "percentage": 97.09, "elapsed_time": "6 days, 18:07:25", "remaining_time": "4:51:46", "throughput": 2743.49, "total_tokens": 1601226592} {"current_steps": 8869, "total_steps": 9134, "loss": 1.0661, "learning_rate": 1.0377167171120028e-07, "epoch": 0.9709077971482526, "percentage": 97.1, "elapsed_time": "6 days, 18:08:31", "remaining_time": "4:50:40", "throughput": 2743.52, "total_tokens": 1601423488} {"current_steps": 8870, "total_steps": 9134, "loss": 1.0512, "learning_rate": 1.0299050415139844e-07, "epoch": 0.9710172692191904, "percentage": 97.11, "elapsed_time": "6 days, 18:09:32", "remaining_time": "4:49:34", "throughput": 2743.52, "total_tokens": 1601592608} {"current_steps": 8871, "total_steps": 9134, "loss": 0.9743, "learning_rate": 1.022122818602228e-07, "epoch": 0.9711267412901283, "percentage": 97.12, "elapsed_time": "6 days, 18:10:33", "remaining_time": "4:48:29", "throughput": 2743.5, "total_tokens": 1601750080} {"current_steps": 8872, "total_steps": 9134, "loss": 1.4801, "learning_rate": 1.0143700492973862e-07, "epoch": 0.9712362133610662, "percentage": 97.13, "elapsed_time": "6 days, 18:11:40", "remaining_time": "4:47:23", "throughput": 2743.54, "total_tokens": 1601954368} {"current_steps": 8873, "total_steps": 9134, "loss": 0.9686, "learning_rate": 1.0066467345165864e-07, "epoch": 0.9713456854320042, "percentage": 97.14, "elapsed_time": "6 days, 18:12:45", "remaining_time": "4:46:17", "throughput": 2743.57, "total_tokens": 1602149472} {"current_steps": 8874, "total_steps": 9134, "loss": 0.9571, "learning_rate": 9.989528751734867e-08, "epoch": 0.9714551575029421, "percentage": 97.15, "elapsed_time": "6 days, 18:13:45", "remaining_time": "4:45:11", "throughput": 2743.56, "total_tokens": 1602308736} {"current_steps": 8875, "total_steps": 9134, "loss": 0.9825, "learning_rate": 9.912884721782478e-08, "epoch": 0.97156462957388, "percentage": 97.16, "elapsed_time": "6 days, 18:14:50", "remaining_time": "4:44:05", "throughput": 2743.56, "total_tokens": 1602486368} {"current_steps": 8876, "total_steps": 9134, "loss": 0.6396, "learning_rate": 9.836535264375613e-08, "epoch": 0.9716741016448178, "percentage": 97.18, "elapsed_time": "6 days, 18:15:54", "remaining_time": "4:42:59", "throughput": 2743.6, "total_tokens": 1602684832} {"current_steps": 8877, "total_steps": 9134, "loss": 1.0107, "learning_rate": 9.760480388546211e-08, "epoch": 0.9717835737157557, "percentage": 97.19, "elapsed_time": "6 days, 18:16:56", "remaining_time": "4:41:53", "throughput": 2743.62, "total_tokens": 1602867392} {"current_steps": 8878, "total_steps": 9134, "loss": 0.9433, "learning_rate": 9.684720103291522e-08, "epoch": 0.9718930457866937, "percentage": 97.2, "elapsed_time": "6 days, 18:18:02", "remaining_time": "4:40:47", "throughput": 2743.66, "total_tokens": 1603068768} {"current_steps": 8879, "total_steps": 9134, "loss": 0.8469, "learning_rate": 9.609254417573543e-08, "epoch": 0.9720025178576316, "percentage": 97.21, "elapsed_time": "6 days, 18:19:03", "remaining_time": "4:39:42", "throughput": 2743.65, "total_tokens": 1603235648} {"current_steps": 8880, "total_steps": 9134, "loss": 0.7047, "learning_rate": 9.534083340320132e-08, "epoch": 0.9721119899285695, "percentage": 97.22, "elapsed_time": "6 days, 18:20:04", "remaining_time": "4:38:36", "throughput": 2743.65, "total_tokens": 1603398944} {"current_steps": 8881, "total_steps": 9134, "loss": 0.8611, "learning_rate": 9.459206880423621e-08, "epoch": 0.9722214619995074, "percentage": 97.23, "elapsed_time": "6 days, 18:21:05", "remaining_time": "4:37:30", "throughput": 2743.66, "total_tokens": 1603575008} {"current_steps": 8882, "total_steps": 9134, "loss": 0.9154, "learning_rate": 9.384625046741924e-08, "epoch": 0.9723309340704452, "percentage": 97.24, "elapsed_time": "6 days, 18:22:09", "remaining_time": "4:36:24", "throughput": 2743.63, "total_tokens": 1603734944} {"current_steps": 8883, "total_steps": 9134, "loss": 1.0286, "learning_rate": 9.310337848097705e-08, "epoch": 0.9724404061413832, "percentage": 97.25, "elapsed_time": "6 days, 18:23:12", "remaining_time": "4:35:18", "throughput": 2743.64, "total_tokens": 1603910560} {"current_steps": 8884, "total_steps": 9134, "loss": 0.6788, "learning_rate": 9.236345293279492e-08, "epoch": 0.9725498782123211, "percentage": 97.26, "elapsed_time": "6 days, 18:24:16", "remaining_time": "4:34:12", "throughput": 2743.67, "total_tokens": 1604103200} {"current_steps": 8885, "total_steps": 9134, "loss": 0.8142, "learning_rate": 9.162647391039724e-08, "epoch": 0.972659350283259, "percentage": 97.27, "elapsed_time": "6 days, 18:25:22", "remaining_time": "4:33:06", "throughput": 2743.67, "total_tokens": 1604284640} {"current_steps": 8886, "total_steps": 9134, "loss": 0.8404, "learning_rate": 9.089244150097265e-08, "epoch": 0.9727688223541969, "percentage": 97.28, "elapsed_time": "6 days, 18:26:21", "remaining_time": "4:32:00", "throughput": 2743.65, "total_tokens": 1604438976} {"current_steps": 8887, "total_steps": 9134, "loss": 0.9308, "learning_rate": 9.016135579135165e-08, "epoch": 0.9728782944251347, "percentage": 97.3, "elapsed_time": "6 days, 18:27:26", "remaining_time": "4:30:54", "throughput": 2743.66, "total_tokens": 1604619520} {"current_steps": 8888, "total_steps": 9134, "loss": 0.8302, "learning_rate": 8.943321686802619e-08, "epoch": 0.9729877664960727, "percentage": 97.31, "elapsed_time": "6 days, 18:28:30", "remaining_time": "4:29:49", "throughput": 2743.69, "total_tokens": 1604815072} {"current_steps": 8889, "total_steps": 9134, "loss": 0.7656, "learning_rate": 8.870802481712736e-08, "epoch": 0.9730972385670106, "percentage": 97.32, "elapsed_time": "6 days, 18:29:33", "remaining_time": "4:28:43", "throughput": 2743.69, "total_tokens": 1604983520} {"current_steps": 8890, "total_steps": 9134, "loss": 0.853, "learning_rate": 8.798577972445043e-08, "epoch": 0.9732067106379485, "percentage": 97.33, "elapsed_time": "6 days, 18:30:38", "remaining_time": "4:27:37", "throughput": 2743.67, "total_tokens": 1605153984} {"current_steps": 8891, "total_steps": 9134, "loss": 0.9289, "learning_rate": 8.726648167542706e-08, "epoch": 0.9733161827088864, "percentage": 97.34, "elapsed_time": "6 days, 18:31:37", "remaining_time": "4:26:31", "throughput": 2743.63, "total_tokens": 1605291968} {"current_steps": 8892, "total_steps": 9134, "loss": 0.8955, "learning_rate": 8.65501307551586e-08, "epoch": 0.9734256547798243, "percentage": 97.35, "elapsed_time": "6 days, 18:32:42", "remaining_time": "4:25:25", "throughput": 2743.63, "total_tokens": 1605467808} {"current_steps": 8893, "total_steps": 9134, "loss": 1.1198, "learning_rate": 8.583672704838008e-08, "epoch": 0.9735351268507622, "percentage": 97.36, "elapsed_time": "6 days, 18:33:49", "remaining_time": "4:24:19", "throughput": 2743.66, "total_tokens": 1605672768} {"current_steps": 8894, "total_steps": 9134, "loss": 0.832, "learning_rate": 8.512627063949064e-08, "epoch": 0.9736445989217001, "percentage": 97.37, "elapsed_time": "6 days, 18:34:53", "remaining_time": "4:23:13", "throughput": 2743.68, "total_tokens": 1605858016} {"current_steps": 8895, "total_steps": 9134, "loss": 0.9512, "learning_rate": 8.441876161253414e-08, "epoch": 0.973754070992638, "percentage": 97.38, "elapsed_time": "6 days, 18:35:56", "remaining_time": "4:22:07", "throughput": 2743.68, "total_tokens": 1606034752} {"current_steps": 8896, "total_steps": 9134, "loss": 0.7818, "learning_rate": 8.371420005120756e-08, "epoch": 0.9738635430635759, "percentage": 97.39, "elapsed_time": "6 days, 18:37:02", "remaining_time": "4:21:02", "throughput": 2743.7, "total_tokens": 1606222912} {"current_steps": 8897, "total_steps": 9134, "loss": 0.6377, "learning_rate": 8.301258603885808e-08, "epoch": 0.9739730151345138, "percentage": 97.41, "elapsed_time": "6 days, 18:38:07", "remaining_time": "4:19:56", "throughput": 2743.71, "total_tokens": 1606407040} {"current_steps": 8898, "total_steps": 9134, "loss": 0.9861, "learning_rate": 8.231391965848601e-08, "epoch": 0.9740824872054518, "percentage": 97.42, "elapsed_time": "6 days, 18:39:08", "remaining_time": "4:18:50", "throughput": 2743.72, "total_tokens": 1606579296} {"current_steps": 8899, "total_steps": 9134, "loss": 0.9617, "learning_rate": 8.161820099274464e-08, "epoch": 0.9741919592763896, "percentage": 97.43, "elapsed_time": "6 days, 18:40:14", "remaining_time": "4:17:44", "throughput": 2743.75, "total_tokens": 1606779776} {"current_steps": 8900, "total_steps": 9134, "loss": 0.9095, "learning_rate": 8.092543012393483e-08, "epoch": 0.9743014313473275, "percentage": 97.44, "elapsed_time": "6 days, 18:41:16", "remaining_time": "4:16:38", "throughput": 2743.75, "total_tokens": 1606950464} {"current_steps": 8901, "total_steps": 9134, "loss": 0.9943, "learning_rate": 8.023560713400769e-08, "epoch": 0.9744109034182654, "percentage": 97.45, "elapsed_time": "6 days, 18:42:16", "remaining_time": "4:15:32", "throughput": 2743.69, "total_tokens": 1607079040} {"current_steps": 8902, "total_steps": 9134, "loss": 0.9535, "learning_rate": 7.954873210457015e-08, "epoch": 0.9745203754892033, "percentage": 97.46, "elapsed_time": "6 days, 18:43:22", "remaining_time": "4:14:26", "throughput": 2743.74, "total_tokens": 1607285792} {"current_steps": 8903, "total_steps": 9134, "loss": 0.8621, "learning_rate": 7.886480511687666e-08, "epoch": 0.9746298475601413, "percentage": 97.47, "elapsed_time": "6 days, 18:44:23", "remaining_time": "4:13:20", "throughput": 2743.74, "total_tokens": 1607454912} {"current_steps": 8904, "total_steps": 9134, "loss": 1.0413, "learning_rate": 7.81838262518375e-08, "epoch": 0.9747393196310791, "percentage": 97.48, "elapsed_time": "6 days, 18:45:29", "remaining_time": "4:12:15", "throughput": 2743.77, "total_tokens": 1607654496} {"current_steps": 8905, "total_steps": 9134, "loss": 1.0182, "learning_rate": 7.75057955900077e-08, "epoch": 0.974848791702017, "percentage": 97.49, "elapsed_time": "6 days, 18:46:33", "remaining_time": "4:11:09", "throughput": 2743.77, "total_tokens": 1607828768} {"current_steps": 8906, "total_steps": 9134, "loss": 0.7526, "learning_rate": 7.683071321160085e-08, "epoch": 0.9749582637729549, "percentage": 97.5, "elapsed_time": "6 days, 18:47:37", "remaining_time": "4:10:03", "throughput": 2743.77, "total_tokens": 1608007744} {"current_steps": 8907, "total_steps": 9134, "loss": 1.0368, "learning_rate": 7.615857919647252e-08, "epoch": 0.9750677358438928, "percentage": 97.51, "elapsed_time": "6 days, 18:48:45", "remaining_time": "4:08:57", "throughput": 2743.78, "total_tokens": 1608198144} {"current_steps": 8908, "total_steps": 9134, "loss": 0.9094, "learning_rate": 7.548939362414243e-08, "epoch": 0.9751772079148308, "percentage": 97.53, "elapsed_time": "6 days, 18:49:47", "remaining_time": "4:07:51", "throughput": 2743.78, "total_tokens": 1608370848} {"current_steps": 8909, "total_steps": 9134, "loss": 1.0805, "learning_rate": 7.482315657376394e-08, "epoch": 0.9752866799857687, "percentage": 97.54, "elapsed_time": "6 days, 18:50:52", "remaining_time": "4:06:46", "throughput": 2743.81, "total_tokens": 1608565056} {"current_steps": 8910, "total_steps": 9134, "loss": 1.0569, "learning_rate": 7.41598681241601e-08, "epoch": 0.9753961520567065, "percentage": 97.55, "elapsed_time": "6 days, 18:51:57", "remaining_time": "4:05:40", "throughput": 2743.85, "total_tokens": 1608769568} {"current_steps": 8911, "total_steps": 9134, "loss": 1.0158, "learning_rate": 7.349952835379592e-08, "epoch": 0.9755056241276444, "percentage": 97.56, "elapsed_time": "6 days, 18:53:04", "remaining_time": "4:04:34", "throughput": 2743.87, "total_tokens": 1608961088} {"current_steps": 8912, "total_steps": 9134, "loss": 0.9854, "learning_rate": 7.284213734078394e-08, "epoch": 0.9756150961985823, "percentage": 97.57, "elapsed_time": "6 days, 18:54:08", "remaining_time": "4:03:28", "throughput": 2743.89, "total_tokens": 1609147008} {"current_steps": 8913, "total_steps": 9134, "loss": 0.9069, "learning_rate": 7.218769516289247e-08, "epoch": 0.9757245682695203, "percentage": 97.58, "elapsed_time": "6 days, 18:55:14", "remaining_time": "4:02:22", "throughput": 2743.91, "total_tokens": 1609344576} {"current_steps": 8914, "total_steps": 9134, "loss": 0.8174, "learning_rate": 7.153620189754573e-08, "epoch": 0.9758340403404582, "percentage": 97.59, "elapsed_time": "6 days, 18:56:20", "remaining_time": "4:01:16", "throughput": 2743.94, "total_tokens": 1609543040} {"current_steps": 8915, "total_steps": 9134, "loss": 0.9677, "learning_rate": 7.088765762180982e-08, "epoch": 0.9759435124113961, "percentage": 97.6, "elapsed_time": "6 days, 18:57:24", "remaining_time": "4:00:11", "throughput": 2743.95, "total_tokens": 1609726048} {"current_steps": 8916, "total_steps": 9134, "loss": 0.8634, "learning_rate": 7.024206241240671e-08, "epoch": 0.9760529844823339, "percentage": 97.61, "elapsed_time": "6 days, 18:58:30", "remaining_time": "3:59:05", "throughput": 2743.96, "total_tokens": 1609911520} {"current_steps": 8917, "total_steps": 9134, "loss": 1.1983, "learning_rate": 6.959941634571143e-08, "epoch": 0.9761624565532718, "percentage": 97.62, "elapsed_time": "6 days, 18:59:32", "remaining_time": "3:57:59", "throughput": 2743.99, "total_tokens": 1610100128} {"current_steps": 8918, "total_steps": 9134, "loss": 0.7806, "learning_rate": 6.895971949774649e-08, "epoch": 0.9762719286242098, "percentage": 97.64, "elapsed_time": "6 days, 19:00:32", "remaining_time": "3:56:53", "throughput": 2743.99, "total_tokens": 1610260288} {"current_steps": 8919, "total_steps": 9134, "loss": 0.8743, "learning_rate": 6.832297194418746e-08, "epoch": 0.9763814006951477, "percentage": 97.65, "elapsed_time": "6 days, 19:01:38", "remaining_time": "3:55:47", "throughput": 2744.01, "total_tokens": 1610456960} {"current_steps": 8920, "total_steps": 9134, "loss": 0.9147, "learning_rate": 6.768917376035744e-08, "epoch": 0.9764908727660856, "percentage": 97.66, "elapsed_time": "6 days, 19:02:45", "remaining_time": "3:54:41", "throughput": 2743.99, "total_tokens": 1610629888} {"current_steps": 8921, "total_steps": 9134, "loss": 0.8439, "learning_rate": 6.70583250212381e-08, "epoch": 0.9766003448370234, "percentage": 97.67, "elapsed_time": "6 days, 19:03:48", "remaining_time": "3:53:36", "throughput": 2743.99, "total_tokens": 1610801248} {"current_steps": 8922, "total_steps": 9134, "loss": 1.0172, "learning_rate": 6.643042580145309e-08, "epoch": 0.9767098169079613, "percentage": 97.68, "elapsed_time": "6 days, 19:04:54", "remaining_time": "3:52:30", "throughput": 2744.03, "total_tokens": 1611002624} {"current_steps": 8923, "total_steps": 9134, "loss": 1.2454, "learning_rate": 6.580547617528465e-08, "epoch": 0.9768192889788992, "percentage": 97.69, "elapsed_time": "6 days, 19:05:59", "remaining_time": "3:51:24", "throughput": 2744.05, "total_tokens": 1611194592} {"current_steps": 8924, "total_steps": 9134, "loss": 0.8735, "learning_rate": 6.518347621666255e-08, "epoch": 0.9769287610498372, "percentage": 97.7, "elapsed_time": "6 days, 19:07:04", "remaining_time": "3:50:18", "throughput": 2744.06, "total_tokens": 1611380736} {"current_steps": 8925, "total_steps": 9134, "loss": 0.8455, "learning_rate": 6.456442599916679e-08, "epoch": 0.9770382331207751, "percentage": 97.71, "elapsed_time": "6 days, 19:08:07", "remaining_time": "3:49:12", "throughput": 2744.06, "total_tokens": 1611552768} {"current_steps": 8926, "total_steps": 9134, "loss": 0.7613, "learning_rate": 6.394832559603048e-08, "epoch": 0.977147705191713, "percentage": 97.72, "elapsed_time": "6 days, 19:09:04", "remaining_time": "3:48:06", "throughput": 2744.04, "total_tokens": 1611695008} {"current_steps": 8927, "total_steps": 9134, "loss": 1.1046, "learning_rate": 6.333517508013975e-08, "epoch": 0.9772571772626508, "percentage": 97.73, "elapsed_time": "6 days, 19:10:11", "remaining_time": "3:47:00", "throughput": 2744.06, "total_tokens": 1611891008} {"current_steps": 8928, "total_steps": 9134, "loss": 0.8751, "learning_rate": 6.272497452402548e-08, "epoch": 0.9773666493335887, "percentage": 97.74, "elapsed_time": "6 days, 19:11:12", "remaining_time": "3:45:55", "throughput": 2744.06, "total_tokens": 1612056320} {"current_steps": 8929, "total_steps": 9134, "loss": 0.88, "learning_rate": 6.211772399987715e-08, "epoch": 0.9774761214045267, "percentage": 97.76, "elapsed_time": "6 days, 19:12:15", "remaining_time": "3:44:49", "throughput": 2744.07, "total_tokens": 1612241120} {"current_steps": 8930, "total_steps": 9134, "loss": 1.1554, "learning_rate": 6.151342357952617e-08, "epoch": 0.9775855934754646, "percentage": 97.77, "elapsed_time": "6 days, 19:13:19", "remaining_time": "3:43:43", "throughput": 2744.07, "total_tokens": 1612416288} {"current_steps": 8931, "total_steps": 9134, "loss": 1.2414, "learning_rate": 6.091207333446259e-08, "epoch": 0.9776950655464025, "percentage": 97.78, "elapsed_time": "6 days, 19:14:18", "remaining_time": "3:42:37", "throughput": 2744.06, "total_tokens": 1612573760} {"current_steps": 8932, "total_steps": 9134, "loss": 0.9695, "learning_rate": 6.031367333582949e-08, "epoch": 0.9778045376173404, "percentage": 97.79, "elapsed_time": "6 days, 19:15:22", "remaining_time": "3:41:31", "throughput": 2744.03, "total_tokens": 1612730112} {"current_steps": 8933, "total_steps": 9134, "loss": 0.6102, "learning_rate": 5.971822365440639e-08, "epoch": 0.9779140096882782, "percentage": 97.8, "elapsed_time": "6 days, 19:16:26", "remaining_time": "3:40:25", "throughput": 2744.02, "total_tokens": 1612899456} {"current_steps": 8934, "total_steps": 9134, "loss": 1.0883, "learning_rate": 5.912572436064523e-08, "epoch": 0.9780234817592162, "percentage": 97.81, "elapsed_time": "6 days, 19:17:30", "remaining_time": "3:39:19", "throughput": 2744.02, "total_tokens": 1613075968} {"current_steps": 8935, "total_steps": 9134, "loss": 0.6987, "learning_rate": 5.853617552462887e-08, "epoch": 0.9781329538301541, "percentage": 97.82, "elapsed_time": "6 days, 19:18:31", "remaining_time": "3:38:13", "throughput": 2744.0, "total_tokens": 1613227392} {"current_steps": 8936, "total_steps": 9134, "loss": 0.7384, "learning_rate": 5.794957721610428e-08, "epoch": 0.978242425901092, "percentage": 97.83, "elapsed_time": "6 days, 19:19:34", "remaining_time": "3:37:08", "throughput": 2744.0, "total_tokens": 1613399200} {"current_steps": 8937, "total_steps": 9134, "loss": 1.0244, "learning_rate": 5.7365929504460404e-08, "epoch": 0.9783518979720299, "percentage": 97.84, "elapsed_time": "6 days, 19:20:34", "remaining_time": "3:36:02", "throughput": 2744.0, "total_tokens": 1613564960} {"current_steps": 8938, "total_steps": 9134, "loss": 0.9379, "learning_rate": 5.678523245874756e-08, "epoch": 0.9784613700429677, "percentage": 97.85, "elapsed_time": "6 days, 19:21:39", "remaining_time": "3:34:56", "throughput": 2744.02, "total_tokens": 1613755136} {"current_steps": 8939, "total_steps": 9134, "loss": 0.9636, "learning_rate": 5.620748614765803e-08, "epoch": 0.9785708421139057, "percentage": 97.87, "elapsed_time": "6 days, 19:22:41", "remaining_time": "3:33:50", "throughput": 2744.02, "total_tokens": 1613927616} {"current_steps": 8940, "total_steps": 9134, "loss": 0.8928, "learning_rate": 5.563269063953991e-08, "epoch": 0.9786803141848436, "percentage": 97.88, "elapsed_time": "6 days, 19:23:49", "remaining_time": "3:32:44", "throughput": 2744.06, "total_tokens": 1614135712} {"current_steps": 8941, "total_steps": 9134, "loss": 0.6238, "learning_rate": 5.506084600238881e-08, "epoch": 0.9787897862557815, "percentage": 97.89, "elapsed_time": "6 days, 19:24:52", "remaining_time": "3:31:38", "throughput": 2744.08, "total_tokens": 1614321408} {"current_steps": 8942, "total_steps": 9134, "loss": 1.0358, "learning_rate": 5.4491952303850624e-08, "epoch": 0.9788992583267194, "percentage": 97.9, "elapsed_time": "6 days, 19:25:53", "remaining_time": "3:30:32", "throughput": 2744.07, "total_tokens": 1614481344} {"current_steps": 8943, "total_steps": 9134, "loss": 1.0387, "learning_rate": 5.392600961122707e-08, "epoch": 0.9790087303976573, "percentage": 97.91, "elapsed_time": "6 days, 19:26:59", "remaining_time": "3:29:27", "throughput": 2744.09, "total_tokens": 1614679808} {"current_steps": 8944, "total_steps": 9134, "loss": 0.7523, "learning_rate": 5.3363017991470145e-08, "epoch": 0.9791182024685952, "percentage": 97.92, "elapsed_time": "6 days, 19:28:01", "remaining_time": "3:28:21", "throughput": 2744.09, "total_tokens": 1614847360} {"current_steps": 8945, "total_steps": 9134, "loss": 1.0129, "learning_rate": 5.280297751117658e-08, "epoch": 0.9792276745395331, "percentage": 97.93, "elapsed_time": "6 days, 19:29:07", "remaining_time": "3:27:15", "throughput": 2744.12, "total_tokens": 1615044032} {"current_steps": 8946, "total_steps": 9134, "loss": 0.9199, "learning_rate": 5.224588823659893e-08, "epoch": 0.979337146610471, "percentage": 97.94, "elapsed_time": "6 days, 19:30:11", "remaining_time": "3:26:09", "throughput": 2744.14, "total_tokens": 1615236448} {"current_steps": 8947, "total_steps": 9134, "loss": 0.9877, "learning_rate": 5.169175023364003e-08, "epoch": 0.9794466186814089, "percentage": 97.95, "elapsed_time": "6 days, 19:31:18", "remaining_time": "3:25:03", "throughput": 2744.21, "total_tokens": 1615457536} {"current_steps": 8948, "total_steps": 9134, "loss": 0.8683, "learning_rate": 5.114056356785857e-08, "epoch": 0.9795560907523468, "percentage": 97.96, "elapsed_time": "6 days, 19:32:18", "remaining_time": "3:23:57", "throughput": 2744.18, "total_tokens": 1615602912} {"current_steps": 8949, "total_steps": 9134, "loss": 0.9934, "learning_rate": 5.05923283044496e-08, "epoch": 0.9796655628232848, "percentage": 97.97, "elapsed_time": "6 days, 19:33:19", "remaining_time": "3:22:52", "throughput": 2744.18, "total_tokens": 1615769568} {"current_steps": 8950, "total_steps": 9134, "loss": 0.743, "learning_rate": 5.004704450827513e-08, "epoch": 0.9797750348942226, "percentage": 97.99, "elapsed_time": "6 days, 19:34:23", "remaining_time": "3:21:46", "throughput": 2744.19, "total_tokens": 1615955936} {"current_steps": 8951, "total_steps": 9134, "loss": 0.9042, "learning_rate": 4.9504712243839126e-08, "epoch": 0.9798845069651605, "percentage": 98.0, "elapsed_time": "6 days, 19:35:29", "remaining_time": "3:20:40", "throughput": 2744.24, "total_tokens": 1616162240} {"current_steps": 8952, "total_steps": 9134, "loss": 0.9349, "learning_rate": 4.896533157529859e-08, "epoch": 0.9799939790360984, "percentage": 98.01, "elapsed_time": "6 days, 19:36:36", "remaining_time": "3:19:34", "throughput": 2744.24, "total_tokens": 1616347712} {"current_steps": 8953, "total_steps": 9134, "loss": 0.8569, "learning_rate": 4.842890256646082e-08, "epoch": 0.9801034511070363, "percentage": 98.02, "elapsed_time": "6 days, 19:37:37", "remaining_time": "3:18:28", "throughput": 2744.21, "total_tokens": 1616497120} {"current_steps": 8954, "total_steps": 9134, "loss": 1.0539, "learning_rate": 4.789542528078339e-08, "epoch": 0.9802129231779743, "percentage": 98.03, "elapsed_time": "6 days, 19:38:37", "remaining_time": "3:17:22", "throughput": 2744.18, "total_tokens": 1616643168} {"current_steps": 8955, "total_steps": 9134, "loss": 0.8197, "learning_rate": 4.73648997813797e-08, "epoch": 0.9803223952489121, "percentage": 98.04, "elapsed_time": "6 days, 19:39:40", "remaining_time": "3:16:17", "throughput": 2744.16, "total_tokens": 1616805120} {"current_steps": 8956, "total_steps": 9134, "loss": 1.0513, "learning_rate": 4.6837326131002336e-08, "epoch": 0.98043186731985, "percentage": 98.05, "elapsed_time": "6 days, 19:40:46", "remaining_time": "3:15:11", "throughput": 2744.19, "total_tokens": 1617007616} {"current_steps": 8957, "total_steps": 9134, "loss": 1.0188, "learning_rate": 4.63127043920708e-08, "epoch": 0.9805413393907879, "percentage": 98.06, "elapsed_time": "6 days, 19:41:48", "remaining_time": "3:14:05", "throughput": 2744.18, "total_tokens": 1617166208} {"current_steps": 8958, "total_steps": 9134, "loss": 1.1022, "learning_rate": 4.579103462664103e-08, "epoch": 0.9806508114617258, "percentage": 98.07, "elapsed_time": "6 days, 19:42:52", "remaining_time": "3:12:59", "throughput": 2744.18, "total_tokens": 1617345856} {"current_steps": 8959, "total_steps": 9134, "loss": 1.048, "learning_rate": 4.52723168964303e-08, "epoch": 0.9807602835326638, "percentage": 98.08, "elapsed_time": "6 days, 19:43:57", "remaining_time": "3:11:53", "throughput": 2744.18, "total_tokens": 1617523712} {"current_steps": 8960, "total_steps": 9134, "loss": 0.6062, "learning_rate": 4.4756551262795096e-08, "epoch": 0.9808697556036017, "percentage": 98.1, "elapsed_time": "6 days, 19:44:59", "remaining_time": "3:10:47", "throughput": 2744.2, "total_tokens": 1617704480} {"current_steps": 8961, "total_steps": 9134, "loss": 0.794, "learning_rate": 4.424373778675606e-08, "epoch": 0.9809792276745395, "percentage": 98.11, "elapsed_time": "6 days, 19:46:00", "remaining_time": "3:09:41", "throughput": 2744.17, "total_tokens": 1617854112} {"current_steps": 8962, "total_steps": 9134, "loss": 0.8626, "learning_rate": 4.373387652897576e-08, "epoch": 0.9810886997454774, "percentage": 98.12, "elapsed_time": "6 days, 19:47:03", "remaining_time": "3:08:36", "throughput": 2744.18, "total_tokens": 1618029952} {"current_steps": 8963, "total_steps": 9134, "loss": 0.8156, "learning_rate": 4.3226967549769845e-08, "epoch": 0.9811981718164153, "percentage": 98.13, "elapsed_time": "6 days, 19:48:06", "remaining_time": "3:07:30", "throughput": 2744.21, "total_tokens": 1618221920} {"current_steps": 8964, "total_steps": 9134, "loss": 1.0326, "learning_rate": 4.2723010909104244e-08, "epoch": 0.9813076438873533, "percentage": 98.14, "elapsed_time": "6 days, 19:49:13", "remaining_time": "3:06:24", "throughput": 2744.24, "total_tokens": 1618427328} {"current_steps": 8965, "total_steps": 9134, "loss": 0.8037, "learning_rate": 4.222200666659515e-08, "epoch": 0.9814171159582912, "percentage": 98.15, "elapsed_time": "6 days, 19:50:17", "remaining_time": "3:05:18", "throughput": 2744.26, "total_tokens": 1618609888} {"current_steps": 8966, "total_steps": 9134, "loss": 1.0293, "learning_rate": 4.1723954881511816e-08, "epoch": 0.9815265880292291, "percentage": 98.16, "elapsed_time": "6 days, 19:51:22", "remaining_time": "3:04:12", "throughput": 2744.25, "total_tokens": 1618783936} {"current_steps": 8967, "total_steps": 9134, "loss": 0.9095, "learning_rate": 4.122885561277101e-08, "epoch": 0.9816360601001669, "percentage": 98.17, "elapsed_time": "6 days, 19:52:27", "remaining_time": "3:03:07", "throughput": 2744.27, "total_tokens": 1618977696} {"current_steps": 8968, "total_steps": 9134, "loss": 0.886, "learning_rate": 4.073670891894532e-08, "epoch": 0.9817455321711048, "percentage": 98.18, "elapsed_time": "6 days, 19:53:35", "remaining_time": "3:02:01", "throughput": 2744.3, "total_tokens": 1619176832} {"current_steps": 8969, "total_steps": 9134, "loss": 0.9492, "learning_rate": 4.0247514858252065e-08, "epoch": 0.9818550042420428, "percentage": 98.19, "elapsed_time": "6 days, 19:54:38", "remaining_time": "3:00:55", "throughput": 2744.29, "total_tokens": 1619348416} {"current_steps": 8970, "total_steps": 9134, "loss": 0.7255, "learning_rate": 3.97612734885644e-08, "epoch": 0.9819644763129807, "percentage": 98.2, "elapsed_time": "6 days, 19:55:45", "remaining_time": "2:59:49", "throughput": 2744.32, "total_tokens": 1619550464} {"current_steps": 8971, "total_steps": 9134, "loss": 0.8936, "learning_rate": 3.9277984867400196e-08, "epoch": 0.9820739483839186, "percentage": 98.22, "elapsed_time": "6 days, 19:56:48", "remaining_time": "2:58:43", "throughput": 2744.31, "total_tokens": 1619718016} {"current_steps": 8972, "total_steps": 9134, "loss": 0.9367, "learning_rate": 3.879764905193595e-08, "epoch": 0.9821834204548564, "percentage": 98.23, "elapsed_time": "6 days, 19:57:55", "remaining_time": "2:57:38", "throughput": 2744.34, "total_tokens": 1619916480} {"current_steps": 8973, "total_steps": 9134, "loss": 0.8873, "learning_rate": 3.832026609899009e-08, "epoch": 0.9822928925257943, "percentage": 98.24, "elapsed_time": "6 days, 19:59:02", "remaining_time": "2:56:32", "throughput": 2744.33, "total_tokens": 1620096128} {"current_steps": 8974, "total_steps": 9134, "loss": 0.8523, "learning_rate": 3.7845836065039664e-08, "epoch": 0.9824023645967322, "percentage": 98.25, "elapsed_time": "6 days, 20:00:06", "remaining_time": "2:55:26", "throughput": 2744.34, "total_tokens": 1620272640} {"current_steps": 8975, "total_steps": 9134, "loss": 1.1305, "learning_rate": 3.737435900620645e-08, "epoch": 0.9825118366676702, "percentage": 98.26, "elapsed_time": "6 days, 20:01:08", "remaining_time": "2:54:20", "throughput": 2744.32, "total_tokens": 1620433024} {"current_steps": 8976, "total_steps": 9134, "loss": 0.789, "learning_rate": 3.690583497826528e-08, "epoch": 0.9826213087386081, "percentage": 98.27, "elapsed_time": "6 days, 20:02:10", "remaining_time": "2:53:14", "throughput": 2744.28, "total_tokens": 1620584000} {"current_steps": 8977, "total_steps": 9134, "loss": 1.2681, "learning_rate": 3.644026403664402e-08, "epoch": 0.982730780809546, "percentage": 98.28, "elapsed_time": "6 days, 20:03:15", "remaining_time": "2:52:09", "throughput": 2744.31, "total_tokens": 1620780448} {"current_steps": 8978, "total_steps": 9134, "loss": 0.8091, "learning_rate": 3.5977646236415306e-08, "epoch": 0.9828402528804838, "percentage": 98.29, "elapsed_time": "6 days, 20:04:17", "remaining_time": "2:51:03", "throughput": 2744.32, "total_tokens": 1620955392} {"current_steps": 8979, "total_steps": 9134, "loss": 0.792, "learning_rate": 3.551798163231035e-08, "epoch": 0.9829497249514217, "percentage": 98.3, "elapsed_time": "6 days, 20:05:17", "remaining_time": "2:49:57", "throughput": 2744.32, "total_tokens": 1621118016} {"current_steps": 8980, "total_steps": 9134, "loss": 0.8992, "learning_rate": 3.506127027870232e-08, "epoch": 0.9830591970223597, "percentage": 98.31, "elapsed_time": "6 days, 20:06:21", "remaining_time": "2:48:51", "throughput": 2744.33, "total_tokens": 1621302144} {"current_steps": 8981, "total_steps": 9134, "loss": 0.9606, "learning_rate": 3.4607512229622993e-08, "epoch": 0.9831686690932976, "percentage": 98.32, "elapsed_time": "6 days, 20:07:26", "remaining_time": "2:47:45", "throughput": 2744.37, "total_tokens": 1621499264} {"current_steps": 8982, "total_steps": 9134, "loss": 0.9206, "learning_rate": 3.415670753874889e-08, "epoch": 0.9832781411642355, "percentage": 98.34, "elapsed_time": "6 days, 20:08:33", "remaining_time": "2:46:39", "throughput": 2744.39, "total_tokens": 1621696384} {"current_steps": 8983, "total_steps": 9134, "loss": 1.0507, "learning_rate": 3.370885625940956e-08, "epoch": 0.9833876132351734, "percentage": 98.35, "elapsed_time": "6 days, 20:09:37", "remaining_time": "2:45:34", "throughput": 2744.42, "total_tokens": 1621890144} {"current_steps": 8984, "total_steps": 9134, "loss": 0.7291, "learning_rate": 3.3263958444582076e-08, "epoch": 0.9834970853061112, "percentage": 98.36, "elapsed_time": "6 days, 20:10:41", "remaining_time": "2:44:28", "throughput": 2744.43, "total_tokens": 1622071808} {"current_steps": 8985, "total_steps": 9134, "loss": 1.017, "learning_rate": 3.2822014146902114e-08, "epoch": 0.9836065573770492, "percentage": 98.37, "elapsed_time": "6 days, 20:11:44", "remaining_time": "2:43:22", "throughput": 2744.42, "total_tokens": 1622241376} {"current_steps": 8986, "total_steps": 9134, "loss": 1.0597, "learning_rate": 3.2383023418650074e-08, "epoch": 0.9837160294479871, "percentage": 98.38, "elapsed_time": "6 days, 20:12:50", "remaining_time": "2:42:16", "throughput": 2744.46, "total_tokens": 1622440288} {"current_steps": 8987, "total_steps": 9134, "loss": 1.0105, "learning_rate": 3.1946986311756634e-08, "epoch": 0.983825501518925, "percentage": 98.39, "elapsed_time": "6 days, 20:13:55", "remaining_time": "2:41:10", "throughput": 2744.47, "total_tokens": 1622629792} {"current_steps": 8988, "total_steps": 9134, "loss": 1.0486, "learning_rate": 3.151390287780276e-08, "epoch": 0.9839349735898629, "percentage": 98.4, "elapsed_time": "6 days, 20:15:01", "remaining_time": "2:40:05", "throughput": 2744.48, "total_tokens": 1622814592} {"current_steps": 8989, "total_steps": 9134, "loss": 0.9022, "learning_rate": 3.108377316801969e-08, "epoch": 0.9840444456608007, "percentage": 98.41, "elapsed_time": "6 days, 20:16:05", "remaining_time": "2:38:59", "throughput": 2744.51, "total_tokens": 1623006560} {"current_steps": 8990, "total_steps": 9134, "loss": 1.0511, "learning_rate": 3.065659723329728e-08, "epoch": 0.9841539177317387, "percentage": 98.42, "elapsed_time": "6 days, 20:17:08", "remaining_time": "2:37:53", "throughput": 2744.52, "total_tokens": 1623185088} {"current_steps": 8991, "total_steps": 9134, "loss": 0.7805, "learning_rate": 3.023237512416455e-08, "epoch": 0.9842633898026766, "percentage": 98.43, "elapsed_time": "6 days, 20:18:09", "remaining_time": "2:36:47", "throughput": 2744.5, "total_tokens": 1623339872} {"current_steps": 8992, "total_steps": 9134, "loss": 1.0692, "learning_rate": 2.981110689080913e-08, "epoch": 0.9843728618736145, "percentage": 98.45, "elapsed_time": "6 days, 20:19:16", "remaining_time": "2:35:41", "throughput": 2744.54, "total_tokens": 1623551552} {"current_steps": 8993, "total_steps": 9134, "loss": 1.0629, "learning_rate": 2.9392792583066154e-08, "epoch": 0.9844823339445524, "percentage": 98.46, "elapsed_time": "6 days, 20:20:24", "remaining_time": "2:34:35", "throughput": 2744.56, "total_tokens": 1623748896} {"current_steps": 8994, "total_steps": 9134, "loss": 1.0581, "learning_rate": 2.8977432250418267e-08, "epoch": 0.9845918060154903, "percentage": 98.47, "elapsed_time": "6 days, 20:21:29", "remaining_time": "2:33:30", "throughput": 2744.56, "total_tokens": 1623929664} {"current_steps": 8995, "total_steps": 9134, "loss": 0.9712, "learning_rate": 2.8565025942001166e-08, "epoch": 0.9847012780864282, "percentage": 98.48, "elapsed_time": "6 days, 20:22:31", "remaining_time": "2:32:24", "throughput": 2744.56, "total_tokens": 1624095648} {"current_steps": 8996, "total_steps": 9134, "loss": 0.9379, "learning_rate": 2.8155573706609152e-08, "epoch": 0.9848107501573661, "percentage": 98.49, "elapsed_time": "6 days, 20:23:38", "remaining_time": "2:31:18", "throughput": 2744.58, "total_tokens": 1624291200} {"current_steps": 8997, "total_steps": 9134, "loss": 0.6978, "learning_rate": 2.7749075592670148e-08, "epoch": 0.984920222228304, "percentage": 98.5, "elapsed_time": "6 days, 20:24:40", "remaining_time": "2:30:12", "throughput": 2744.55, "total_tokens": 1624448224} {"current_steps": 8998, "total_steps": 9134, "loss": 0.9129, "learning_rate": 2.734553164827902e-08, "epoch": 0.9850296942992419, "percentage": 98.51, "elapsed_time": "6 days, 20:25:45", "remaining_time": "2:29:06", "throughput": 2744.56, "total_tokens": 1624633024} {"current_steps": 8999, "total_steps": 9134, "loss": 0.8035, "learning_rate": 2.6944941921172585e-08, "epoch": 0.9851391663701798, "percentage": 98.52, "elapsed_time": "6 days, 20:26:49", "remaining_time": "2:28:01", "throughput": 2744.58, "total_tokens": 1624819840} {"current_steps": 9000, "total_steps": 9134, "loss": 1.0822, "learning_rate": 2.654730645873793e-08, "epoch": 0.9852486384411178, "percentage": 98.53, "elapsed_time": "6 days, 20:27:53", "remaining_time": "2:26:55", "throughput": 2744.54, "total_tokens": 1624968800} {"current_steps": 9001, "total_steps": 9134, "loss": 0.8484, "learning_rate": 2.6152625308015212e-08, "epoch": 0.9853581105120556, "percentage": 98.54, "elapsed_time": "6 days, 20:28:58", "remaining_time": "2:25:49", "throughput": 2744.57, "total_tokens": 1625164352} {"current_steps": 9002, "total_steps": 9134, "loss": 0.8313, "learning_rate": 2.576089851569763e-08, "epoch": 0.9854675825829935, "percentage": 98.55, "elapsed_time": "6 days, 20:30:02", "remaining_time": "2:24:43", "throughput": 2744.55, "total_tokens": 1625326304} {"current_steps": 9003, "total_steps": 9134, "loss": 1.1665, "learning_rate": 2.5372126128120345e-08, "epoch": 0.9855770546539314, "percentage": 98.57, "elapsed_time": "6 days, 20:31:07", "remaining_time": "2:23:37", "throughput": 2744.59, "total_tokens": 1625534176} {"current_steps": 9004, "total_steps": 9134, "loss": 0.9605, "learning_rate": 2.4986308191277118e-08, "epoch": 0.9856865267248693, "percentage": 98.58, "elapsed_time": "6 days, 20:32:12", "remaining_time": "2:22:32", "throughput": 2744.63, "total_tokens": 1625736672} {"current_steps": 9005, "total_steps": 9134, "loss": 0.7496, "learning_rate": 2.4603444750811998e-08, "epoch": 0.9857959987958073, "percentage": 98.59, "elapsed_time": "6 days, 20:33:12", "remaining_time": "2:21:26", "throughput": 2744.61, "total_tokens": 1625883840} {"current_steps": 9006, "total_steps": 9134, "loss": 0.7944, "learning_rate": 2.4223535852010983e-08, "epoch": 0.9859054708667451, "percentage": 98.6, "elapsed_time": "6 days, 20:34:13", "remaining_time": "2:20:20", "throughput": 2744.6, "total_tokens": 1626046240} {"current_steps": 9007, "total_steps": 9134, "loss": 0.8618, "learning_rate": 2.384658153982422e-08, "epoch": 0.986014942937683, "percentage": 98.61, "elapsed_time": "6 days, 20:35:18", "remaining_time": "2:19:14", "throughput": 2744.63, "total_tokens": 1626240224} {"current_steps": 9008, "total_steps": 9134, "loss": 1.0287, "learning_rate": 2.347258185883827e-08, "epoch": 0.9861244150086209, "percentage": 98.62, "elapsed_time": "6 days, 20:36:22", "remaining_time": "2:18:08", "throughput": 2744.64, "total_tokens": 1626426144} {"current_steps": 9009, "total_steps": 9134, "loss": 0.7897, "learning_rate": 2.31015368532983e-08, "epoch": 0.9862338870795588, "percentage": 98.63, "elapsed_time": "6 days, 20:37:24", "remaining_time": "2:17:02", "throughput": 2744.62, "total_tokens": 1626586976} {"current_steps": 9010, "total_steps": 9134, "loss": 0.9115, "learning_rate": 2.2733446567099747e-08, "epoch": 0.9863433591504968, "percentage": 98.64, "elapsed_time": "6 days, 20:38:27", "remaining_time": "2:15:57", "throughput": 2744.62, "total_tokens": 1626755872} {"current_steps": 9011, "total_steps": 9134, "loss": 0.6701, "learning_rate": 2.236831104378556e-08, "epoch": 0.9864528312214347, "percentage": 98.65, "elapsed_time": "6 days, 20:39:30", "remaining_time": "2:14:51", "throughput": 2744.64, "total_tokens": 1626938432} {"current_steps": 9012, "total_steps": 9134, "loss": 0.9218, "learning_rate": 2.2006130326551745e-08, "epoch": 0.9865623032923725, "percentage": 98.66, "elapsed_time": "6 days, 20:40:34", "remaining_time": "2:13:45", "throughput": 2744.68, "total_tokens": 1627142272} {"current_steps": 9013, "total_steps": 9134, "loss": 0.6784, "learning_rate": 2.16469044582418e-08, "epoch": 0.9866717753633104, "percentage": 98.68, "elapsed_time": "6 days, 20:41:38", "remaining_time": "2:12:39", "throughput": 2744.7, "total_tokens": 1627328416} {"current_steps": 9014, "total_steps": 9134, "loss": 0.8195, "learning_rate": 2.129063348135507e-08, "epoch": 0.9867812474342483, "percentage": 98.69, "elapsed_time": "6 days, 20:42:41", "remaining_time": "2:11:33", "throughput": 2744.72, "total_tokens": 1627513664} {"current_steps": 9015, "total_steps": 9134, "loss": 1.1298, "learning_rate": 2.0937317438032844e-08, "epoch": 0.9868907195051863, "percentage": 98.7, "elapsed_time": "6 days, 20:43:48", "remaining_time": "2:10:28", "throughput": 2744.74, "total_tokens": 1627709216} {"current_steps": 9016, "total_steps": 9134, "loss": 0.7539, "learning_rate": 2.0586956370075018e-08, "epoch": 0.9870001915761242, "percentage": 98.71, "elapsed_time": "6 days, 20:44:52", "remaining_time": "2:09:22", "throughput": 2744.73, "total_tokens": 1627878112} {"current_steps": 9017, "total_steps": 9134, "loss": 1.1311, "learning_rate": 2.0239550318926215e-08, "epoch": 0.9871096636470621, "percentage": 98.72, "elapsed_time": "6 days, 20:45:58", "remaining_time": "2:08:16", "throughput": 2744.73, "total_tokens": 1628060896} {"current_steps": 9018, "total_steps": 9134, "loss": 1.0293, "learning_rate": 1.9895099325686894e-08, "epoch": 0.9872191357179999, "percentage": 98.73, "elapsed_time": "6 days, 20:47:03", "remaining_time": "2:07:10", "throughput": 2744.74, "total_tokens": 1628242784} {"current_steps": 9019, "total_steps": 9134, "loss": 0.8484, "learning_rate": 1.955360343110224e-08, "epoch": 0.9873286077889378, "percentage": 98.74, "elapsed_time": "6 days, 20:48:09", "remaining_time": "2:06:04", "throughput": 2744.77, "total_tokens": 1628446624} {"current_steps": 9020, "total_steps": 9134, "loss": 0.8816, "learning_rate": 1.921506267557327e-08, "epoch": 0.9874380798598758, "percentage": 98.75, "elapsed_time": "6 days, 20:49:11", "remaining_time": "2:04:59", "throughput": 2744.8, "total_tokens": 1628632768} {"current_steps": 9021, "total_steps": 9134, "loss": 1.1487, "learning_rate": 1.8879477099145726e-08, "epoch": 0.9875475519308137, "percentage": 98.76, "elapsed_time": "6 days, 20:50:18", "remaining_time": "2:03:53", "throughput": 2744.82, "total_tokens": 1628825856} {"current_steps": 9022, "total_steps": 9134, "loss": 0.8833, "learning_rate": 1.8546846741521184e-08, "epoch": 0.9876570240017516, "percentage": 98.77, "elapsed_time": "6 days, 20:51:25", "remaining_time": "2:02:47", "throughput": 2744.8, "total_tokens": 1628998112} {"current_steps": 9023, "total_steps": 9134, "loss": 0.9563, "learning_rate": 1.8217171642048726e-08, "epoch": 0.9877664960726894, "percentage": 98.78, "elapsed_time": "6 days, 20:52:30", "remaining_time": "2:01:41", "throughput": 2744.82, "total_tokens": 1629189632} {"current_steps": 9024, "total_steps": 9134, "loss": 1.1399, "learning_rate": 1.7890451839727707e-08, "epoch": 0.9878759681436273, "percentage": 98.8, "elapsed_time": "6 days, 20:53:37", "remaining_time": "2:00:36", "throughput": 2744.86, "total_tokens": 1629393696} {"current_steps": 9025, "total_steps": 9134, "loss": 0.8137, "learning_rate": 1.756668737320777e-08, "epoch": 0.9879854402145652, "percentage": 98.81, "elapsed_time": "6 days, 20:54:38", "remaining_time": "1:59:30", "throughput": 2744.84, "total_tokens": 1629550496} {"current_steps": 9026, "total_steps": 9134, "loss": 0.86, "learning_rate": 1.7245878280791606e-08, "epoch": 0.9880949122855032, "percentage": 98.82, "elapsed_time": "6 days, 20:55:41", "remaining_time": "1:58:24", "throughput": 2744.84, "total_tokens": 1629728128} {"current_steps": 9027, "total_steps": 9134, "loss": 0.6698, "learning_rate": 1.692802460042664e-08, "epoch": 0.9882043843564411, "percentage": 98.83, "elapsed_time": "6 days, 20:56:43", "remaining_time": "1:57:18", "throughput": 2744.84, "total_tokens": 1629894784} {"current_steps": 9028, "total_steps": 9134, "loss": 0.7303, "learning_rate": 1.66131263697189e-08, "epoch": 0.988313856427379, "percentage": 98.84, "elapsed_time": "6 days, 20:57:45", "remaining_time": "1:56:12", "throughput": 2744.84, "total_tokens": 1630068384} {"current_steps": 9029, "total_steps": 9134, "loss": 0.8252, "learning_rate": 1.630118362591915e-08, "epoch": 0.9884233284983168, "percentage": 98.85, "elapsed_time": "6 days, 20:58:42", "remaining_time": "1:55:06", "throughput": 2744.8, "total_tokens": 1630201440} {"current_steps": 9030, "total_steps": 9134, "loss": 0.7654, "learning_rate": 1.5992196405925642e-08, "epoch": 0.9885328005692547, "percentage": 98.86, "elapsed_time": "6 days, 20:59:47", "remaining_time": "1:54:01", "throughput": 2744.81, "total_tokens": 1630383776} {"current_steps": 9031, "total_steps": 9134, "loss": 0.6067, "learning_rate": 1.568616474629525e-08, "epoch": 0.9886422726401927, "percentage": 98.87, "elapsed_time": "6 days, 21:00:47", "remaining_time": "1:52:55", "throughput": 2744.8, "total_tokens": 1630543040} {"current_steps": 9032, "total_steps": 9134, "loss": 0.7099, "learning_rate": 1.5383088683229574e-08, "epoch": 0.9887517447111306, "percentage": 98.88, "elapsed_time": "6 days, 21:01:49", "remaining_time": "1:51:49", "throughput": 2744.81, "total_tokens": 1630716416} {"current_steps": 9033, "total_steps": 9134, "loss": 0.8025, "learning_rate": 1.5082968252583263e-08, "epoch": 0.9888612167820685, "percentage": 98.89, "elapsed_time": "6 days, 21:02:52", "remaining_time": "1:50:43", "throughput": 2744.8, "total_tokens": 1630883520} {"current_steps": 9034, "total_steps": 9134, "loss": 0.8531, "learning_rate": 1.4785803489858474e-08, "epoch": 0.9889706888530064, "percentage": 98.91, "elapsed_time": "6 days, 21:03:59", "remaining_time": "1:49:37", "throughput": 2744.82, "total_tokens": 1631082880} {"current_steps": 9035, "total_steps": 9134, "loss": 0.973, "learning_rate": 1.4491594430207645e-08, "epoch": 0.9890801609239442, "percentage": 98.92, "elapsed_time": "6 days, 21:05:02", "remaining_time": "1:48:31", "throughput": 2744.84, "total_tokens": 1631262976} {"current_steps": 9036, "total_steps": 9134, "loss": 0.9446, "learning_rate": 1.4200341108439042e-08, "epoch": 0.9891896329948822, "percentage": 98.93, "elapsed_time": "6 days, 21:06:04", "remaining_time": "1:47:26", "throughput": 2744.88, "total_tokens": 1631457632} {"current_steps": 9037, "total_steps": 9134, "loss": 0.9806, "learning_rate": 1.3912043559005661e-08, "epoch": 0.9892991050658201, "percentage": 98.94, "elapsed_time": "6 days, 21:07:11", "remaining_time": "1:46:20", "throughput": 2744.92, "total_tokens": 1631667296} {"current_steps": 9038, "total_steps": 9134, "loss": 0.871, "learning_rate": 1.3626701816010778e-08, "epoch": 0.989408577136758, "percentage": 98.95, "elapsed_time": "6 days, 21:08:16", "remaining_time": "1:45:14", "throughput": 2744.94, "total_tokens": 1631859040} {"current_steps": 9039, "total_steps": 9134, "loss": 0.7274, "learning_rate": 1.3344315913210725e-08, "epoch": 0.9895180492076959, "percentage": 98.96, "elapsed_time": "6 days, 21:09:19", "remaining_time": "1:44:08", "throughput": 2744.97, "total_tokens": 1632046304} {"current_steps": 9040, "total_steps": 9134, "loss": 0.8064, "learning_rate": 1.3064885884012112e-08, "epoch": 0.9896275212786337, "percentage": 98.97, "elapsed_time": "6 days, 21:10:24", "remaining_time": "1:43:03", "throughput": 2745.01, "total_tokens": 1632251040} {"current_steps": 9041, "total_steps": 9134, "loss": 0.9352, "learning_rate": 1.278841176147183e-08, "epoch": 0.9897369933495717, "percentage": 98.98, "elapsed_time": "6 days, 21:11:28", "remaining_time": "1:41:57", "throughput": 2745.01, "total_tokens": 1632424864} {"current_steps": 9042, "total_steps": 9134, "loss": 0.9728, "learning_rate": 1.2514893578294274e-08, "epoch": 0.9898464654205096, "percentage": 98.99, "elapsed_time": "6 days, 21:12:33", "remaining_time": "1:40:51", "throughput": 2745.02, "total_tokens": 1632613248} {"current_steps": 9043, "total_steps": 9134, "loss": 0.773, "learning_rate": 1.2244331366836892e-08, "epoch": 0.9899559374914475, "percentage": 99.0, "elapsed_time": "6 days, 21:13:36", "remaining_time": "1:39:45", "throughput": 2745.03, "total_tokens": 1632790656} {"current_steps": 9044, "total_steps": 9134, "loss": 0.7169, "learning_rate": 1.1976725159107415e-08, "epoch": 0.9900654095623854, "percentage": 99.01, "elapsed_time": "6 days, 21:14:31", "remaining_time": "1:38:39", "throughput": 2745.0, "total_tokens": 1632921248} {"current_steps": 9045, "total_steps": 9134, "loss": 0.9976, "learning_rate": 1.1712074986761079e-08, "epoch": 0.9901748816333233, "percentage": 99.03, "elapsed_time": "6 days, 21:15:38", "remaining_time": "1:37:34", "throughput": 2745.01, "total_tokens": 1633111648} {"current_steps": 9046, "total_steps": 9134, "loss": 0.863, "learning_rate": 1.1450380881106171e-08, "epoch": 0.9902843537042612, "percentage": 99.04, "elapsed_time": "6 days, 21:16:44", "remaining_time": "1:36:28", "throughput": 2745.04, "total_tokens": 1633312800} {"current_steps": 9047, "total_steps": 9134, "loss": 0.6596, "learning_rate": 1.1191642873104036e-08, "epoch": 0.9903938257751991, "percentage": 99.05, "elapsed_time": "6 days, 21:17:48", "remaining_time": "1:35:22", "throughput": 2745.04, "total_tokens": 1633488864} {"current_steps": 9048, "total_steps": 9134, "loss": 0.798, "learning_rate": 1.0935860993357971e-08, "epoch": 0.990503297846137, "percentage": 99.06, "elapsed_time": "6 days, 21:18:51", "remaining_time": "1:34:16", "throughput": 2745.05, "total_tokens": 1633666720} {"current_steps": 9049, "total_steps": 9134, "loss": 0.9445, "learning_rate": 1.0683035272127107e-08, "epoch": 0.9906127699170749, "percentage": 99.07, "elapsed_time": "6 days, 21:19:56", "remaining_time": "1:33:10", "throughput": 2745.07, "total_tokens": 1633856224} {"current_steps": 9050, "total_steps": 9134, "loss": 0.7118, "learning_rate": 1.0433165739323625e-08, "epoch": 0.9907222419880128, "percentage": 99.08, "elapsed_time": "6 days, 21:20:58", "remaining_time": "1:32:05", "throughput": 2745.08, "total_tokens": 1634033408} {"current_steps": 9051, "total_steps": 9134, "loss": 0.6755, "learning_rate": 1.0186252424504439e-08, "epoch": 0.9908317140589508, "percentage": 99.09, "elapsed_time": "6 days, 21:22:05", "remaining_time": "1:30:59", "throughput": 2745.11, "total_tokens": 1634234784} {"current_steps": 9052, "total_steps": 9134, "loss": 1.0072, "learning_rate": 9.942295356879517e-09, "epoch": 0.9909411861298886, "percentage": 99.1, "elapsed_time": "6 days, 21:23:10", "remaining_time": "1:29:53", "throughput": 2745.14, "total_tokens": 1634433472} {"current_steps": 9053, "total_steps": 9134, "loss": 1.1832, "learning_rate": 9.701294565309105e-09, "epoch": 0.9910506582008265, "percentage": 99.11, "elapsed_time": "6 days, 21:24:13", "remaining_time": "1:28:47", "throughput": 2745.16, "total_tokens": 1634616256} {"current_steps": 9054, "total_steps": 9134, "loss": 0.7886, "learning_rate": 9.463250078300955e-09, "epoch": 0.9911601302717644, "percentage": 99.12, "elapsed_time": "6 days, 21:25:15", "remaining_time": "1:27:41", "throughput": 2745.19, "total_tokens": 1634806208} {"current_steps": 9055, "total_steps": 9134, "loss": 0.9664, "learning_rate": 9.228161924015877e-09, "epoch": 0.9912696023427023, "percentage": 99.14, "elapsed_time": "6 days, 21:26:18", "remaining_time": "1:26:36", "throughput": 2745.19, "total_tokens": 1634977120} {"current_steps": 9056, "total_steps": 9134, "loss": 0.9962, "learning_rate": 8.99603013026773e-09, "epoch": 0.9913790744136403, "percentage": 99.15, "elapsed_time": "6 days, 21:27:25", "remaining_time": "1:25:30", "throughput": 2745.21, "total_tokens": 1635175136} {"current_steps": 9057, "total_steps": 9134, "loss": 0.9536, "learning_rate": 8.766854724509555e-09, "epoch": 0.9914885464845781, "percentage": 99.16, "elapsed_time": "6 days, 21:28:30", "remaining_time": "1:24:24", "throughput": 2745.22, "total_tokens": 1635353664} {"current_steps": 9058, "total_steps": 9134, "loss": 0.7651, "learning_rate": 8.540635733861325e-09, "epoch": 0.991598018555516, "percentage": 99.17, "elapsed_time": "6 days, 21:29:34", "remaining_time": "1:23:18", "throughput": 2745.22, "total_tokens": 1635531968} {"current_steps": 9059, "total_steps": 9134, "loss": 0.9625, "learning_rate": 8.317373185079413e-09, "epoch": 0.9917074906264539, "percentage": 99.18, "elapsed_time": "6 days, 21:30:39", "remaining_time": "1:22:12", "throughput": 2745.27, "total_tokens": 1635738048} {"current_steps": 9060, "total_steps": 9134, "loss": 1.0214, "learning_rate": 8.097067104576029e-09, "epoch": 0.9918169626973918, "percentage": 99.19, "elapsed_time": "6 days, 21:31:41", "remaining_time": "1:21:07", "throughput": 2745.26, "total_tokens": 1635904928} {"current_steps": 9061, "total_steps": 9134, "loss": 0.8122, "learning_rate": 7.879717518413654e-09, "epoch": 0.9919264347683298, "percentage": 99.2, "elapsed_time": "6 days, 21:32:43", "remaining_time": "1:20:01", "throughput": 2745.27, "total_tokens": 1636081440} {"current_steps": 9062, "total_steps": 9134, "loss": 0.9507, "learning_rate": 7.66532445230228e-09, "epoch": 0.9920359068392677, "percentage": 99.21, "elapsed_time": "6 days, 21:33:47", "remaining_time": "1:18:55", "throughput": 2745.3, "total_tokens": 1636274976} {"current_steps": 9063, "total_steps": 9134, "loss": 0.9778, "learning_rate": 7.453887931607728e-09, "epoch": 0.9921453789102055, "percentage": 99.22, "elapsed_time": "6 days, 21:34:53", "remaining_time": "1:17:49", "throughput": 2745.33, "total_tokens": 1636476800} {"current_steps": 9064, "total_steps": 9134, "loss": 0.9354, "learning_rate": 7.2454079813405465e-09, "epoch": 0.9922548509811434, "percentage": 99.23, "elapsed_time": "6 days, 21:35:58", "remaining_time": "1:16:44", "throughput": 2745.36, "total_tokens": 1636672576} {"current_steps": 9065, "total_steps": 9134, "loss": 0.9738, "learning_rate": 7.039884626164339e-09, "epoch": 0.9923643230520813, "percentage": 99.24, "elapsed_time": "6 days, 21:36:58", "remaining_time": "1:15:38", "throughput": 2745.34, "total_tokens": 1636825344} {"current_steps": 9066, "total_steps": 9134, "loss": 1.1323, "learning_rate": 6.83731789038744e-09, "epoch": 0.9924737951230193, "percentage": 99.26, "elapsed_time": "6 days, 21:38:05", "remaining_time": "1:14:32", "throughput": 2745.37, "total_tokens": 1637027840} {"current_steps": 9067, "total_steps": 9134, "loss": 0.8698, "learning_rate": 6.637707797979564e-09, "epoch": 0.9925832671939572, "percentage": 99.27, "elapsed_time": "6 days, 21:39:08", "remaining_time": "1:13:26", "throughput": 2745.39, "total_tokens": 1637210848} {"current_steps": 9068, "total_steps": 9134, "loss": 0.8906, "learning_rate": 6.44105437255238e-09, "epoch": 0.9926927392648951, "percentage": 99.28, "elapsed_time": "6 days, 21:40:14", "remaining_time": "1:12:20", "throughput": 2745.4, "total_tokens": 1637398112} {"current_steps": 9069, "total_steps": 9134, "loss": 0.8269, "learning_rate": 6.247357637367834e-09, "epoch": 0.9928022113358329, "percentage": 99.29, "elapsed_time": "6 days, 21:41:21", "remaining_time": "1:11:15", "throughput": 2745.44, "total_tokens": 1637601280} {"current_steps": 9070, "total_steps": 9134, "loss": 0.8737, "learning_rate": 6.056617615340931e-09, "epoch": 0.9929116834067708, "percentage": 99.3, "elapsed_time": "6 days, 21:42:24", "remaining_time": "1:10:09", "throughput": 2745.44, "total_tokens": 1637776896} {"current_steps": 9071, "total_steps": 9134, "loss": 0.8278, "learning_rate": 5.868834329036954e-09, "epoch": 0.9930211554777088, "percentage": 99.31, "elapsed_time": "6 days, 21:43:26", "remaining_time": "1:09:03", "throughput": 2745.41, "total_tokens": 1637931232} {"current_steps": 9072, "total_steps": 9134, "loss": 0.9059, "learning_rate": 5.684007800668689e-09, "epoch": 0.9931306275486467, "percentage": 99.32, "elapsed_time": "6 days, 21:44:31", "remaining_time": "1:07:57", "throughput": 2745.41, "total_tokens": 1638106400} {"current_steps": 9073, "total_steps": 9134, "loss": 1.0028, "learning_rate": 5.50213805210198e-09, "epoch": 0.9932400996195846, "percentage": 99.33, "elapsed_time": "6 days, 21:45:36", "remaining_time": "1:06:52", "throughput": 2745.41, "total_tokens": 1638288512} {"current_steps": 9074, "total_steps": 9134, "loss": 0.7726, "learning_rate": 5.3232251048473956e-09, "epoch": 0.9933495716905224, "percentage": 99.34, "elapsed_time": "6 days, 21:46:43", "remaining_time": "1:05:46", "throughput": 2745.43, "total_tokens": 1638480032} {"current_steps": 9075, "total_steps": 9134, "loss": 0.8973, "learning_rate": 5.147268980076891e-09, "epoch": 0.9934590437614603, "percentage": 99.35, "elapsed_time": "6 days, 21:47:50", "remaining_time": "1:04:40", "throughput": 2745.49, "total_tokens": 1638698880} {"current_steps": 9076, "total_steps": 9134, "loss": 0.841, "learning_rate": 4.974269698601597e-09, "epoch": 0.9935685158323982, "percentage": 99.37, "elapsed_time": "6 days, 21:48:54", "remaining_time": "1:03:34", "throughput": 2745.51, "total_tokens": 1638887712} {"current_steps": 9077, "total_steps": 9134, "loss": 1.1056, "learning_rate": 4.804227280888473e-09, "epoch": 0.9936779879033362, "percentage": 99.38, "elapsed_time": "6 days, 21:50:00", "remaining_time": "1:02:28", "throughput": 2745.52, "total_tokens": 1639076096} {"current_steps": 9078, "total_steps": 9134, "loss": 0.7488, "learning_rate": 4.637141747051987e-09, "epoch": 0.9937874599742741, "percentage": 99.39, "elapsed_time": "6 days, 21:51:01", "remaining_time": "1:01:23", "throughput": 2745.53, "total_tokens": 1639248128} {"current_steps": 9079, "total_steps": 9134, "loss": 0.796, "learning_rate": 4.473013116859659e-09, "epoch": 0.993896932045212, "percentage": 99.4, "elapsed_time": "6 days, 21:52:08", "remaining_time": "1:00:17", "throughput": 2745.56, "total_tokens": 1639449504} {"current_steps": 9080, "total_steps": 9134, "loss": 0.9079, "learning_rate": 4.311841409723738e-09, "epoch": 0.9940064041161498, "percentage": 99.41, "elapsed_time": "6 days, 21:53:14", "remaining_time": "0:59:11", "throughput": 2745.56, "total_tokens": 1639632960} {"current_steps": 9081, "total_steps": 9134, "loss": 0.8292, "learning_rate": 4.153626644715081e-09, "epoch": 0.9941158761870877, "percentage": 99.42, "elapsed_time": "6 days, 21:54:19", "remaining_time": "0:58:05", "throughput": 2745.57, "total_tokens": 1639814848} {"current_steps": 9082, "total_steps": 9134, "loss": 1.1794, "learning_rate": 3.998368840549271e-09, "epoch": 0.9942253482580257, "percentage": 99.43, "elapsed_time": "6 days, 21:55:25", "remaining_time": "0:57:00", "throughput": 2745.6, "total_tokens": 1640018240} {"current_steps": 9083, "total_steps": 9134, "loss": 0.7232, "learning_rate": 3.8460680155921746e-09, "epoch": 0.9943348203289636, "percentage": 99.44, "elapsed_time": "6 days, 21:56:31", "remaining_time": "0:55:54", "throughput": 2745.62, "total_tokens": 1640209088} {"current_steps": 9084, "total_steps": 9134, "loss": 1.1266, "learning_rate": 3.6967241878599347e-09, "epoch": 0.9944442923999015, "percentage": 99.45, "elapsed_time": "6 days, 21:57:35", "remaining_time": "0:54:48", "throughput": 2745.64, "total_tokens": 1640398144} {"current_steps": 9085, "total_steps": 9134, "loss": 1.0705, "learning_rate": 3.550337375018975e-09, "epoch": 0.9945537644708394, "percentage": 99.46, "elapsed_time": "6 days, 21:58:41", "remaining_time": "0:53:42", "throughput": 2745.68, "total_tokens": 1640599968} {"current_steps": 9086, "total_steps": 9134, "loss": 0.822, "learning_rate": 3.406907594388775e-09, "epoch": 0.9946632365417772, "percentage": 99.47, "elapsed_time": "6 days, 21:59:47", "remaining_time": "0:52:36", "throughput": 2745.71, "total_tokens": 1640798656} {"current_steps": 9087, "total_steps": 9134, "loss": 0.8315, "learning_rate": 3.2664348629363183e-09, "epoch": 0.9947727086127152, "percentage": 99.49, "elapsed_time": "6 days, 22:00:51", "remaining_time": "0:51:31", "throughput": 2745.74, "total_tokens": 1640993760} {"current_steps": 9088, "total_steps": 9134, "loss": 0.7504, "learning_rate": 3.1289191972816435e-09, "epoch": 0.9948821806836531, "percentage": 99.5, "elapsed_time": "6 days, 22:01:56", "remaining_time": "0:50:25", "throughput": 2745.75, "total_tokens": 1641179456} {"current_steps": 9089, "total_steps": 9134, "loss": 1.1492, "learning_rate": 2.994360613686742e-09, "epoch": 0.994991652754591, "percentage": 99.51, "elapsed_time": "6 days, 22:03:01", "remaining_time": "0:49:19", "throughput": 2745.76, "total_tokens": 1641367168} {"current_steps": 9090, "total_steps": 9134, "loss": 0.7467, "learning_rate": 2.862759128072212e-09, "epoch": 0.9951011248255289, "percentage": 99.52, "elapsed_time": "6 days, 22:04:09", "remaining_time": "0:48:13", "throughput": 2745.81, "total_tokens": 1641579520} {"current_steps": 9091, "total_steps": 9134, "loss": 1.2505, "learning_rate": 2.734114756008932e-09, "epoch": 0.9952105968964667, "percentage": 99.53, "elapsed_time": "6 days, 22:05:13", "remaining_time": "0:47:08", "throughput": 2745.83, "total_tokens": 1641769024} {"current_steps": 9092, "total_steps": 9134, "loss": 1.1067, "learning_rate": 2.6084275127125078e-09, "epoch": 0.9953200689674047, "percentage": 99.54, "elapsed_time": "6 days, 22:06:17", "remaining_time": "0:46:02", "throughput": 2745.83, "total_tokens": 1641945312} {"current_steps": 9093, "total_steps": 9134, "loss": 0.8964, "learning_rate": 2.485697413051602e-09, "epoch": 0.9954295410383426, "percentage": 99.55, "elapsed_time": "6 days, 22:07:19", "remaining_time": "0:44:56", "throughput": 2745.79, "total_tokens": 1642090016} {"current_steps": 9094, "total_steps": 9134, "loss": 0.8095, "learning_rate": 2.365924471547931e-09, "epoch": 0.9955390131092805, "percentage": 99.56, "elapsed_time": "6 days, 22:08:25", "remaining_time": "0:43:50", "throughput": 2745.79, "total_tokens": 1642273248} {"current_steps": 9095, "total_steps": 9134, "loss": 0.7469, "learning_rate": 2.2491087023651657e-09, "epoch": 0.9956484851802184, "percentage": 99.57, "elapsed_time": "6 days, 22:09:31", "remaining_time": "0:42:45", "throughput": 2745.8, "total_tokens": 1642460512} {"current_steps": 9096, "total_steps": 9134, "loss": 1.0862, "learning_rate": 2.1352501193255824e-09, "epoch": 0.9957579572511563, "percentage": 99.58, "elapsed_time": "6 days, 22:10:35", "remaining_time": "0:41:39", "throughput": 2745.84, "total_tokens": 1642660096} {"current_steps": 9097, "total_steps": 9134, "loss": 0.8892, "learning_rate": 2.0243487358989623e-09, "epoch": 0.9958674293220942, "percentage": 99.59, "elapsed_time": "6 days, 22:11:39", "remaining_time": "0:40:33", "throughput": 2745.87, "total_tokens": 1642850272} {"current_steps": 9098, "total_steps": 9134, "loss": 0.8041, "learning_rate": 1.9164045652053655e-09, "epoch": 0.9959769013930321, "percentage": 99.61, "elapsed_time": "6 days, 22:12:43", "remaining_time": "0:39:27", "throughput": 2745.84, "total_tokens": 1643012000} {"current_steps": 9099, "total_steps": 9134, "loss": 1.183, "learning_rate": 1.8114176200123567e-09, "epoch": 0.99608637346397, "percentage": 99.62, "elapsed_time": "6 days, 22:13:48", "remaining_time": "0:38:21", "throughput": 2745.87, "total_tokens": 1643208224} {"current_steps": 9100, "total_steps": 9134, "loss": 0.8781, "learning_rate": 1.709387912737781e-09, "epoch": 0.9961958455349079, "percentage": 99.63, "elapsed_time": "6 days, 22:14:52", "remaining_time": "0:37:16", "throughput": 2745.84, "total_tokens": 1643364800} {"current_steps": 9101, "total_steps": 9134, "loss": 0.9975, "learning_rate": 1.6103154554553135e-09, "epoch": 0.9963053176058458, "percentage": 99.64, "elapsed_time": "6 days, 22:15:57", "remaining_time": "0:36:10", "throughput": 2745.82, "total_tokens": 1643532352} {"current_steps": 9102, "total_steps": 9134, "loss": 1.0536, "learning_rate": 1.5142002598833581e-09, "epoch": 0.9964147896767838, "percentage": 99.65, "elapsed_time": "6 days, 22:17:00", "remaining_time": "0:35:04", "throughput": 2745.82, "total_tokens": 1643704832} {"current_steps": 9103, "total_steps": 9134, "loss": 0.8358, "learning_rate": 1.4210423373933746e-09, "epoch": 0.9965242617477216, "percentage": 99.66, "elapsed_time": "6 days, 22:17:54", "remaining_time": "0:33:58", "throughput": 2745.76, "total_tokens": 1643816160} {"current_steps": 9104, "total_steps": 9134, "loss": 1.0104, "learning_rate": 1.330841699004326e-09, "epoch": 0.9966337338186595, "percentage": 99.67, "elapsed_time": "6 days, 22:18:58", "remaining_time": "0:32:52", "throughput": 2745.76, "total_tokens": 1643993568} {"current_steps": 9105, "total_steps": 9134, "loss": 0.856, "learning_rate": 1.2435983553882314e-09, "epoch": 0.9967432058895974, "percentage": 99.68, "elapsed_time": "6 days, 22:20:00", "remaining_time": "0:31:47", "throughput": 2745.75, "total_tokens": 1644159328} {"current_steps": 9106, "total_steps": 9134, "loss": 0.8713, "learning_rate": 1.1593123168646137e-09, "epoch": 0.9968526779605353, "percentage": 99.69, "elapsed_time": "6 days, 22:21:04", "remaining_time": "0:30:41", "throughput": 2745.76, "total_tokens": 1644339200} {"current_steps": 9107, "total_steps": 9134, "loss": 0.9679, "learning_rate": 1.0779835934032755e-09, "epoch": 0.9969621500314733, "percentage": 99.7, "elapsed_time": "6 days, 22:22:08", "remaining_time": "0:29:35", "throughput": 2745.77, "total_tokens": 1644517952} {"current_steps": 9108, "total_steps": 9134, "loss": 0.9056, "learning_rate": 9.996121946270753e-10, "epoch": 0.9970716221024111, "percentage": 99.72, "elapsed_time": "6 days, 22:23:13", "remaining_time": "0:28:29", "throughput": 2745.79, "total_tokens": 1644713504} {"current_steps": 9109, "total_steps": 9134, "loss": 1.0041, "learning_rate": 9.241981298091506e-10, "epoch": 0.997181094173349, "percentage": 99.73, "elapsed_time": "6 days, 22:24:19", "remaining_time": "0:27:24", "throughput": 2745.77, "total_tokens": 1644880832} {"current_steps": 9110, "total_steps": 9134, "loss": 0.7762, "learning_rate": 8.517414078645925e-10, "epoch": 0.9972905662442869, "percentage": 99.74, "elapsed_time": "6 days, 22:25:21", "remaining_time": "0:26:18", "throughput": 2745.76, "total_tokens": 1645044576} {"current_steps": 9111, "total_steps": 9134, "loss": 0.9477, "learning_rate": 7.822420373726491e-10, "epoch": 0.9974000383152248, "percentage": 99.75, "elapsed_time": "6 days, 22:26:28", "remaining_time": "0:25:12", "throughput": 2745.74, "total_tokens": 1645214592} {"current_steps": 9112, "total_steps": 9134, "loss": 1.1317, "learning_rate": 7.157000265489711e-10, "epoch": 0.9975095103861628, "percentage": 99.76, "elapsed_time": "6 days, 22:27:33", "remaining_time": "0:24:06", "throughput": 2745.76, "total_tokens": 1645404096} {"current_steps": 9113, "total_steps": 9134, "loss": 0.7154, "learning_rate": 6.521153832678151e-10, "epoch": 0.9976189824571007, "percentage": 99.77, "elapsed_time": "6 days, 22:28:35", "remaining_time": "0:23:01", "throughput": 2745.73, "total_tokens": 1645558880} {"current_steps": 9114, "total_steps": 9134, "loss": 0.8393, "learning_rate": 5.914881150509422e-10, "epoch": 0.9977284545280385, "percentage": 99.78, "elapsed_time": "6 days, 22:29:35", "remaining_time": "0:21:55", "throughput": 2745.68, "total_tokens": 1645694848} {"current_steps": 9115, "total_steps": 9134, "loss": 0.9212, "learning_rate": 5.33818229070393e-10, "epoch": 0.9978379265989764, "percentage": 99.79, "elapsed_time": "6 days, 22:30:39", "remaining_time": "0:20:49", "throughput": 2745.7, "total_tokens": 1645879648} {"current_steps": 9116, "total_steps": 9134, "loss": 0.9202, "learning_rate": 4.791057321484882e-10, "epoch": 0.9979473986699143, "percentage": 99.8, "elapsed_time": "6 days, 22:31:45", "remaining_time": "0:19:43", "throughput": 2745.72, "total_tokens": 1646073856} {"current_steps": 9117, "total_steps": 9134, "loss": 0.8831, "learning_rate": 4.273506307550523e-10, "epoch": 0.9980568707408523, "percentage": 99.81, "elapsed_time": "6 days, 22:32:49", "remaining_time": "0:18:37", "throughput": 2745.72, "total_tokens": 1646248576} {"current_steps": 9118, "total_steps": 9134, "loss": 0.9692, "learning_rate": 3.785529310185165e-10, "epoch": 0.9981663428117902, "percentage": 99.82, "elapsed_time": "6 days, 22:33:51", "remaining_time": "0:17:32", "throughput": 2745.72, "total_tokens": 1646420160} {"current_steps": 9119, "total_steps": 9134, "loss": 0.8842, "learning_rate": 3.327126387064894e-10, "epoch": 0.9982758148827281, "percentage": 99.84, "elapsed_time": "6 days, 22:34:55", "remaining_time": "0:16:26", "throughput": 2745.7, "total_tokens": 1646585696} {"current_steps": 9120, "total_steps": 9134, "loss": 0.828, "learning_rate": 2.898297592424104e-10, "epoch": 0.9983852869536659, "percentage": 99.85, "elapsed_time": "6 days, 22:36:00", "remaining_time": "0:15:20", "throughput": 2745.71, "total_tokens": 1646765792} {"current_steps": 9121, "total_steps": 9134, "loss": 0.7106, "learning_rate": 2.499042976999988e-10, "epoch": 0.9984947590246038, "percentage": 99.86, "elapsed_time": "6 days, 22:37:02", "remaining_time": "0:14:14", "throughput": 2745.7, "total_tokens": 1646930656} {"current_steps": 9122, "total_steps": 9134, "loss": 0.8705, "learning_rate": 2.1293625880325352e-10, "epoch": 0.9986042310955418, "percentage": 99.87, "elapsed_time": "6 days, 22:38:06", "remaining_time": "0:13:09", "throughput": 2745.71, "total_tokens": 1647114560} {"current_steps": 9123, "total_steps": 9134, "loss": 0.8217, "learning_rate": 1.7892564692367775e-10, "epoch": 0.9987137031664797, "percentage": 99.88, "elapsed_time": "6 days, 22:39:13", "remaining_time": "0:12:03", "throughput": 2745.74, "total_tokens": 1647317504} {"current_steps": 9124, "total_steps": 9134, "loss": 0.8254, "learning_rate": 1.478724660886055e-10, "epoch": 0.9988231752374176, "percentage": 99.89, "elapsed_time": "6 days, 22:40:12", "remaining_time": "0:10:57", "throughput": 2745.73, "total_tokens": 1647472512} {"current_steps": 9125, "total_steps": 9134, "loss": 0.9125, "learning_rate": 1.1977671996732388e-10, "epoch": 0.9989326473083554, "percentage": 99.9, "elapsed_time": "6 days, 22:41:13", "remaining_time": "0:09:51", "throughput": 2745.73, "total_tokens": 1647639840} {"current_steps": 9126, "total_steps": 9134, "loss": 0.8639, "learning_rate": 9.463841188217527e-11, "epoch": 0.9990421193792933, "percentage": 99.91, "elapsed_time": "6 days, 22:42:17", "remaining_time": "0:08:46", "throughput": 2745.72, "total_tokens": 1647810976} {"current_steps": 9127, "total_steps": 9134, "loss": 1.132, "learning_rate": 7.245754481133294e-11, "epoch": 0.9991515914502312, "percentage": 99.92, "elapsed_time": "6 days, 22:43:21", "remaining_time": "0:07:40", "throughput": 2745.75, "total_tokens": 1648004064} {"current_steps": 9128, "total_steps": 9134, "loss": 0.7971, "learning_rate": 5.3234121377698785e-11, "epoch": 0.9992610635211692, "percentage": 99.93, "elapsed_time": "6 days, 22:44:25", "remaining_time": "0:06:34", "throughput": 2745.77, "total_tokens": 1648192000} {"current_steps": 9129, "total_steps": 9134, "loss": 0.6711, "learning_rate": 3.696814385445446e-11, "epoch": 0.9993705355921071, "percentage": 99.95, "elapsed_time": "6 days, 22:45:31", "remaining_time": "0:05:28", "throughput": 2745.78, "total_tokens": 1648376800} {"current_steps": 9130, "total_steps": 9134, "loss": 1.0707, "learning_rate": 2.365961416506135e-11, "epoch": 0.999480007663045, "percentage": 99.96, "elapsed_time": "6 days, 22:46:35", "remaining_time": "0:04:23", "throughput": 2745.79, "total_tokens": 1648559808} {"current_steps": 9131, "total_steps": 9134, "loss": 0.8996, "learning_rate": 1.3308533886036145e-11, "epoch": 0.9995894797339828, "percentage": 99.97, "elapsed_time": "6 days, 22:47:36", "remaining_time": "0:03:17", "throughput": 2745.77, "total_tokens": 1648714144} {"current_steps": 9132, "total_steps": 9134, "loss": 0.7928, "learning_rate": 5.914904241399732e-12, "epoch": 0.9996989518049207, "percentage": 99.98, "elapsed_time": "6 days, 22:48:43", "remaining_time": "0:02:11", "throughput": 2745.79, "total_tokens": 1648911264} {"current_steps": 9133, "total_steps": 9134, "loss": 0.8593, "learning_rate": 1.4787261026771859e-12, "epoch": 0.9998084238758587, "percentage": 99.99, "elapsed_time": "6 days, 22:49:47", "remaining_time": "0:01:05", "throughput": 2745.81, "total_tokens": 1649101216} {"current_steps": 9134, "total_steps": 9134, "loss": 0.7529, "learning_rate": 0.0, "epoch": 0.9999178959467966, "percentage": 100.0, "elapsed_time": "6 days, 22:50:49", "remaining_time": "0:00:00", "throughput": 2745.81, "total_tokens": 1649269888} {"current_steps": 9134, "total_steps": 9134, "epoch": 0.9999178959467966, "percentage": 100.0, "elapsed_time": "6 days, 22:53:20", "remaining_time": "0:00:00", "throughput": 2745.12, "total_tokens": 1649269888}