GENOME-gemma-2b-it / cot /trainer_log.jsonl
Estwld's picture
Upload 15 files
e64b907 verified
{"current_steps": 10, "total_steps": 7385, "loss": 2.3319, "learning_rate": 2.7063599458728013e-06, "epoch": 0.006770480704129994, "percentage": 0.14, "elapsed_time": "0:00:08", "remaining_time": "1:48:38"}
{"current_steps": 20, "total_steps": 7385, "loss": 2.3443, "learning_rate": 5.4127198917456026e-06, "epoch": 0.013540961408259987, "percentage": 0.27, "elapsed_time": "0:00:16", "remaining_time": "1:42:27"}
{"current_steps": 30, "total_steps": 7385, "loss": 2.3759, "learning_rate": 8.119079837618404e-06, "epoch": 0.020311442112389978, "percentage": 0.41, "elapsed_time": "0:00:23", "remaining_time": "1:37:08"}
{"current_steps": 40, "total_steps": 7385, "loss": 2.1286, "learning_rate": 1.0825439783491205e-05, "epoch": 0.027081922816519974, "percentage": 0.54, "elapsed_time": "0:00:31", "remaining_time": "1:36:38"}
{"current_steps": 50, "total_steps": 7385, "loss": 1.9161, "learning_rate": 1.3531799729364006e-05, "epoch": 0.033852403520649964, "percentage": 0.68, "elapsed_time": "0:00:40", "remaining_time": "1:38:36"}
{"current_steps": 60, "total_steps": 7385, "loss": 1.6287, "learning_rate": 1.6238159675236808e-05, "epoch": 0.040622884224779957, "percentage": 0.81, "elapsed_time": "0:00:48", "remaining_time": "1:37:58"}
{"current_steps": 70, "total_steps": 7385, "loss": 1.5206, "learning_rate": 1.894451962110961e-05, "epoch": 0.04739336492890995, "percentage": 0.95, "elapsed_time": "0:00:55", "remaining_time": "1:37:28"}
{"current_steps": 80, "total_steps": 7385, "loss": 1.3484, "learning_rate": 2.165087956698241e-05, "epoch": 0.05416384563303995, "percentage": 1.08, "elapsed_time": "0:01:03", "remaining_time": "1:35:57"}
{"current_steps": 90, "total_steps": 7385, "loss": 1.3352, "learning_rate": 2.435723951285521e-05, "epoch": 0.06093432633716994, "percentage": 1.22, "elapsed_time": "0:01:11", "remaining_time": "1:36:03"}
{"current_steps": 100, "total_steps": 7385, "loss": 1.2605, "learning_rate": 2.7063599458728013e-05, "epoch": 0.06770480704129993, "percentage": 1.35, "elapsed_time": "0:01:18", "remaining_time": "1:35:50"}
{"current_steps": 110, "total_steps": 7385, "loss": 1.1888, "learning_rate": 2.976995940460081e-05, "epoch": 0.07447528774542993, "percentage": 1.49, "elapsed_time": "0:01:27", "remaining_time": "1:36:50"}
{"current_steps": 120, "total_steps": 7385, "loss": 1.1998, "learning_rate": 3.2476319350473615e-05, "epoch": 0.08124576844955991, "percentage": 1.62, "elapsed_time": "0:01:34", "remaining_time": "1:35:32"}
{"current_steps": 130, "total_steps": 7385, "loss": 1.1426, "learning_rate": 3.518267929634642e-05, "epoch": 0.08801624915368991, "percentage": 1.76, "elapsed_time": "0:01:43", "remaining_time": "1:36:34"}
{"current_steps": 140, "total_steps": 7385, "loss": 1.1437, "learning_rate": 3.788903924221922e-05, "epoch": 0.0947867298578199, "percentage": 1.9, "elapsed_time": "0:01:51", "remaining_time": "1:35:46"}
{"current_steps": 150, "total_steps": 7385, "loss": 1.0564, "learning_rate": 4.059539918809202e-05, "epoch": 0.1015572105619499, "percentage": 2.03, "elapsed_time": "0:01:58", "remaining_time": "1:34:58"}
{"current_steps": 160, "total_steps": 7385, "loss": 1.0382, "learning_rate": 4.330175913396482e-05, "epoch": 0.1083276912660799, "percentage": 2.17, "elapsed_time": "0:02:05", "remaining_time": "1:34:35"}
{"current_steps": 170, "total_steps": 7385, "loss": 1.0717, "learning_rate": 4.600811907983762e-05, "epoch": 0.11509817197020988, "percentage": 2.3, "elapsed_time": "0:02:13", "remaining_time": "1:34:24"}
{"current_steps": 180, "total_steps": 7385, "loss": 1.0294, "learning_rate": 4.871447902571042e-05, "epoch": 0.12186865267433988, "percentage": 2.44, "elapsed_time": "0:02:20", "remaining_time": "1:34:03"}
{"current_steps": 190, "total_steps": 7385, "loss": 1.0081, "learning_rate": 5.142083897158322e-05, "epoch": 0.12863913337846988, "percentage": 2.57, "elapsed_time": "0:02:28", "remaining_time": "1:33:55"}
{"current_steps": 200, "total_steps": 7385, "loss": 0.9383, "learning_rate": 5.4127198917456026e-05, "epoch": 0.13540961408259986, "percentage": 2.71, "elapsed_time": "0:02:36", "remaining_time": "1:33:52"}
{"current_steps": 210, "total_steps": 7385, "loss": 0.927, "learning_rate": 5.683355886332883e-05, "epoch": 0.14218009478672985, "percentage": 2.84, "elapsed_time": "0:02:44", "remaining_time": "1:33:24"}
{"current_steps": 220, "total_steps": 7385, "loss": 0.9617, "learning_rate": 5.953991880920162e-05, "epoch": 0.14895057549085985, "percentage": 2.98, "elapsed_time": "0:02:52", "remaining_time": "1:33:31"}
{"current_steps": 230, "total_steps": 7385, "loss": 1.0176, "learning_rate": 6.224627875507443e-05, "epoch": 0.15572105619498985, "percentage": 3.11, "elapsed_time": "0:03:00", "remaining_time": "1:33:44"}
{"current_steps": 240, "total_steps": 7385, "loss": 0.9733, "learning_rate": 6.495263870094723e-05, "epoch": 0.16249153689911983, "percentage": 3.25, "elapsed_time": "0:03:09", "remaining_time": "1:34:03"}
{"current_steps": 250, "total_steps": 7385, "loss": 1.0141, "learning_rate": 6.765899864682003e-05, "epoch": 0.16926201760324983, "percentage": 3.39, "elapsed_time": "0:03:16", "remaining_time": "1:33:40"}
{"current_steps": 260, "total_steps": 7385, "loss": 0.977, "learning_rate": 7.036535859269283e-05, "epoch": 0.17603249830737983, "percentage": 3.52, "elapsed_time": "0:03:26", "remaining_time": "1:34:08"}
{"current_steps": 270, "total_steps": 7385, "loss": 0.9624, "learning_rate": 7.307171853856563e-05, "epoch": 0.18280297901150983, "percentage": 3.66, "elapsed_time": "0:03:33", "remaining_time": "1:33:39"}
{"current_steps": 280, "total_steps": 7385, "loss": 1.0063, "learning_rate": 7.577807848443844e-05, "epoch": 0.1895734597156398, "percentage": 3.79, "elapsed_time": "0:03:41", "remaining_time": "1:33:28"}
{"current_steps": 290, "total_steps": 7385, "loss": 0.9562, "learning_rate": 7.848443843031124e-05, "epoch": 0.1963439404197698, "percentage": 3.93, "elapsed_time": "0:03:49", "remaining_time": "1:33:32"}
{"current_steps": 300, "total_steps": 7385, "loss": 1.0207, "learning_rate": 8.119079837618404e-05, "epoch": 0.2031144211238998, "percentage": 4.06, "elapsed_time": "0:03:56", "remaining_time": "1:32:56"}
{"current_steps": 310, "total_steps": 7385, "loss": 0.9731, "learning_rate": 8.389715832205684e-05, "epoch": 0.2098849018280298, "percentage": 4.2, "elapsed_time": "0:04:04", "remaining_time": "1:32:54"}
{"current_steps": 320, "total_steps": 7385, "loss": 0.9732, "learning_rate": 8.660351826792964e-05, "epoch": 0.2166553825321598, "percentage": 4.33, "elapsed_time": "0:04:11", "remaining_time": "1:32:39"}
{"current_steps": 330, "total_steps": 7385, "loss": 0.9645, "learning_rate": 8.930987821380244e-05, "epoch": 0.22342586323628977, "percentage": 4.47, "elapsed_time": "0:04:18", "remaining_time": "1:32:07"}
{"current_steps": 340, "total_steps": 7385, "loss": 0.9825, "learning_rate": 9.201623815967524e-05, "epoch": 0.23019634394041977, "percentage": 4.6, "elapsed_time": "0:04:26", "remaining_time": "1:31:56"}
{"current_steps": 350, "total_steps": 7385, "loss": 0.9521, "learning_rate": 9.472259810554804e-05, "epoch": 0.23696682464454977, "percentage": 4.74, "elapsed_time": "0:04:33", "remaining_time": "1:31:41"}
{"current_steps": 360, "total_steps": 7385, "loss": 0.9418, "learning_rate": 9.742895805142085e-05, "epoch": 0.24373730534867977, "percentage": 4.87, "elapsed_time": "0:04:41", "remaining_time": "1:31:35"}
{"current_steps": 370, "total_steps": 7385, "loss": 1.0314, "learning_rate": 0.00010013531799729365, "epoch": 0.25050778605280977, "percentage": 5.01, "elapsed_time": "0:04:49", "remaining_time": "1:31:20"}
{"current_steps": 380, "total_steps": 7385, "loss": 0.9194, "learning_rate": 0.00010284167794316644, "epoch": 0.25727826675693977, "percentage": 5.15, "elapsed_time": "0:04:57", "remaining_time": "1:31:28"}
{"current_steps": 390, "total_steps": 7385, "loss": 0.9, "learning_rate": 0.00010554803788903924, "epoch": 0.2640487474610697, "percentage": 5.28, "elapsed_time": "0:05:04", "remaining_time": "1:31:05"}
{"current_steps": 400, "total_steps": 7385, "loss": 0.911, "learning_rate": 0.00010825439783491205, "epoch": 0.2708192281651997, "percentage": 5.42, "elapsed_time": "0:05:12", "remaining_time": "1:30:52"}
{"current_steps": 410, "total_steps": 7385, "loss": 0.9127, "learning_rate": 0.00011096075778078485, "epoch": 0.2775897088693297, "percentage": 5.55, "elapsed_time": "0:05:20", "remaining_time": "1:30:46"}
{"current_steps": 420, "total_steps": 7385, "loss": 0.9206, "learning_rate": 0.00011366711772665765, "epoch": 0.2843601895734597, "percentage": 5.69, "elapsed_time": "0:05:28", "remaining_time": "1:30:48"}
{"current_steps": 430, "total_steps": 7385, "loss": 0.9248, "learning_rate": 0.00011637347767253047, "epoch": 0.2911306702775897, "percentage": 5.82, "elapsed_time": "0:05:36", "remaining_time": "1:30:37"}
{"current_steps": 440, "total_steps": 7385, "loss": 0.897, "learning_rate": 0.00011907983761840324, "epoch": 0.2979011509817197, "percentage": 5.96, "elapsed_time": "0:05:43", "remaining_time": "1:30:28"}
{"current_steps": 450, "total_steps": 7385, "loss": 0.9503, "learning_rate": 0.00012178619756427604, "epoch": 0.3046716316858497, "percentage": 6.09, "elapsed_time": "0:05:52", "remaining_time": "1:30:26"}
{"current_steps": 460, "total_steps": 7385, "loss": 0.885, "learning_rate": 0.00012449255751014886, "epoch": 0.3114421123899797, "percentage": 6.23, "elapsed_time": "0:06:00", "remaining_time": "1:30:29"}
{"current_steps": 470, "total_steps": 7385, "loss": 0.937, "learning_rate": 0.00012719891745602166, "epoch": 0.3182125930941097, "percentage": 6.36, "elapsed_time": "0:06:07", "remaining_time": "1:30:08"}
{"current_steps": 480, "total_steps": 7385, "loss": 0.9407, "learning_rate": 0.00012990527740189446, "epoch": 0.32498307379823965, "percentage": 6.5, "elapsed_time": "0:06:14", "remaining_time": "1:29:42"}
{"current_steps": 490, "total_steps": 7385, "loss": 0.9349, "learning_rate": 0.00013261163734776726, "epoch": 0.33175355450236965, "percentage": 6.64, "elapsed_time": "0:06:21", "remaining_time": "1:29:25"}
{"current_steps": 500, "total_steps": 7385, "loss": 0.9034, "learning_rate": 0.00013531799729364006, "epoch": 0.33852403520649965, "percentage": 6.77, "elapsed_time": "0:06:28", "remaining_time": "1:29:03"}
{"current_steps": 510, "total_steps": 7385, "loss": 0.8431, "learning_rate": 0.00013802435723951287, "epoch": 0.34529451591062965, "percentage": 6.91, "elapsed_time": "0:06:35", "remaining_time": "1:28:53"}
{"current_steps": 520, "total_steps": 7385, "loss": 0.9392, "learning_rate": 0.00014073071718538567, "epoch": 0.35206499661475965, "percentage": 7.04, "elapsed_time": "0:06:44", "remaining_time": "1:28:57"}
{"current_steps": 530, "total_steps": 7385, "loss": 0.9557, "learning_rate": 0.00014343707713125847, "epoch": 0.35883547731888965, "percentage": 7.18, "elapsed_time": "0:06:51", "remaining_time": "1:28:43"}
{"current_steps": 540, "total_steps": 7385, "loss": 0.8982, "learning_rate": 0.00014614343707713127, "epoch": 0.36560595802301965, "percentage": 7.31, "elapsed_time": "0:06:59", "remaining_time": "1:28:36"}
{"current_steps": 550, "total_steps": 7385, "loss": 0.8719, "learning_rate": 0.00014884979702300404, "epoch": 0.37237643872714965, "percentage": 7.45, "elapsed_time": "0:07:06", "remaining_time": "1:28:19"}
{"current_steps": 560, "total_steps": 7385, "loss": 0.9412, "learning_rate": 0.00015155615696887687, "epoch": 0.3791469194312796, "percentage": 7.58, "elapsed_time": "0:07:13", "remaining_time": "1:28:03"}
{"current_steps": 570, "total_steps": 7385, "loss": 0.9476, "learning_rate": 0.00015426251691474967, "epoch": 0.3859174001354096, "percentage": 7.72, "elapsed_time": "0:07:21", "remaining_time": "1:27:54"}
{"current_steps": 580, "total_steps": 7385, "loss": 0.9401, "learning_rate": 0.00015696887686062247, "epoch": 0.3926878808395396, "percentage": 7.85, "elapsed_time": "0:07:28", "remaining_time": "1:27:46"}
{"current_steps": 590, "total_steps": 7385, "loss": 0.8447, "learning_rate": 0.00015967523680649528, "epoch": 0.3994583615436696, "percentage": 7.99, "elapsed_time": "0:07:35", "remaining_time": "1:27:31"}
{"current_steps": 600, "total_steps": 7385, "loss": 0.9562, "learning_rate": 0.00016238159675236808, "epoch": 0.4062288422477996, "percentage": 8.12, "elapsed_time": "0:07:43", "remaining_time": "1:27:26"}
{"current_steps": 610, "total_steps": 7385, "loss": 0.8706, "learning_rate": 0.00016508795669824085, "epoch": 0.4129993229519296, "percentage": 8.26, "elapsed_time": "0:07:51", "remaining_time": "1:27:12"}
{"current_steps": 620, "total_steps": 7385, "loss": 0.9437, "learning_rate": 0.00016779431664411368, "epoch": 0.4197698036560596, "percentage": 8.4, "elapsed_time": "0:07:58", "remaining_time": "1:27:04"}
{"current_steps": 630, "total_steps": 7385, "loss": 0.9078, "learning_rate": 0.00017050067658998648, "epoch": 0.4265402843601896, "percentage": 8.53, "elapsed_time": "0:08:07", "remaining_time": "1:27:05"}
{"current_steps": 640, "total_steps": 7385, "loss": 0.8835, "learning_rate": 0.00017320703653585928, "epoch": 0.4333107650643196, "percentage": 8.67, "elapsed_time": "0:08:15", "remaining_time": "1:27:01"}
{"current_steps": 650, "total_steps": 7385, "loss": 0.9088, "learning_rate": 0.00017591339648173208, "epoch": 0.44008124576844954, "percentage": 8.8, "elapsed_time": "0:08:23", "remaining_time": "1:26:54"}
{"current_steps": 660, "total_steps": 7385, "loss": 0.8967, "learning_rate": 0.00017861975642760488, "epoch": 0.44685172647257954, "percentage": 8.94, "elapsed_time": "0:08:30", "remaining_time": "1:26:43"}
{"current_steps": 670, "total_steps": 7385, "loss": 0.9158, "learning_rate": 0.00018132611637347766, "epoch": 0.45362220717670954, "percentage": 9.07, "elapsed_time": "0:08:38", "remaining_time": "1:26:33"}
{"current_steps": 680, "total_steps": 7385, "loss": 0.872, "learning_rate": 0.0001840324763193505, "epoch": 0.46039268788083954, "percentage": 9.21, "elapsed_time": "0:08:45", "remaining_time": "1:26:19"}
{"current_steps": 690, "total_steps": 7385, "loss": 0.9062, "learning_rate": 0.0001867388362652233, "epoch": 0.46716316858496953, "percentage": 9.34, "elapsed_time": "0:08:52", "remaining_time": "1:26:10"}
{"current_steps": 700, "total_steps": 7385, "loss": 0.89, "learning_rate": 0.0001894451962110961, "epoch": 0.47393364928909953, "percentage": 9.48, "elapsed_time": "0:08:59", "remaining_time": "1:25:56"}
{"current_steps": 710, "total_steps": 7385, "loss": 0.8825, "learning_rate": 0.0001921515561569689, "epoch": 0.48070412999322953, "percentage": 9.61, "elapsed_time": "0:09:07", "remaining_time": "1:25:50"}
{"current_steps": 720, "total_steps": 7385, "loss": 0.8121, "learning_rate": 0.0001948579161028417, "epoch": 0.48747461069735953, "percentage": 9.75, "elapsed_time": "0:09:15", "remaining_time": "1:25:43"}
{"current_steps": 730, "total_steps": 7385, "loss": 0.8458, "learning_rate": 0.0001975642760487145, "epoch": 0.4942450914014895, "percentage": 9.88, "elapsed_time": "0:09:22", "remaining_time": "1:25:29"}
{"current_steps": 740, "total_steps": 7385, "loss": 0.8679, "learning_rate": 0.00019999998882753333, "epoch": 0.5010155721056195, "percentage": 10.02, "elapsed_time": "0:09:30", "remaining_time": "1:25:22"}
{"current_steps": 750, "total_steps": 7385, "loss": 0.8797, "learning_rate": 0.00019999864813455363, "epoch": 0.5077860528097495, "percentage": 10.16, "elapsed_time": "0:09:37", "remaining_time": "1:25:10"}
{"current_steps": 760, "total_steps": 7385, "loss": 0.8789, "learning_rate": 0.0001999950729825663, "epoch": 0.5145565335138795, "percentage": 10.29, "elapsed_time": "0:09:45", "remaining_time": "1:25:00"}
{"current_steps": 770, "total_steps": 7385, "loss": 0.9156, "learning_rate": 0.00019998926345145775, "epoch": 0.5213270142180095, "percentage": 10.43, "elapsed_time": "0:09:52", "remaining_time": "1:24:52"}
{"current_steps": 780, "total_steps": 7385, "loss": 0.919, "learning_rate": 0.00019998121967104132, "epoch": 0.5280974949221394, "percentage": 10.56, "elapsed_time": "0:10:00", "remaining_time": "1:24:43"}
{"current_steps": 790, "total_steps": 7385, "loss": 0.8619, "learning_rate": 0.00019997094182105447, "epoch": 0.5348679756262694, "percentage": 10.7, "elapsed_time": "0:10:08", "remaining_time": "1:24:38"}
{"current_steps": 800, "total_steps": 7385, "loss": 0.86, "learning_rate": 0.00019995843013115454, "epoch": 0.5416384563303994, "percentage": 10.83, "elapsed_time": "0:10:15", "remaining_time": "1:24:27"}
{"current_steps": 810, "total_steps": 7385, "loss": 0.9258, "learning_rate": 0.00019994368488091398, "epoch": 0.5484089370345294, "percentage": 10.97, "elapsed_time": "0:10:22", "remaining_time": "1:24:16"}
{"current_steps": 820, "total_steps": 7385, "loss": 0.8758, "learning_rate": 0.00019992670639981376, "epoch": 0.5551794177386594, "percentage": 11.1, "elapsed_time": "0:10:30", "remaining_time": "1:24:10"}
{"current_steps": 830, "total_steps": 7385, "loss": 0.9112, "learning_rate": 0.00019990749506723624, "epoch": 0.5619498984427894, "percentage": 11.24, "elapsed_time": "0:10:38", "remaining_time": "1:24:00"}
{"current_steps": 840, "total_steps": 7385, "loss": 0.899, "learning_rate": 0.00019988605131245662, "epoch": 0.5687203791469194, "percentage": 11.37, "elapsed_time": "0:10:45", "remaining_time": "1:23:52"}
{"current_steps": 850, "total_steps": 7385, "loss": 0.8604, "learning_rate": 0.00019986237561463318, "epoch": 0.5754908598510494, "percentage": 11.51, "elapsed_time": "0:10:53", "remaining_time": "1:23:43"}
{"current_steps": 860, "total_steps": 7385, "loss": 0.8411, "learning_rate": 0.00019983646850279692, "epoch": 0.5822613405551794, "percentage": 11.65, "elapsed_time": "0:11:00", "remaining_time": "1:23:29"}
{"current_steps": 870, "total_steps": 7385, "loss": 0.9106, "learning_rate": 0.0001998083305558394, "epoch": 0.5890318212593094, "percentage": 11.78, "elapsed_time": "0:11:07", "remaining_time": "1:23:17"}
{"current_steps": 880, "total_steps": 7385, "loss": 0.9071, "learning_rate": 0.00019977796240250008, "epoch": 0.5958023019634394, "percentage": 11.92, "elapsed_time": "0:11:14", "remaining_time": "1:23:06"}
{"current_steps": 890, "total_steps": 7385, "loss": 0.9038, "learning_rate": 0.00019974536472135203, "epoch": 0.6025727826675694, "percentage": 12.05, "elapsed_time": "0:11:22", "remaining_time": "1:22:58"}
{"current_steps": 900, "total_steps": 7385, "loss": 0.8832, "learning_rate": 0.00019971053824078693, "epoch": 0.6093432633716994, "percentage": 12.19, "elapsed_time": "0:11:28", "remaining_time": "1:22:42"}
{"current_steps": 910, "total_steps": 7385, "loss": 0.845, "learning_rate": 0.00019967348373899868, "epoch": 0.6161137440758294, "percentage": 12.32, "elapsed_time": "0:11:37", "remaining_time": "1:22:42"}
{"current_steps": 920, "total_steps": 7385, "loss": 0.9287, "learning_rate": 0.0001996342020439662, "epoch": 0.6228842247799594, "percentage": 12.46, "elapsed_time": "0:11:44", "remaining_time": "1:22:30"}
{"current_steps": 930, "total_steps": 7385, "loss": 0.8836, "learning_rate": 0.00019959269403343474, "epoch": 0.6296547054840894, "percentage": 12.59, "elapsed_time": "0:11:52", "remaining_time": "1:22:22"}
{"current_steps": 940, "total_steps": 7385, "loss": 0.8759, "learning_rate": 0.00019954896063489622, "epoch": 0.6364251861882194, "percentage": 12.73, "elapsed_time": "0:12:00", "remaining_time": "1:22:21"}
{"current_steps": 950, "total_steps": 7385, "loss": 0.9136, "learning_rate": 0.0001995030028255688, "epoch": 0.6431956668923493, "percentage": 12.86, "elapsed_time": "0:12:08", "remaining_time": "1:22:17"}
{"current_steps": 960, "total_steps": 7385, "loss": 0.8388, "learning_rate": 0.00019945482163237472, "epoch": 0.6499661475964793, "percentage": 13.0, "elapsed_time": "0:12:15", "remaining_time": "1:22:01"}
{"current_steps": 970, "total_steps": 7385, "loss": 0.8804, "learning_rate": 0.0001994044181319176, "epoch": 0.6567366283006093, "percentage": 13.13, "elapsed_time": "0:12:22", "remaining_time": "1:21:52"}
{"current_steps": 980, "total_steps": 7385, "loss": 0.8671, "learning_rate": 0.00019935179345045815, "epoch": 0.6635071090047393, "percentage": 13.27, "elapsed_time": "0:12:29", "remaining_time": "1:21:39"}
{"current_steps": 990, "total_steps": 7385, "loss": 0.8661, "learning_rate": 0.0001992969487638893, "epoch": 0.6702775897088693, "percentage": 13.41, "elapsed_time": "0:12:37", "remaining_time": "1:21:33"}
{"current_steps": 1000, "total_steps": 7385, "loss": 0.7901, "learning_rate": 0.00019923988529770958, "epoch": 0.6770480704129993, "percentage": 13.54, "elapsed_time": "0:12:44", "remaining_time": "1:21:22"}
{"current_steps": 1000, "total_steps": 7385, "eval_loss": 0.8919770121574402, "epoch": 0.6770480704129993, "percentage": 13.54, "elapsed_time": "0:13:08", "remaining_time": "1:23:53"}
{"current_steps": 1010, "total_steps": 7385, "loss": 0.8084, "learning_rate": 0.000199180604326996, "epoch": 0.6838185511171293, "percentage": 13.68, "elapsed_time": "0:13:17", "remaining_time": "1:23:52"}
{"current_steps": 1020, "total_steps": 7385, "loss": 0.8708, "learning_rate": 0.00019911910717637548, "epoch": 0.6905890318212593, "percentage": 13.81, "elapsed_time": "0:13:24", "remaining_time": "1:23:40"}
{"current_steps": 1030, "total_steps": 7385, "loss": 0.8608, "learning_rate": 0.00019905539521999517, "epoch": 0.6973595125253893, "percentage": 13.95, "elapsed_time": "0:13:32", "remaining_time": "1:23:33"}
{"current_steps": 1040, "total_steps": 7385, "loss": 0.9042, "learning_rate": 0.00019898946988149193, "epoch": 0.7041299932295193, "percentage": 14.08, "elapsed_time": "0:13:40", "remaining_time": "1:23:27"}
{"current_steps": 1050, "total_steps": 7385, "loss": 0.8896, "learning_rate": 0.0001989213326339603, "epoch": 0.7109004739336493, "percentage": 14.22, "elapsed_time": "0:13:48", "remaining_time": "1:23:20"}
{"current_steps": 1060, "total_steps": 7385, "loss": 0.8685, "learning_rate": 0.00019885098499991972, "epoch": 0.7176709546377793, "percentage": 14.35, "elapsed_time": "0:13:56", "remaining_time": "1:23:14"}
{"current_steps": 1070, "total_steps": 7385, "loss": 0.8615, "learning_rate": 0.0001987784285512805, "epoch": 0.7244414353419093, "percentage": 14.49, "elapsed_time": "0:14:03", "remaining_time": "1:22:59"}
{"current_steps": 1080, "total_steps": 7385, "loss": 0.8786, "learning_rate": 0.00019870366490930868, "epoch": 0.7312119160460393, "percentage": 14.62, "elapsed_time": "0:14:13", "remaining_time": "1:23:02"}
{"current_steps": 1090, "total_steps": 7385, "loss": 0.8872, "learning_rate": 0.0001986266957445897, "epoch": 0.7379823967501693, "percentage": 14.76, "elapsed_time": "0:14:21", "remaining_time": "1:22:53"}
{"current_steps": 1100, "total_steps": 7385, "loss": 0.8544, "learning_rate": 0.00019854752277699138, "epoch": 0.7447528774542993, "percentage": 14.9, "elapsed_time": "0:14:29", "remaining_time": "1:22:46"}
{"current_steps": 1110, "total_steps": 7385, "loss": 0.8256, "learning_rate": 0.000198466147775625, "epoch": 0.7515233581584293, "percentage": 15.03, "elapsed_time": "0:14:36", "remaining_time": "1:22:37"}
{"current_steps": 1120, "total_steps": 7385, "loss": 0.8642, "learning_rate": 0.00019838257255880626, "epoch": 0.7582938388625592, "percentage": 15.17, "elapsed_time": "0:14:44", "remaining_time": "1:22:28"}
{"current_steps": 1130, "total_steps": 7385, "loss": 0.8624, "learning_rate": 0.00019829679899401436, "epoch": 0.7650643195666892, "percentage": 15.3, "elapsed_time": "0:14:51", "remaining_time": "1:22:16"}
{"current_steps": 1140, "total_steps": 7385, "loss": 0.8312, "learning_rate": 0.00019820882899785038, "epoch": 0.7718348002708192, "percentage": 15.44, "elapsed_time": "0:14:59", "remaining_time": "1:22:06"}
{"current_steps": 1150, "total_steps": 7385, "loss": 0.8467, "learning_rate": 0.00019811866453599435, "epoch": 0.7786052809749492, "percentage": 15.57, "elapsed_time": "0:15:07", "remaining_time": "1:21:58"}
{"current_steps": 1160, "total_steps": 7385, "loss": 0.8456, "learning_rate": 0.00019802630762316145, "epoch": 0.7853757616790792, "percentage": 15.71, "elapsed_time": "0:15:14", "remaining_time": "1:21:48"}
{"current_steps": 1170, "total_steps": 7385, "loss": 0.8391, "learning_rate": 0.00019793176032305697, "epoch": 0.7921462423832092, "percentage": 15.84, "elapsed_time": "0:15:21", "remaining_time": "1:21:37"}
{"current_steps": 1180, "total_steps": 7385, "loss": 0.904, "learning_rate": 0.00019783502474833009, "epoch": 0.7989167230873392, "percentage": 15.98, "elapsed_time": "0:15:29", "remaining_time": "1:21:26"}
{"current_steps": 1190, "total_steps": 7385, "loss": 0.8494, "learning_rate": 0.00019773610306052683, "epoch": 0.8056872037914692, "percentage": 16.11, "elapsed_time": "0:15:37", "remaining_time": "1:21:22"}
{"current_steps": 1200, "total_steps": 7385, "loss": 0.8865, "learning_rate": 0.00019763499747004165, "epoch": 0.8124576844955992, "percentage": 16.25, "elapsed_time": "0:15:45", "remaining_time": "1:21:12"}
{"current_steps": 1210, "total_steps": 7385, "loss": 0.8733, "learning_rate": 0.000197531710236068, "epoch": 0.8192281651997292, "percentage": 16.38, "elapsed_time": "0:15:53", "remaining_time": "1:21:04"}
{"current_steps": 1220, "total_steps": 7385, "loss": 0.9122, "learning_rate": 0.00019742624366654802, "epoch": 0.8259986459038592, "percentage": 16.52, "elapsed_time": "0:16:00", "remaining_time": "1:20:55"}
{"current_steps": 1230, "total_steps": 7385, "loss": 0.8429, "learning_rate": 0.00019731860011812087, "epoch": 0.8327691266079892, "percentage": 16.66, "elapsed_time": "0:16:07", "remaining_time": "1:20:41"}
{"current_steps": 1240, "total_steps": 7385, "loss": 0.9004, "learning_rate": 0.00019720878199606996, "epoch": 0.8395396073121192, "percentage": 16.79, "elapsed_time": "0:16:15", "remaining_time": "1:20:33"}
{"current_steps": 1250, "total_steps": 7385, "loss": 0.9241, "learning_rate": 0.00019709679175426942, "epoch": 0.8463100880162492, "percentage": 16.93, "elapsed_time": "0:16:22", "remaining_time": "1:20:23"}
{"current_steps": 1260, "total_steps": 7385, "loss": 0.8566, "learning_rate": 0.00019698263189512914, "epoch": 0.8530805687203792, "percentage": 17.06, "elapsed_time": "0:16:30", "remaining_time": "1:20:16"}
{"current_steps": 1270, "total_steps": 7385, "loss": 0.9116, "learning_rate": 0.00019686630496953882, "epoch": 0.8598510494245092, "percentage": 17.2, "elapsed_time": "0:16:37", "remaining_time": "1:20:02"}
{"current_steps": 1280, "total_steps": 7385, "loss": 0.8052, "learning_rate": 0.00019674781357681108, "epoch": 0.8666215301286392, "percentage": 17.33, "elapsed_time": "0:16:44", "remaining_time": "1:19:53"}
{"current_steps": 1290, "total_steps": 7385, "loss": 0.89, "learning_rate": 0.00019662716036462335, "epoch": 0.8733920108327691, "percentage": 17.47, "elapsed_time": "0:16:52", "remaining_time": "1:19:43"}
{"current_steps": 1300, "total_steps": 7385, "loss": 0.8191, "learning_rate": 0.0001965043480289586, "epoch": 0.8801624915368991, "percentage": 17.6, "elapsed_time": "0:16:58", "remaining_time": "1:19:29"}
{"current_steps": 1310, "total_steps": 7385, "loss": 0.8995, "learning_rate": 0.00019637937931404523, "epoch": 0.8869329722410291, "percentage": 17.74, "elapsed_time": "0:17:06", "remaining_time": "1:19:20"}
{"current_steps": 1320, "total_steps": 7385, "loss": 0.8582, "learning_rate": 0.00019625225701229573, "epoch": 0.8937034529451591, "percentage": 17.87, "elapsed_time": "0:17:15", "remaining_time": "1:19:15"}
{"current_steps": 1330, "total_steps": 7385, "loss": 0.844, "learning_rate": 0.00019612298396424417, "epoch": 0.9004739336492891, "percentage": 18.01, "elapsed_time": "0:17:22", "remaining_time": "1:19:06"}
{"current_steps": 1340, "total_steps": 7385, "loss": 0.8609, "learning_rate": 0.0001959915630584829, "epoch": 0.9072444143534191, "percentage": 18.14, "elapsed_time": "0:17:31", "remaining_time": "1:19:03"}
{"current_steps": 1350, "total_steps": 7385, "loss": 0.91, "learning_rate": 0.00019585799723159788, "epoch": 0.9140148950575491, "percentage": 18.28, "elapsed_time": "0:17:38", "remaining_time": "1:18:53"}
{"current_steps": 1360, "total_steps": 7385, "loss": 0.8287, "learning_rate": 0.0001957222894681031, "epoch": 0.9207853757616791, "percentage": 18.42, "elapsed_time": "0:17:46", "remaining_time": "1:18:44"}
{"current_steps": 1370, "total_steps": 7385, "loss": 0.7931, "learning_rate": 0.00019558444280037393, "epoch": 0.9275558564658091, "percentage": 18.55, "elapsed_time": "0:17:53", "remaining_time": "1:18:34"}
{"current_steps": 1380, "total_steps": 7385, "loss": 0.8941, "learning_rate": 0.00019544446030857922, "epoch": 0.9343263371699391, "percentage": 18.69, "elapsed_time": "0:18:02", "remaining_time": "1:18:29"}
{"current_steps": 1390, "total_steps": 7385, "loss": 0.8674, "learning_rate": 0.0001953023451206127, "epoch": 0.9410968178740691, "percentage": 18.82, "elapsed_time": "0:18:08", "remaining_time": "1:18:16"}
{"current_steps": 1400, "total_steps": 7385, "loss": 0.8462, "learning_rate": 0.00019515810041202295, "epoch": 0.9478672985781991, "percentage": 18.96, "elapsed_time": "0:18:16", "remaining_time": "1:18:08"}
{"current_steps": 1410, "total_steps": 7385, "loss": 0.8594, "learning_rate": 0.00019501172940594242, "epoch": 0.9546377792823291, "percentage": 19.09, "elapsed_time": "0:18:24", "remaining_time": "1:18:01"}
{"current_steps": 1420, "total_steps": 7385, "loss": 0.8622, "learning_rate": 0.00019486323537301538, "epoch": 0.9614082599864591, "percentage": 19.23, "elapsed_time": "0:18:31", "remaining_time": "1:17:49"}
{"current_steps": 1430, "total_steps": 7385, "loss": 0.8626, "learning_rate": 0.00019471262163132504, "epoch": 0.9681787406905891, "percentage": 19.36, "elapsed_time": "0:18:38", "remaining_time": "1:17:38"}
{"current_steps": 1440, "total_steps": 7385, "loss": 0.871, "learning_rate": 0.0001945598915463192, "epoch": 0.9749492213947191, "percentage": 19.5, "elapsed_time": "0:18:45", "remaining_time": "1:17:28"}
{"current_steps": 1450, "total_steps": 7385, "loss": 0.8555, "learning_rate": 0.00019440504853073516, "epoch": 0.9817197020988491, "percentage": 19.63, "elapsed_time": "0:18:54", "remaining_time": "1:17:23"}
{"current_steps": 1460, "total_steps": 7385, "loss": 0.826, "learning_rate": 0.00019424809604452338, "epoch": 0.988490182802979, "percentage": 19.77, "elapsed_time": "0:19:03", "remaining_time": "1:17:18"}
{"current_steps": 1470, "total_steps": 7385, "loss": 0.8657, "learning_rate": 0.00019408903759477025, "epoch": 0.995260663507109, "percentage": 19.91, "elapsed_time": "0:19:10", "remaining_time": "1:17:09"}
{"current_steps": 1480, "total_steps": 7385, "loss": 0.8114, "learning_rate": 0.00019392787673561964, "epoch": 1.002031144211239, "percentage": 20.04, "elapsed_time": "0:19:18", "remaining_time": "1:17:00"}
{"current_steps": 1490, "total_steps": 7385, "loss": 0.7081, "learning_rate": 0.00019376461706819358, "epoch": 1.008801624915369, "percentage": 20.18, "elapsed_time": "0:19:25", "remaining_time": "1:16:49"}
{"current_steps": 1500, "total_steps": 7385, "loss": 0.697, "learning_rate": 0.00019359926224051178, "epoch": 1.015572105619499, "percentage": 20.31, "elapsed_time": "0:19:32", "remaining_time": "1:16:41"}
{"current_steps": 1510, "total_steps": 7385, "loss": 0.7743, "learning_rate": 0.00019343181594740996, "epoch": 1.022342586323629, "percentage": 20.45, "elapsed_time": "0:19:40", "remaining_time": "1:16:32"}
{"current_steps": 1520, "total_steps": 7385, "loss": 0.7965, "learning_rate": 0.00019326228193045753, "epoch": 1.029113067027759, "percentage": 20.58, "elapsed_time": "0:19:48", "remaining_time": "1:16:24"}
{"current_steps": 1530, "total_steps": 7385, "loss": 0.7399, "learning_rate": 0.00019309066397787378, "epoch": 1.035883547731889, "percentage": 20.72, "elapsed_time": "0:19:55", "remaining_time": "1:16:13"}
{"current_steps": 1540, "total_steps": 7385, "loss": 0.7503, "learning_rate": 0.0001929169659244434, "epoch": 1.042654028436019, "percentage": 20.85, "elapsed_time": "0:20:03", "remaining_time": "1:16:06"}
{"current_steps": 1550, "total_steps": 7385, "loss": 0.7867, "learning_rate": 0.00019274119165143064, "epoch": 1.0494245091401488, "percentage": 20.99, "elapsed_time": "0:20:11", "remaining_time": "1:16:02"}
{"current_steps": 1560, "total_steps": 7385, "loss": 0.7303, "learning_rate": 0.00019256334508649262, "epoch": 1.0561949898442788, "percentage": 21.12, "elapsed_time": "0:20:19", "remaining_time": "1:15:52"}
{"current_steps": 1570, "total_steps": 7385, "loss": 0.7375, "learning_rate": 0.00019238343020359174, "epoch": 1.0629654705484088, "percentage": 21.26, "elapsed_time": "0:20:26", "remaining_time": "1:15:41"}
{"current_steps": 1580, "total_steps": 7385, "loss": 0.7569, "learning_rate": 0.00019220145102290658, "epoch": 1.0697359512525388, "percentage": 21.39, "elapsed_time": "0:20:34", "remaining_time": "1:15:35"}
{"current_steps": 1590, "total_steps": 7385, "loss": 0.7594, "learning_rate": 0.00019201741161074234, "epoch": 1.0765064319566688, "percentage": 21.53, "elapsed_time": "0:20:42", "remaining_time": "1:15:27"}
{"current_steps": 1600, "total_steps": 7385, "loss": 0.7721, "learning_rate": 0.00019183131607943983, "epoch": 1.0832769126607988, "percentage": 21.67, "elapsed_time": "0:20:50", "remaining_time": "1:15:21"}
{"current_steps": 1610, "total_steps": 7385, "loss": 0.6816, "learning_rate": 0.00019164316858728364, "epoch": 1.0900473933649288, "percentage": 21.8, "elapsed_time": "0:20:58", "remaining_time": "1:15:13"}
{"current_steps": 1620, "total_steps": 7385, "loss": 0.7927, "learning_rate": 0.00019145297333840916, "epoch": 1.0968178740690588, "percentage": 21.94, "elapsed_time": "0:21:06", "remaining_time": "1:15:06"}
{"current_steps": 1630, "total_steps": 7385, "loss": 0.8416, "learning_rate": 0.00019126073458270874, "epoch": 1.1035883547731888, "percentage": 22.07, "elapsed_time": "0:21:14", "remaining_time": "1:14:58"}
{"current_steps": 1640, "total_steps": 7385, "loss": 0.7731, "learning_rate": 0.00019106645661573667, "epoch": 1.1103588354773188, "percentage": 22.21, "elapsed_time": "0:21:21", "remaining_time": "1:14:48"}
{"current_steps": 1650, "total_steps": 7385, "loss": 0.7954, "learning_rate": 0.0001908701437786131, "epoch": 1.1171293161814488, "percentage": 22.34, "elapsed_time": "0:21:29", "remaining_time": "1:14:40"}
{"current_steps": 1660, "total_steps": 7385, "loss": 0.7224, "learning_rate": 0.00019067180045792724, "epoch": 1.1238997968855788, "percentage": 22.48, "elapsed_time": "0:21:37", "remaining_time": "1:14:34"}
{"current_steps": 1670, "total_steps": 7385, "loss": 0.7761, "learning_rate": 0.0001904714310856392, "epoch": 1.1306702775897088, "percentage": 22.61, "elapsed_time": "0:21:45", "remaining_time": "1:14:26"}
{"current_steps": 1680, "total_steps": 7385, "loss": 0.7552, "learning_rate": 0.00019026904013898097, "epoch": 1.1374407582938388, "percentage": 22.75, "elapsed_time": "0:21:53", "remaining_time": "1:14:19"}
{"current_steps": 1690, "total_steps": 7385, "loss": 0.7458, "learning_rate": 0.00019006463214035646, "epoch": 1.1442112389979688, "percentage": 22.88, "elapsed_time": "0:22:00", "remaining_time": "1:14:10"}
{"current_steps": 1700, "total_steps": 7385, "loss": 0.7811, "learning_rate": 0.00018985821165724034, "epoch": 1.1509817197020988, "percentage": 23.02, "elapsed_time": "0:22:10", "remaining_time": "1:14:08"}
{"current_steps": 1710, "total_steps": 7385, "loss": 0.7596, "learning_rate": 0.00018964978330207605, "epoch": 1.1577522004062288, "percentage": 23.16, "elapsed_time": "0:22:18", "remaining_time": "1:14:00"}
{"current_steps": 1720, "total_steps": 7385, "loss": 0.7075, "learning_rate": 0.0001894393517321727, "epoch": 1.1645226811103588, "percentage": 23.29, "elapsed_time": "0:22:25", "remaining_time": "1:13:52"}
{"current_steps": 1730, "total_steps": 7385, "loss": 0.7585, "learning_rate": 0.00018922692164960098, "epoch": 1.1712931618144888, "percentage": 23.43, "elapsed_time": "0:22:32", "remaining_time": "1:13:42"}
{"current_steps": 1740, "total_steps": 7385, "loss": 0.7459, "learning_rate": 0.00018901249780108823, "epoch": 1.1780636425186188, "percentage": 23.56, "elapsed_time": "0:22:39", "remaining_time": "1:13:32"}
{"current_steps": 1750, "total_steps": 7385, "loss": 0.7271, "learning_rate": 0.00018879608497791224, "epoch": 1.1848341232227488, "percentage": 23.7, "elapsed_time": "0:22:47", "remaining_time": "1:13:22"}
{"current_steps": 1760, "total_steps": 7385, "loss": 0.7932, "learning_rate": 0.00018857768801579415, "epoch": 1.1916046039268788, "percentage": 23.83, "elapsed_time": "0:22:54", "remaining_time": "1:13:13"}
{"current_steps": 1770, "total_steps": 7385, "loss": 0.8144, "learning_rate": 0.00018835731179479056, "epoch": 1.1983750846310088, "percentage": 23.97, "elapsed_time": "0:23:02", "remaining_time": "1:13:04"}
{"current_steps": 1780, "total_steps": 7385, "loss": 0.7402, "learning_rate": 0.00018813496123918432, "epoch": 1.2051455653351388, "percentage": 24.1, "elapsed_time": "0:23:09", "remaining_time": "1:12:56"}
{"current_steps": 1790, "total_steps": 7385, "loss": 0.7852, "learning_rate": 0.00018791064131737462, "epoch": 1.2119160460392688, "percentage": 24.24, "elapsed_time": "0:23:17", "remaining_time": "1:12:48"}
{"current_steps": 1800, "total_steps": 7385, "loss": 0.7128, "learning_rate": 0.00018768435704176597, "epoch": 1.2186865267433988, "percentage": 24.37, "elapsed_time": "0:23:25", "remaining_time": "1:12:39"}
{"current_steps": 1810, "total_steps": 7385, "loss": 0.7488, "learning_rate": 0.00018745611346865606, "epoch": 1.2254570074475288, "percentage": 24.51, "elapsed_time": "0:23:33", "remaining_time": "1:12:32"}
{"current_steps": 1820, "total_steps": 7385, "loss": 0.8368, "learning_rate": 0.00018722591569812294, "epoch": 1.2322274881516588, "percentage": 24.64, "elapsed_time": "0:23:40", "remaining_time": "1:12:24"}
{"current_steps": 1830, "total_steps": 7385, "loss": 0.8279, "learning_rate": 0.00018699376887391093, "epoch": 1.2389979688557888, "percentage": 24.78, "elapsed_time": "0:23:49", "remaining_time": "1:12:19"}
{"current_steps": 1840, "total_steps": 7385, "loss": 0.7308, "learning_rate": 0.0001867596781833158, "epoch": 1.2457684495599188, "percentage": 24.92, "elapsed_time": "0:23:57", "remaining_time": "1:12:10"}
{"current_steps": 1850, "total_steps": 7385, "loss": 0.783, "learning_rate": 0.0001865236488570688, "epoch": 1.2525389302640488, "percentage": 25.05, "elapsed_time": "0:24:04", "remaining_time": "1:12:03"}
{"current_steps": 1860, "total_steps": 7385, "loss": 0.7581, "learning_rate": 0.00018628568616921976, "epoch": 1.2593094109681786, "percentage": 25.19, "elapsed_time": "0:24:13", "remaining_time": "1:11:58"}
{"current_steps": 1870, "total_steps": 7385, "loss": 0.7696, "learning_rate": 0.00018604579543701926, "epoch": 1.2660798916723088, "percentage": 25.32, "elapsed_time": "0:24:21", "remaining_time": "1:11:51"}
{"current_steps": 1880, "total_steps": 7385, "loss": 0.7202, "learning_rate": 0.00018580398202079987, "epoch": 1.2728503723764386, "percentage": 25.46, "elapsed_time": "0:24:30", "remaining_time": "1:11:44"}
{"current_steps": 1890, "total_steps": 7385, "loss": 0.7685, "learning_rate": 0.00018556025132385626, "epoch": 1.2796208530805688, "percentage": 25.59, "elapsed_time": "0:24:38", "remaining_time": "1:11:37"}
{"current_steps": 1900, "total_steps": 7385, "loss": 0.7814, "learning_rate": 0.00018531460879232456, "epoch": 1.2863913337846986, "percentage": 25.73, "elapsed_time": "0:24:44", "remaining_time": "1:11:26"}
{"current_steps": 1910, "total_steps": 7385, "loss": 0.7202, "learning_rate": 0.00018506705991506067, "epoch": 1.2931618144888288, "percentage": 25.86, "elapsed_time": "0:24:52", "remaining_time": "1:11:18"}
{"current_steps": 1920, "total_steps": 7385, "loss": 0.785, "learning_rate": 0.00018481761022351757, "epoch": 1.2999322951929586, "percentage": 26.0, "elapsed_time": "0:24:59", "remaining_time": "1:11:08"}
{"current_steps": 1930, "total_steps": 7385, "loss": 0.7693, "learning_rate": 0.0001845662652916217, "epoch": 1.3067027758970888, "percentage": 26.13, "elapsed_time": "0:25:07", "remaining_time": "1:11:01"}
{"current_steps": 1940, "total_steps": 7385, "loss": 0.8127, "learning_rate": 0.00018431303073564842, "epoch": 1.3134732566012186, "percentage": 26.27, "elapsed_time": "0:25:14", "remaining_time": "1:10:51"}
{"current_steps": 1950, "total_steps": 7385, "loss": 0.7804, "learning_rate": 0.0001840579122140966, "epoch": 1.3202437373053486, "percentage": 26.4, "elapsed_time": "0:25:22", "remaining_time": "1:10:44"}
{"current_steps": 1960, "total_steps": 7385, "loss": 0.7563, "learning_rate": 0.00018380091542756212, "epoch": 1.3270142180094786, "percentage": 26.54, "elapsed_time": "0:25:30", "remaining_time": "1:10:35"}
{"current_steps": 1970, "total_steps": 7385, "loss": 0.7382, "learning_rate": 0.00018354204611861042, "epoch": 1.3337846987136086, "percentage": 26.68, "elapsed_time": "0:25:37", "remaining_time": "1:10:26"}
{"current_steps": 1980, "total_steps": 7385, "loss": 0.7543, "learning_rate": 0.00018328131007164827, "epoch": 1.3405551794177386, "percentage": 26.81, "elapsed_time": "0:25:44", "remaining_time": "1:10:16"}
{"current_steps": 1990, "total_steps": 7385, "loss": 0.7877, "learning_rate": 0.00018301871311279455, "epoch": 1.3473256601218686, "percentage": 26.95, "elapsed_time": "0:25:52", "remaining_time": "1:10:08"}
{"current_steps": 2000, "total_steps": 7385, "loss": 0.7599, "learning_rate": 0.00018275426110975, "epoch": 1.3540961408259986, "percentage": 27.08, "elapsed_time": "0:25:59", "remaining_time": "1:09:59"}
{"current_steps": 2000, "total_steps": 7385, "eval_loss": 0.8573334813117981, "epoch": 1.3540961408259986, "percentage": 27.08, "elapsed_time": "0:26:22", "remaining_time": "1:11:01"}
{"current_steps": 2010, "total_steps": 7385, "loss": 0.772, "learning_rate": 0.00018248795997166607, "epoch": 1.3608666215301286, "percentage": 27.22, "elapsed_time": "0:26:31", "remaining_time": "1:10:54"}
{"current_steps": 2020, "total_steps": 7385, "loss": 0.8211, "learning_rate": 0.000182219815649013, "epoch": 1.3676371022342586, "percentage": 27.35, "elapsed_time": "0:26:39", "remaining_time": "1:10:47"}
{"current_steps": 2030, "total_steps": 7385, "loss": 0.7549, "learning_rate": 0.00018194983413344674, "epoch": 1.3744075829383886, "percentage": 27.49, "elapsed_time": "0:26:47", "remaining_time": "1:10:39"}
{"current_steps": 2040, "total_steps": 7385, "loss": 0.7133, "learning_rate": 0.00018167802145767513, "epoch": 1.3811780636425186, "percentage": 27.62, "elapsed_time": "0:26:54", "remaining_time": "1:10:30"}
{"current_steps": 2050, "total_steps": 7385, "loss": 0.7562, "learning_rate": 0.0001814043836953231, "epoch": 1.3879485443466486, "percentage": 27.76, "elapsed_time": "0:27:02", "remaining_time": "1:10:22"}
{"current_steps": 2060, "total_steps": 7385, "loss": 0.7411, "learning_rate": 0.00018112892696079698, "epoch": 1.3947190250507786, "percentage": 27.89, "elapsed_time": "0:27:10", "remaining_time": "1:10:14"}
{"current_steps": 2070, "total_steps": 7385, "loss": 0.7568, "learning_rate": 0.00018085165740914776, "epoch": 1.4014895057549086, "percentage": 28.03, "elapsed_time": "0:27:18", "remaining_time": "1:10:07"}
{"current_steps": 2080, "total_steps": 7385, "loss": 0.7358, "learning_rate": 0.00018057258123593367, "epoch": 1.4082599864590386, "percentage": 28.17, "elapsed_time": "0:27:26", "remaining_time": "1:09:59"}
{"current_steps": 2090, "total_steps": 7385, "loss": 0.7352, "learning_rate": 0.00018029170467708165, "epoch": 1.4150304671631686, "percentage": 28.3, "elapsed_time": "0:27:34", "remaining_time": "1:09:51"}
{"current_steps": 2100, "total_steps": 7385, "loss": 0.8073, "learning_rate": 0.00018000903400874823, "epoch": 1.4218009478672986, "percentage": 28.44, "elapsed_time": "0:27:42", "remaining_time": "1:09:44"}
{"current_steps": 2110, "total_steps": 7385, "loss": 0.7886, "learning_rate": 0.0001797245755471789, "epoch": 1.4285714285714286, "percentage": 28.57, "elapsed_time": "0:27:49", "remaining_time": "1:09:33"}
{"current_steps": 2120, "total_steps": 7385, "loss": 0.7216, "learning_rate": 0.00017943833564856737, "epoch": 1.4353419092755586, "percentage": 28.71, "elapsed_time": "0:27:56", "remaining_time": "1:09:24"}
{"current_steps": 2130, "total_steps": 7385, "loss": 0.7077, "learning_rate": 0.00017915032070891327, "epoch": 1.4421123899796886, "percentage": 28.84, "elapsed_time": "0:28:04", "remaining_time": "1:09:16"}
{"current_steps": 2140, "total_steps": 7385, "loss": 0.7511, "learning_rate": 0.00017886053716387935, "epoch": 1.4488828706838186, "percentage": 28.98, "elapsed_time": "0:28:12", "remaining_time": "1:09:07"}
{"current_steps": 2150, "total_steps": 7385, "loss": 0.7603, "learning_rate": 0.00017856899148864774, "epoch": 1.4556533513879486, "percentage": 29.11, "elapsed_time": "0:28:19", "remaining_time": "1:08:57"}
{"current_steps": 2160, "total_steps": 7385, "loss": 0.7301, "learning_rate": 0.00017827569019777503, "epoch": 1.4624238320920786, "percentage": 29.25, "elapsed_time": "0:28:26", "remaining_time": "1:08:48"}
{"current_steps": 2170, "total_steps": 7385, "loss": 0.7858, "learning_rate": 0.00017798063984504698, "epoch": 1.4691943127962086, "percentage": 29.38, "elapsed_time": "0:28:35", "remaining_time": "1:08:42"}
{"current_steps": 2180, "total_steps": 7385, "loss": 0.8125, "learning_rate": 0.00017768384702333188, "epoch": 1.4759647935003386, "percentage": 29.52, "elapsed_time": "0:28:43", "remaining_time": "1:08:34"}
{"current_steps": 2190, "total_steps": 7385, "loss": 0.7731, "learning_rate": 0.00017738531836443332, "epoch": 1.4827352742044684, "percentage": 29.65, "elapsed_time": "0:28:50", "remaining_time": "1:08:25"}
{"current_steps": 2200, "total_steps": 7385, "loss": 0.7407, "learning_rate": 0.000177085060538942, "epoch": 1.4895057549085986, "percentage": 29.79, "elapsed_time": "0:28:58", "remaining_time": "1:08:17"}
{"current_steps": 2210, "total_steps": 7385, "loss": 0.7751, "learning_rate": 0.00017678308025608665, "epoch": 1.4962762356127284, "percentage": 29.93, "elapsed_time": "0:29:06", "remaining_time": "1:08:10"}
{"current_steps": 2220, "total_steps": 7385, "loss": 0.7642, "learning_rate": 0.00017647938426358412, "epoch": 1.5030467163168586, "percentage": 30.06, "elapsed_time": "0:29:13", "remaining_time": "1:08:00"}
{"current_steps": 2230, "total_steps": 7385, "loss": 0.8069, "learning_rate": 0.00017617397934748859, "epoch": 1.5098171970209884, "percentage": 30.2, "elapsed_time": "0:29:22", "remaining_time": "1:07:53"}
{"current_steps": 2240, "total_steps": 7385, "loss": 0.7463, "learning_rate": 0.00017586687233204, "epoch": 1.5165876777251186, "percentage": 30.33, "elapsed_time": "0:29:29", "remaining_time": "1:07:44"}
{"current_steps": 2250, "total_steps": 7385, "loss": 0.8157, "learning_rate": 0.00017555807007951142, "epoch": 1.5233581584292484, "percentage": 30.47, "elapsed_time": "0:29:37", "remaining_time": "1:07:36"}
{"current_steps": 2260, "total_steps": 7385, "loss": 0.8012, "learning_rate": 0.00017524757949005597, "epoch": 1.5301286391333786, "percentage": 30.6, "elapsed_time": "0:29:45", "remaining_time": "1:07:28"}
{"current_steps": 2270, "total_steps": 7385, "loss": 0.7429, "learning_rate": 0.00017493540750155236, "epoch": 1.5368991198375084, "percentage": 30.74, "elapsed_time": "0:29:52", "remaining_time": "1:07:18"}
{"current_steps": 2280, "total_steps": 7385, "loss": 0.7619, "learning_rate": 0.00017462156108944996, "epoch": 1.5436696005416386, "percentage": 30.87, "elapsed_time": "0:30:00", "remaining_time": "1:07:10"}
{"current_steps": 2290, "total_steps": 7385, "loss": 0.7792, "learning_rate": 0.00017430604726661304, "epoch": 1.5504400812457684, "percentage": 31.01, "elapsed_time": "0:30:08", "remaining_time": "1:07:03"}
{"current_steps": 2300, "total_steps": 7385, "loss": 0.7875, "learning_rate": 0.00017398887308316393, "epoch": 1.5572105619498986, "percentage": 31.14, "elapsed_time": "0:30:16", "remaining_time": "1:06:56"}
{"current_steps": 2310, "total_steps": 7385, "loss": 0.7395, "learning_rate": 0.00017367004562632556, "epoch": 1.5639810426540284, "percentage": 31.28, "elapsed_time": "0:30:24", "remaining_time": "1:06:47"}
{"current_steps": 2320, "total_steps": 7385, "loss": 0.734, "learning_rate": 0.00017334957202026305, "epoch": 1.5707515233581584, "percentage": 31.42, "elapsed_time": "0:30:32", "remaining_time": "1:06:40"}
{"current_steps": 2330, "total_steps": 7385, "loss": 0.732, "learning_rate": 0.0001730274594259246, "epoch": 1.5775220040622884, "percentage": 31.55, "elapsed_time": "0:30:39", "remaining_time": "1:06:31"}
{"current_steps": 2340, "total_steps": 7385, "loss": 0.7176, "learning_rate": 0.0001727037150408813, "epoch": 1.5842924847664184, "percentage": 31.69, "elapsed_time": "0:30:46", "remaining_time": "1:06:21"}
{"current_steps": 2350, "total_steps": 7385, "loss": 0.7883, "learning_rate": 0.00017237834609916668, "epoch": 1.5910629654705484, "percentage": 31.82, "elapsed_time": "0:30:54", "remaining_time": "1:06:13"}
{"current_steps": 2360, "total_steps": 7385, "loss": 0.7511, "learning_rate": 0.00017205135987111446, "epoch": 1.5978334461746784, "percentage": 31.96, "elapsed_time": "0:31:01", "remaining_time": "1:06:03"}
{"current_steps": 2370, "total_steps": 7385, "loss": 0.7344, "learning_rate": 0.0001717227636631968, "epoch": 1.6046039268788084, "percentage": 32.09, "elapsed_time": "0:31:08", "remaining_time": "1:05:53"}
{"current_steps": 2380, "total_steps": 7385, "loss": 0.7388, "learning_rate": 0.00017139256481786043, "epoch": 1.6113744075829384, "percentage": 32.23, "elapsed_time": "0:31:15", "remaining_time": "1:05:44"}
{"current_steps": 2390, "total_steps": 7385, "loss": 0.8181, "learning_rate": 0.00017106077071336298, "epoch": 1.6181448882870684, "percentage": 32.36, "elapsed_time": "0:31:25", "remaining_time": "1:05:39"}
{"current_steps": 2400, "total_steps": 7385, "loss": 0.7784, "learning_rate": 0.00017072738876360792, "epoch": 1.6249153689911984, "percentage": 32.5, "elapsed_time": "0:31:33", "remaining_time": "1:05:31"}
{"current_steps": 2410, "total_steps": 7385, "loss": 0.7631, "learning_rate": 0.00017039242641797895, "epoch": 1.6316858496953284, "percentage": 32.63, "elapsed_time": "0:31:40", "remaining_time": "1:05:23"}
{"current_steps": 2420, "total_steps": 7385, "loss": 0.7572, "learning_rate": 0.0001700558911611736, "epoch": 1.6384563303994584, "percentage": 32.77, "elapsed_time": "0:31:48", "remaining_time": "1:05:14"}
{"current_steps": 2430, "total_steps": 7385, "loss": 0.79, "learning_rate": 0.0001697177905130358, "epoch": 1.6452268111035884, "percentage": 32.9, "elapsed_time": "0:31:56", "remaining_time": "1:05:08"}
{"current_steps": 2440, "total_steps": 7385, "loss": 0.7389, "learning_rate": 0.00016937813202838817, "epoch": 1.6519972918077184, "percentage": 33.04, "elapsed_time": "0:32:03", "remaining_time": "1:04:58"}
{"current_steps": 2450, "total_steps": 7385, "loss": 0.8074, "learning_rate": 0.00016903692329686286, "epoch": 1.6587677725118484, "percentage": 33.18, "elapsed_time": "0:32:11", "remaining_time": "1:04:50"}
{"current_steps": 2460, "total_steps": 7385, "loss": 0.7493, "learning_rate": 0.00016869417194273216, "epoch": 1.6655382532159784, "percentage": 33.31, "elapsed_time": "0:32:19", "remaining_time": "1:04:41"}
{"current_steps": 2470, "total_steps": 7385, "loss": 0.7696, "learning_rate": 0.00016834988562473813, "epoch": 1.6723087339201084, "percentage": 33.45, "elapsed_time": "0:32:25", "remaining_time": "1:04:32"}
{"current_steps": 2480, "total_steps": 7385, "loss": 0.6736, "learning_rate": 0.00016800407203592144, "epoch": 1.6790792146242384, "percentage": 33.58, "elapsed_time": "0:32:34", "remaining_time": "1:04:25"}
{"current_steps": 2490, "total_steps": 7385, "loss": 0.7678, "learning_rate": 0.00016765673890344944, "epoch": 1.6858496953283684, "percentage": 33.72, "elapsed_time": "0:32:42", "remaining_time": "1:04:18"}
{"current_steps": 2500, "total_steps": 7385, "loss": 0.799, "learning_rate": 0.0001673078939884435, "epoch": 1.6926201760324981, "percentage": 33.85, "elapsed_time": "0:32:51", "remaining_time": "1:04:11"}
{"current_steps": 2510, "total_steps": 7385, "loss": 0.7445, "learning_rate": 0.00016695754508580556, "epoch": 1.6993906567366284, "percentage": 33.99, "elapsed_time": "0:32:59", "remaining_time": "1:04:04"}
{"current_steps": 2520, "total_steps": 7385, "loss": 0.7434, "learning_rate": 0.00016660570002404414, "epoch": 1.7061611374407581, "percentage": 34.12, "elapsed_time": "0:33:07", "remaining_time": "1:03:56"}
{"current_steps": 2530, "total_steps": 7385, "loss": 0.7785, "learning_rate": 0.0001662523666650992, "epoch": 1.7129316181448884, "percentage": 34.26, "elapsed_time": "0:33:15", "remaining_time": "1:03:48"}
{"current_steps": 2540, "total_steps": 7385, "loss": 0.7415, "learning_rate": 0.00016589755290416652, "epoch": 1.7197020988490181, "percentage": 34.39, "elapsed_time": "0:33:23", "remaining_time": "1:03:41"}
{"current_steps": 2550, "total_steps": 7385, "loss": 0.7568, "learning_rate": 0.0001655412666695213, "epoch": 1.7264725795531484, "percentage": 34.53, "elapsed_time": "0:33:30", "remaining_time": "1:03:31"}
{"current_steps": 2560, "total_steps": 7385, "loss": 0.714, "learning_rate": 0.00016518351592234102, "epoch": 1.7332430602572781, "percentage": 34.66, "elapsed_time": "0:33:37", "remaining_time": "1:03:22"}
{"current_steps": 2570, "total_steps": 7385, "loss": 0.8015, "learning_rate": 0.00016482430865652758, "epoch": 1.7400135409614084, "percentage": 34.8, "elapsed_time": "0:33:45", "remaining_time": "1:03:14"}
{"current_steps": 2580, "total_steps": 7385, "loss": 0.7517, "learning_rate": 0.0001644636528985286, "epoch": 1.7467840216655381, "percentage": 34.94, "elapsed_time": "0:33:52", "remaining_time": "1:03:06"}
{"current_steps": 2590, "total_steps": 7385, "loss": 0.7219, "learning_rate": 0.00016410155670715807, "epoch": 1.7535545023696684, "percentage": 35.07, "elapsed_time": "0:34:00", "remaining_time": "1:02:57"}
{"current_steps": 2600, "total_steps": 7385, "loss": 0.7544, "learning_rate": 0.00016373802817341631, "epoch": 1.7603249830737981, "percentage": 35.21, "elapsed_time": "0:34:08", "remaining_time": "1:02:50"}
{"current_steps": 2610, "total_steps": 7385, "loss": 0.7613, "learning_rate": 0.00016337307542030924, "epoch": 1.7670954637779284, "percentage": 35.34, "elapsed_time": "0:34:16", "remaining_time": "1:02:43"}
{"current_steps": 2620, "total_steps": 7385, "loss": 0.7028, "learning_rate": 0.00016300670660266678, "epoch": 1.7738659444820581, "percentage": 35.48, "elapsed_time": "0:34:25", "remaining_time": "1:02:35"}
{"current_steps": 2630, "total_steps": 7385, "loss": 0.7776, "learning_rate": 0.0001626389299069606, "epoch": 1.7806364251861884, "percentage": 35.61, "elapsed_time": "0:34:32", "remaining_time": "1:02:27"}
{"current_steps": 2640, "total_steps": 7385, "loss": 0.7127, "learning_rate": 0.00016226975355112134, "epoch": 1.7874069058903181, "percentage": 35.75, "elapsed_time": "0:34:39", "remaining_time": "1:02:18"}
{"current_steps": 2650, "total_steps": 7385, "loss": 0.7618, "learning_rate": 0.00016189918578435482, "epoch": 1.7941773865944484, "percentage": 35.88, "elapsed_time": "0:34:47", "remaining_time": "1:02:09"}
{"current_steps": 2660, "total_steps": 7385, "loss": 0.7364, "learning_rate": 0.00016152723488695783, "epoch": 1.8009478672985781, "percentage": 36.02, "elapsed_time": "0:34:55", "remaining_time": "1:02:01"}
{"current_steps": 2670, "total_steps": 7385, "loss": 0.7449, "learning_rate": 0.00016115390917013307, "epoch": 1.8077183480027081, "percentage": 36.15, "elapsed_time": "0:35:02", "remaining_time": "1:01:53"}
{"current_steps": 2680, "total_steps": 7385, "loss": 0.7766, "learning_rate": 0.00016077921697580343, "epoch": 1.8144888287068381, "percentage": 36.29, "elapsed_time": "0:35:10", "remaining_time": "1:01:45"}
{"current_steps": 2690, "total_steps": 7385, "loss": 0.7266, "learning_rate": 0.00016040316667642558, "epoch": 1.8212593094109681, "percentage": 36.43, "elapsed_time": "0:35:18", "remaining_time": "1:01:38"}
{"current_steps": 2700, "total_steps": 7385, "loss": 0.7344, "learning_rate": 0.00016002576667480288, "epoch": 1.8280297901150981, "percentage": 36.56, "elapsed_time": "0:35:26", "remaining_time": "1:01:30"}
{"current_steps": 2710, "total_steps": 7385, "loss": 0.7546, "learning_rate": 0.00015964702540389767, "epoch": 1.8348002708192281, "percentage": 36.7, "elapsed_time": "0:35:34", "remaining_time": "1:01:22"}
{"current_steps": 2720, "total_steps": 7385, "loss": 0.7482, "learning_rate": 0.0001592669513266428, "epoch": 1.8415707515233581, "percentage": 36.83, "elapsed_time": "0:35:42", "remaining_time": "1:01:13"}
{"current_steps": 2730, "total_steps": 7385, "loss": 0.7527, "learning_rate": 0.00015888555293575254, "epoch": 1.8483412322274881, "percentage": 36.97, "elapsed_time": "0:35:50", "remaining_time": "1:01:07"}
{"current_steps": 2740, "total_steps": 7385, "loss": 0.7672, "learning_rate": 0.0001585028387535328, "epoch": 1.8551117129316181, "percentage": 37.1, "elapsed_time": "0:35:59", "remaining_time": "1:01:00"}
{"current_steps": 2750, "total_steps": 7385, "loss": 0.7877, "learning_rate": 0.0001581188173316907, "epoch": 1.8618821936357481, "percentage": 37.24, "elapsed_time": "0:36:06", "remaining_time": "1:00:51"}
{"current_steps": 2760, "total_steps": 7385, "loss": 0.7711, "learning_rate": 0.00015773349725114352, "epoch": 1.8686526743398781, "percentage": 37.37, "elapsed_time": "0:36:14", "remaining_time": "1:00:43"}
{"current_steps": 2770, "total_steps": 7385, "loss": 0.7365, "learning_rate": 0.00015734688712182687, "epoch": 1.8754231550440081, "percentage": 37.51, "elapsed_time": "0:36:21", "remaining_time": "1:00:34"}
{"current_steps": 2780, "total_steps": 7385, "loss": 0.7144, "learning_rate": 0.0001569589955825024, "epoch": 1.8821936357481381, "percentage": 37.64, "elapsed_time": "0:36:28", "remaining_time": "1:00:25"}
{"current_steps": 2790, "total_steps": 7385, "loss": 0.7784, "learning_rate": 0.00015656983130056472, "epoch": 1.8889641164522681, "percentage": 37.78, "elapsed_time": "0:36:35", "remaining_time": "1:00:16"}
{"current_steps": 2800, "total_steps": 7385, "loss": 0.7455, "learning_rate": 0.00015617940297184775, "epoch": 1.8957345971563981, "percentage": 37.91, "elapsed_time": "0:36:43", "remaining_time": "1:00:08"}
{"current_steps": 2810, "total_steps": 7385, "loss": 0.7711, "learning_rate": 0.00015578771932043037, "epoch": 1.9025050778605281, "percentage": 38.05, "elapsed_time": "0:36:50", "remaining_time": "0:59:59"}
{"current_steps": 2820, "total_steps": 7385, "loss": 0.7485, "learning_rate": 0.00015539478909844156, "epoch": 1.9092755585646581, "percentage": 38.19, "elapsed_time": "0:36:57", "remaining_time": "0:59:50"}
{"current_steps": 2830, "total_steps": 7385, "loss": 0.7337, "learning_rate": 0.00015500062108586473, "epoch": 1.9160460392687881, "percentage": 38.32, "elapsed_time": "0:37:05", "remaining_time": "0:59:41"}
{"current_steps": 2840, "total_steps": 7385, "loss": 0.7547, "learning_rate": 0.0001546052240903416, "epoch": 1.9228165199729181, "percentage": 38.46, "elapsed_time": "0:37:13", "remaining_time": "0:59:33"}
{"current_steps": 2850, "total_steps": 7385, "loss": 0.7329, "learning_rate": 0.0001542086069469754, "epoch": 1.929587000677048, "percentage": 38.59, "elapsed_time": "0:37:21", "remaining_time": "0:59:27"}
{"current_steps": 2860, "total_steps": 7385, "loss": 0.6917, "learning_rate": 0.00015381077851813342, "epoch": 1.9363574813811781, "percentage": 38.73, "elapsed_time": "0:37:28", "remaining_time": "0:59:18"}
{"current_steps": 2870, "total_steps": 7385, "loss": 0.7293, "learning_rate": 0.000153411747693249, "epoch": 1.943127962085308, "percentage": 38.86, "elapsed_time": "0:37:36", "remaining_time": "0:59:10"}
{"current_steps": 2880, "total_steps": 7385, "loss": 0.7067, "learning_rate": 0.0001530115233886229, "epoch": 1.9498984427894381, "percentage": 39.0, "elapsed_time": "0:37:44", "remaining_time": "0:59:01"}
{"current_steps": 2890, "total_steps": 7385, "loss": 0.6613, "learning_rate": 0.00015261011454722402, "epoch": 1.956668923493568, "percentage": 39.13, "elapsed_time": "0:37:51", "remaining_time": "0:58:52"}
{"current_steps": 2900, "total_steps": 7385, "loss": 0.7931, "learning_rate": 0.00015220753013848965, "epoch": 1.9634394041976981, "percentage": 39.27, "elapsed_time": "0:37:58", "remaining_time": "0:58:44"}
{"current_steps": 2910, "total_steps": 7385, "loss": 0.6737, "learning_rate": 0.00015180377915812498, "epoch": 1.970209884901828, "percentage": 39.4, "elapsed_time": "0:38:06", "remaining_time": "0:58:36"}
{"current_steps": 2920, "total_steps": 7385, "loss": 0.7693, "learning_rate": 0.0001513988706279021, "epoch": 1.9769803656059581, "percentage": 39.54, "elapsed_time": "0:38:15", "remaining_time": "0:58:29"}
{"current_steps": 2930, "total_steps": 7385, "loss": 0.7222, "learning_rate": 0.00015099281359545844, "epoch": 1.983750846310088, "percentage": 39.68, "elapsed_time": "0:38:22", "remaining_time": "0:58:20"}
{"current_steps": 2940, "total_steps": 7385, "loss": 0.7813, "learning_rate": 0.00015058561713409465, "epoch": 1.9905213270142181, "percentage": 39.81, "elapsed_time": "0:38:29", "remaining_time": "0:58:10"}
{"current_steps": 2950, "total_steps": 7385, "loss": 0.7045, "learning_rate": 0.0001501772903425717, "epoch": 1.997291807718348, "percentage": 39.95, "elapsed_time": "0:38:36", "remaining_time": "0:58:03"}
{"current_steps": 2960, "total_steps": 7385, "loss": 0.6686, "learning_rate": 0.0001497678423449077, "epoch": 2.004062288422478, "percentage": 40.08, "elapsed_time": "0:38:45", "remaining_time": "0:57:55"}
{"current_steps": 2970, "total_steps": 7385, "loss": 0.5851, "learning_rate": 0.00014935728229017404, "epoch": 2.010832769126608, "percentage": 40.22, "elapsed_time": "0:38:53", "remaining_time": "0:57:49"}
{"current_steps": 2980, "total_steps": 7385, "loss": 0.5836, "learning_rate": 0.00014894561935229083, "epoch": 2.017603249830738, "percentage": 40.35, "elapsed_time": "0:39:02", "remaining_time": "0:57:42"}
{"current_steps": 2990, "total_steps": 7385, "loss": 0.5511, "learning_rate": 0.00014853286272982206, "epoch": 2.024373730534868, "percentage": 40.49, "elapsed_time": "0:39:10", "remaining_time": "0:57:34"}
{"current_steps": 3000, "total_steps": 7385, "loss": 0.5325, "learning_rate": 0.00014811902164576986, "epoch": 2.031144211238998, "percentage": 40.62, "elapsed_time": "0:39:17", "remaining_time": "0:57:26"}
{"current_steps": 3000, "total_steps": 7385, "eval_loss": 0.8718012571334839, "epoch": 2.031144211238998, "percentage": 40.62, "elapsed_time": "0:39:40", "remaining_time": "0:57:59"}
{"current_steps": 3010, "total_steps": 7385, "loss": 0.5722, "learning_rate": 0.0001477041053473687, "epoch": 2.037914691943128, "percentage": 40.76, "elapsed_time": "0:39:49", "remaining_time": "0:57:52"}
{"current_steps": 3020, "total_steps": 7385, "loss": 0.57, "learning_rate": 0.0001472881231058785, "epoch": 2.044685172647258, "percentage": 40.89, "elapsed_time": "0:39:56", "remaining_time": "0:57:44"}
{"current_steps": 3030, "total_steps": 7385, "loss": 0.5845, "learning_rate": 0.00014687108421637758, "epoch": 2.051455653351388, "percentage": 41.03, "elapsed_time": "0:40:04", "remaining_time": "0:57:35"}
{"current_steps": 3040, "total_steps": 7385, "loss": 0.533, "learning_rate": 0.0001464529979975549, "epoch": 2.058226134055518, "percentage": 41.16, "elapsed_time": "0:40:11", "remaining_time": "0:57:26"}
{"current_steps": 3050, "total_steps": 7385, "loss": 0.584, "learning_rate": 0.00014603387379150197, "epoch": 2.064996614759648, "percentage": 41.3, "elapsed_time": "0:40:19", "remaining_time": "0:57:18"}
{"current_steps": 3060, "total_steps": 7385, "loss": 0.5536, "learning_rate": 0.00014561372096350402, "epoch": 2.071767095463778, "percentage": 41.44, "elapsed_time": "0:40:27", "remaining_time": "0:57:10"}
{"current_steps": 3070, "total_steps": 7385, "loss": 0.5627, "learning_rate": 0.00014519254890183058, "epoch": 2.078537576167908, "percentage": 41.57, "elapsed_time": "0:40:34", "remaining_time": "0:57:01"}
{"current_steps": 3080, "total_steps": 7385, "loss": 0.5625, "learning_rate": 0.00014477036701752603, "epoch": 2.085308056872038, "percentage": 41.71, "elapsed_time": "0:40:42", "remaining_time": "0:56:53"}
{"current_steps": 3090, "total_steps": 7385, "loss": 0.6045, "learning_rate": 0.00014434718474419896, "epoch": 2.092078537576168, "percentage": 41.84, "elapsed_time": "0:40:49", "remaining_time": "0:56:45"}
{"current_steps": 3100, "total_steps": 7385, "loss": 0.5458, "learning_rate": 0.00014392301153781168, "epoch": 2.0988490182802977, "percentage": 41.98, "elapsed_time": "0:40:58", "remaining_time": "0:56:37"}
{"current_steps": 3110, "total_steps": 7385, "loss": 0.5798, "learning_rate": 0.00014349785687646879, "epoch": 2.105619498984428, "percentage": 42.11, "elapsed_time": "0:41:06", "remaining_time": "0:56:29"}
{"current_steps": 3120, "total_steps": 7385, "loss": 0.5566, "learning_rate": 0.00014307173026020524, "epoch": 2.1123899796885577, "percentage": 42.25, "elapsed_time": "0:41:14", "remaining_time": "0:56:22"}
{"current_steps": 3130, "total_steps": 7385, "loss": 0.5883, "learning_rate": 0.00014264464121077435, "epoch": 2.119160460392688, "percentage": 42.38, "elapsed_time": "0:41:22", "remaining_time": "0:56:14"}
{"current_steps": 3140, "total_steps": 7385, "loss": 0.5912, "learning_rate": 0.00014221659927143488, "epoch": 2.1259309410968177, "percentage": 42.52, "elapsed_time": "0:41:29", "remaining_time": "0:56:05"}
{"current_steps": 3150, "total_steps": 7385, "loss": 0.5421, "learning_rate": 0.00014178761400673778, "epoch": 2.132701421800948, "percentage": 42.65, "elapsed_time": "0:41:37", "remaining_time": "0:55:57"}
{"current_steps": 3160, "total_steps": 7385, "loss": 0.5477, "learning_rate": 0.00014135769500231259, "epoch": 2.1394719025050777, "percentage": 42.79, "elapsed_time": "0:41:45", "remaining_time": "0:55:49"}
{"current_steps": 3170, "total_steps": 7385, "loss": 0.5703, "learning_rate": 0.00014092685186465297, "epoch": 2.146242383209208, "percentage": 42.92, "elapsed_time": "0:41:52", "remaining_time": "0:55:40"}
{"current_steps": 3180, "total_steps": 7385, "loss": 0.6063, "learning_rate": 0.0001404950942209025, "epoch": 2.1530128639133377, "percentage": 43.06, "elapsed_time": "0:41:59", "remaining_time": "0:55:31"}
{"current_steps": 3190, "total_steps": 7385, "loss": 0.6101, "learning_rate": 0.00014006243171863907, "epoch": 2.159783344617468, "percentage": 43.2, "elapsed_time": "0:42:06", "remaining_time": "0:55:22"}
{"current_steps": 3200, "total_steps": 7385, "loss": 0.6067, "learning_rate": 0.00013962887402565967, "epoch": 2.1665538253215977, "percentage": 43.33, "elapsed_time": "0:42:14", "remaining_time": "0:55:14"}
{"current_steps": 3210, "total_steps": 7385, "loss": 0.5724, "learning_rate": 0.00013919443082976415, "epoch": 2.173324306025728, "percentage": 43.47, "elapsed_time": "0:42:21", "remaining_time": "0:55:06"}
{"current_steps": 3220, "total_steps": 7385, "loss": 0.5764, "learning_rate": 0.00013875911183853896, "epoch": 2.1800947867298577, "percentage": 43.6, "elapsed_time": "0:42:30", "remaining_time": "0:54:58"}
{"current_steps": 3230, "total_steps": 7385, "loss": 0.565, "learning_rate": 0.0001383229267791399, "epoch": 2.186865267433988, "percentage": 43.74, "elapsed_time": "0:42:38", "remaining_time": "0:54:51"}
{"current_steps": 3240, "total_steps": 7385, "loss": 0.525, "learning_rate": 0.00013788588539807517, "epoch": 2.1936357481381177, "percentage": 43.87, "elapsed_time": "0:42:46", "remaining_time": "0:54:43"}
{"current_steps": 3250, "total_steps": 7385, "loss": 0.6126, "learning_rate": 0.0001374479974609872, "epoch": 2.200406228842248, "percentage": 44.01, "elapsed_time": "0:42:53", "remaining_time": "0:54:34"}
{"current_steps": 3260, "total_steps": 7385, "loss": 0.5863, "learning_rate": 0.0001370092727524348, "epoch": 2.2071767095463777, "percentage": 44.14, "elapsed_time": "0:43:01", "remaining_time": "0:54:26"}
{"current_steps": 3270, "total_steps": 7385, "loss": 0.5568, "learning_rate": 0.00013656972107567423, "epoch": 2.213947190250508, "percentage": 44.28, "elapsed_time": "0:43:08", "remaining_time": "0:54:17"}
{"current_steps": 3280, "total_steps": 7385, "loss": 0.5777, "learning_rate": 0.0001361293522524403, "epoch": 2.2207176709546377, "percentage": 44.41, "elapsed_time": "0:43:15", "remaining_time": "0:54:08"}
{"current_steps": 3290, "total_steps": 7385, "loss": 0.549, "learning_rate": 0.0001356881761227269, "epoch": 2.227488151658768, "percentage": 44.55, "elapsed_time": "0:43:23", "remaining_time": "0:54:00"}
{"current_steps": 3300, "total_steps": 7385, "loss": 0.5828, "learning_rate": 0.00013524620254456705, "epoch": 2.2342586323628977, "percentage": 44.69, "elapsed_time": "0:43:31", "remaining_time": "0:53:52"}
{"current_steps": 3310, "total_steps": 7385, "loss": 0.5441, "learning_rate": 0.00013480344139381266, "epoch": 2.241029113067028, "percentage": 44.82, "elapsed_time": "0:43:38", "remaining_time": "0:53:43"}
{"current_steps": 3320, "total_steps": 7385, "loss": 0.6452, "learning_rate": 0.0001343599025639139, "epoch": 2.2477995937711577, "percentage": 44.96, "elapsed_time": "0:43:45", "remaining_time": "0:53:34"}
{"current_steps": 3330, "total_steps": 7385, "loss": 0.5803, "learning_rate": 0.00013391559596569815, "epoch": 2.254570074475288, "percentage": 45.09, "elapsed_time": "0:43:53", "remaining_time": "0:53:27"}
{"current_steps": 3340, "total_steps": 7385, "loss": 0.5768, "learning_rate": 0.0001334705315271483, "epoch": 2.2613405551794177, "percentage": 45.23, "elapsed_time": "0:44:02", "remaining_time": "0:53:20"}
{"current_steps": 3350, "total_steps": 7385, "loss": 0.5759, "learning_rate": 0.00013302471919318141, "epoch": 2.268111035883548, "percentage": 45.36, "elapsed_time": "0:44:10", "remaining_time": "0:53:12"}
{"current_steps": 3360, "total_steps": 7385, "loss": 0.5797, "learning_rate": 0.00013257816892542582, "epoch": 2.2748815165876777, "percentage": 45.5, "elapsed_time": "0:44:17", "remaining_time": "0:53:03"}
{"current_steps": 3370, "total_steps": 7385, "loss": 0.5747, "learning_rate": 0.0001321308907019992, "epoch": 2.281651997291808, "percentage": 45.63, "elapsed_time": "0:44:24", "remaining_time": "0:52:54"}
{"current_steps": 3380, "total_steps": 7385, "loss": 0.5114, "learning_rate": 0.0001316828945172852, "epoch": 2.2884224779959377, "percentage": 45.77, "elapsed_time": "0:44:32", "remaining_time": "0:52:46"}
{"current_steps": 3390, "total_steps": 7385, "loss": 0.5821, "learning_rate": 0.00013123419038171024, "epoch": 2.295192958700068, "percentage": 45.9, "elapsed_time": "0:44:39", "remaining_time": "0:52:37"}
{"current_steps": 3400, "total_steps": 7385, "loss": 0.6054, "learning_rate": 0.00013078478832151985, "epoch": 2.3019634394041977, "percentage": 46.04, "elapsed_time": "0:44:47", "remaining_time": "0:52:30"}
{"current_steps": 3410, "total_steps": 7385, "loss": 0.5621, "learning_rate": 0.00013033469837855457, "epoch": 2.3087339201083275, "percentage": 46.17, "elapsed_time": "0:44:55", "remaining_time": "0:52:21"}
{"current_steps": 3420, "total_steps": 7385, "loss": 0.5858, "learning_rate": 0.00012988393061002566, "epoch": 2.3155044008124577, "percentage": 46.31, "elapsed_time": "0:45:03", "remaining_time": "0:52:14"}
{"current_steps": 3430, "total_steps": 7385, "loss": 0.5961, "learning_rate": 0.0001294324950882903, "epoch": 2.322274881516588, "percentage": 46.45, "elapsed_time": "0:45:11", "remaining_time": "0:52:06"}
{"current_steps": 3440, "total_steps": 7385, "loss": 0.5667, "learning_rate": 0.00012898040190062647, "epoch": 2.3290453622207177, "percentage": 46.58, "elapsed_time": "0:45:18", "remaining_time": "0:51:57"}
{"current_steps": 3450, "total_steps": 7385, "loss": 0.5781, "learning_rate": 0.00012852766114900777, "epoch": 2.3358158429248475, "percentage": 46.72, "elapsed_time": "0:45:27", "remaining_time": "0:51:51"}
{"current_steps": 3460, "total_steps": 7385, "loss": 0.6048, "learning_rate": 0.00012807428294987744, "epoch": 2.3425863236289777, "percentage": 46.85, "elapsed_time": "0:45:34", "remaining_time": "0:51:41"}
{"current_steps": 3470, "total_steps": 7385, "loss": 0.5672, "learning_rate": 0.0001276202774339224, "epoch": 2.349356804333108, "percentage": 46.99, "elapsed_time": "0:45:41", "remaining_time": "0:51:33"}
{"current_steps": 3480, "total_steps": 7385, "loss": 0.5992, "learning_rate": 0.00012716565474584702, "epoch": 2.3561272850372377, "percentage": 47.12, "elapsed_time": "0:45:50", "remaining_time": "0:51:26"}
{"current_steps": 3490, "total_steps": 7385, "loss": 0.5853, "learning_rate": 0.00012671042504414619, "epoch": 2.3628977657413675, "percentage": 47.26, "elapsed_time": "0:45:57", "remaining_time": "0:51:17"}
{"current_steps": 3500, "total_steps": 7385, "loss": 0.5501, "learning_rate": 0.00012625459850087846, "epoch": 2.3696682464454977, "percentage": 47.39, "elapsed_time": "0:46:04", "remaining_time": "0:51:08"}
{"current_steps": 3510, "total_steps": 7385, "loss": 0.5684, "learning_rate": 0.00012579818530143884, "epoch": 2.3764387271496275, "percentage": 47.53, "elapsed_time": "0:46:11", "remaining_time": "0:51:00"}
{"current_steps": 3520, "total_steps": 7385, "loss": 0.578, "learning_rate": 0.000125341195644331, "epoch": 2.3832092078537577, "percentage": 47.66, "elapsed_time": "0:46:18", "remaining_time": "0:50:51"}
{"current_steps": 3530, "total_steps": 7385, "loss": 0.6235, "learning_rate": 0.0001248836397409396, "epoch": 2.3899796885578874, "percentage": 47.8, "elapsed_time": "0:46:26", "remaining_time": "0:50:43"}
{"current_steps": 3540, "total_steps": 7385, "loss": 0.5868, "learning_rate": 0.00012442552781530186, "epoch": 2.3967501692620177, "percentage": 47.94, "elapsed_time": "0:46:34", "remaining_time": "0:50:35"}
{"current_steps": 3550, "total_steps": 7385, "loss": 0.6091, "learning_rate": 0.00012396687010387942, "epoch": 2.4035206499661474, "percentage": 48.07, "elapsed_time": "0:46:41", "remaining_time": "0:50:26"}
{"current_steps": 3560, "total_steps": 7385, "loss": 0.5492, "learning_rate": 0.00012350767685532938, "epoch": 2.4102911306702777, "percentage": 48.21, "elapsed_time": "0:46:48", "remaining_time": "0:50:17"}
{"current_steps": 3570, "total_steps": 7385, "loss": 0.5809, "learning_rate": 0.00012304795833027534, "epoch": 2.4170616113744074, "percentage": 48.34, "elapsed_time": "0:46:56", "remaining_time": "0:50:09"}
{"current_steps": 3580, "total_steps": 7385, "loss": 0.5638, "learning_rate": 0.00012258772480107816, "epoch": 2.4238320920785377, "percentage": 48.48, "elapsed_time": "0:47:05", "remaining_time": "0:50:02"}
{"current_steps": 3590, "total_steps": 7385, "loss": 0.5644, "learning_rate": 0.00012212698655160637, "epoch": 2.4306025727826674, "percentage": 48.61, "elapsed_time": "0:47:12", "remaining_time": "0:49:54"}
{"current_steps": 3600, "total_steps": 7385, "loss": 0.5852, "learning_rate": 0.00012166575387700651, "epoch": 2.4373730534867977, "percentage": 48.75, "elapsed_time": "0:47:20", "remaining_time": "0:49:46"}
{"current_steps": 3610, "total_steps": 7385, "loss": 0.5753, "learning_rate": 0.00012120403708347298, "epoch": 2.4441435341909274, "percentage": 48.88, "elapsed_time": "0:47:29", "remaining_time": "0:49:39"}
{"current_steps": 3620, "total_steps": 7385, "loss": 0.5446, "learning_rate": 0.00012074184648801769, "epoch": 2.4509140148950577, "percentage": 49.02, "elapsed_time": "0:47:36", "remaining_time": "0:49:30"}
{"current_steps": 3630, "total_steps": 7385, "loss": 0.5771, "learning_rate": 0.00012027919241823964, "epoch": 2.4576844955991874, "percentage": 49.15, "elapsed_time": "0:47:45", "remaining_time": "0:49:23"}
{"current_steps": 3640, "total_steps": 7385, "loss": 0.5774, "learning_rate": 0.00011981608521209413, "epoch": 2.4644549763033177, "percentage": 49.29, "elapsed_time": "0:47:52", "remaining_time": "0:49:15"}
{"current_steps": 3650, "total_steps": 7385, "loss": 0.5718, "learning_rate": 0.00011935253521766174, "epoch": 2.4712254570074474, "percentage": 49.42, "elapsed_time": "0:48:00", "remaining_time": "0:49:07"}
{"current_steps": 3660, "total_steps": 7385, "loss": 0.6151, "learning_rate": 0.00011888855279291713, "epoch": 2.4779959377115777, "percentage": 49.56, "elapsed_time": "0:48:07", "remaining_time": "0:48:58"}
{"current_steps": 3670, "total_steps": 7385, "loss": 0.6025, "learning_rate": 0.00011842414830549748, "epoch": 2.4847664184157074, "percentage": 49.7, "elapsed_time": "0:48:15", "remaining_time": "0:48:50"}
{"current_steps": 3680, "total_steps": 7385, "loss": 0.6008, "learning_rate": 0.00011795933213247101, "epoch": 2.4915368991198377, "percentage": 49.83, "elapsed_time": "0:48:23", "remaining_time": "0:48:43"}
{"current_steps": 3690, "total_steps": 7385, "loss": 0.5598, "learning_rate": 0.000117494114660105, "epoch": 2.4983073798239674, "percentage": 49.97, "elapsed_time": "0:48:29", "remaining_time": "0:48:33"}
{"current_steps": 3700, "total_steps": 7385, "loss": 0.5636, "learning_rate": 0.00011702850628363365, "epoch": 2.5050778605280977, "percentage": 50.1, "elapsed_time": "0:48:37", "remaining_time": "0:48:25"}
{"current_steps": 3710, "total_steps": 7385, "loss": 0.5629, "learning_rate": 0.00011656251740702596, "epoch": 2.5118483412322274, "percentage": 50.24, "elapsed_time": "0:48:44", "remaining_time": "0:48:17"}
{"current_steps": 3720, "total_steps": 7385, "loss": 0.6066, "learning_rate": 0.00011609615844275305, "epoch": 2.518618821936357, "percentage": 50.37, "elapsed_time": "0:48:51", "remaining_time": "0:48:08"}
{"current_steps": 3730, "total_steps": 7385, "loss": 0.5491, "learning_rate": 0.00011562943981155575, "epoch": 2.5253893026404874, "percentage": 50.51, "elapsed_time": "0:48:59", "remaining_time": "0:47:59"}
{"current_steps": 3740, "total_steps": 7385, "loss": 0.6065, "learning_rate": 0.00011516237194221149, "epoch": 2.5321597833446177, "percentage": 50.64, "elapsed_time": "0:49:07", "remaining_time": "0:47:52"}
{"current_steps": 3750, "total_steps": 7385, "loss": 0.5705, "learning_rate": 0.0001146949652713015, "epoch": 2.5389302640487474, "percentage": 50.78, "elapsed_time": "0:49:13", "remaining_time": "0:47:43"}
{"current_steps": 3760, "total_steps": 7385, "loss": 0.5364, "learning_rate": 0.00011422723024297737, "epoch": 2.545700744752877, "percentage": 50.91, "elapsed_time": "0:49:21", "remaining_time": "0:47:35"}
{"current_steps": 3770, "total_steps": 7385, "loss": 0.6014, "learning_rate": 0.00011375917730872787, "epoch": 2.5524712254570074, "percentage": 51.05, "elapsed_time": "0:49:29", "remaining_time": "0:47:27"}
{"current_steps": 3780, "total_steps": 7385, "loss": 0.5477, "learning_rate": 0.00011329081692714534, "epoch": 2.5592417061611377, "percentage": 51.18, "elapsed_time": "0:49:35", "remaining_time": "0:47:18"}
{"current_steps": 3790, "total_steps": 7385, "loss": 0.6538, "learning_rate": 0.00011282215956369204, "epoch": 2.5660121868652674, "percentage": 51.32, "elapsed_time": "0:49:44", "remaining_time": "0:47:10"}
{"current_steps": 3800, "total_steps": 7385, "loss": 0.594, "learning_rate": 0.00011235321569046615, "epoch": 2.572782667569397, "percentage": 51.46, "elapsed_time": "0:49:52", "remaining_time": "0:47:02"}
{"current_steps": 3810, "total_steps": 7385, "loss": 0.5936, "learning_rate": 0.00011188399578596795, "epoch": 2.5795531482735274, "percentage": 51.59, "elapsed_time": "0:49:59", "remaining_time": "0:46:54"}
{"current_steps": 3820, "total_steps": 7385, "loss": 0.5633, "learning_rate": 0.00011141451033486564, "epoch": 2.5863236289776577, "percentage": 51.73, "elapsed_time": "0:50:07", "remaining_time": "0:46:46"}
{"current_steps": 3830, "total_steps": 7385, "loss": 0.553, "learning_rate": 0.00011094476982776096, "epoch": 2.5930941096817874, "percentage": 51.86, "elapsed_time": "0:50:15", "remaining_time": "0:46:39"}
{"current_steps": 3840, "total_steps": 7385, "loss": 0.5591, "learning_rate": 0.00011047478476095487, "epoch": 2.599864590385917, "percentage": 52.0, "elapsed_time": "0:50:23", "remaining_time": "0:46:31"}
{"current_steps": 3850, "total_steps": 7385, "loss": 0.5753, "learning_rate": 0.00011000456563621304, "epoch": 2.6066350710900474, "percentage": 52.13, "elapsed_time": "0:50:31", "remaining_time": "0:46:23"}
{"current_steps": 3860, "total_steps": 7385, "loss": 0.6055, "learning_rate": 0.00010953412296053105, "epoch": 2.6134055517941777, "percentage": 52.27, "elapsed_time": "0:50:39", "remaining_time": "0:46:16"}
{"current_steps": 3870, "total_steps": 7385, "loss": 0.6062, "learning_rate": 0.00010906346724589975, "epoch": 2.6201760324983074, "percentage": 52.4, "elapsed_time": "0:50:48", "remaining_time": "0:46:08"}
{"current_steps": 3880, "total_steps": 7385, "loss": 0.5867, "learning_rate": 0.00010859260900907038, "epoch": 2.626946513202437, "percentage": 52.54, "elapsed_time": "0:50:55", "remaining_time": "0:46:00"}
{"current_steps": 3890, "total_steps": 7385, "loss": 0.5953, "learning_rate": 0.00010812155877131945, "epoch": 2.6337169939065674, "percentage": 52.67, "elapsed_time": "0:51:04", "remaining_time": "0:45:53"}
{"current_steps": 3900, "total_steps": 7385, "loss": 0.5537, "learning_rate": 0.00010765032705821363, "epoch": 2.640487474610697, "percentage": 52.81, "elapsed_time": "0:51:11", "remaining_time": "0:45:44"}
{"current_steps": 3910, "total_steps": 7385, "loss": 0.572, "learning_rate": 0.0001071789243993748, "epoch": 2.6472579553148274, "percentage": 52.95, "elapsed_time": "0:51:19", "remaining_time": "0:45:36"}
{"current_steps": 3920, "total_steps": 7385, "loss": 0.5921, "learning_rate": 0.00010670736132824455, "epoch": 2.654028436018957, "percentage": 53.08, "elapsed_time": "0:51:26", "remaining_time": "0:45:28"}
{"current_steps": 3930, "total_steps": 7385, "loss": 0.5635, "learning_rate": 0.00010623564838184878, "epoch": 2.6607989167230874, "percentage": 53.22, "elapsed_time": "0:51:33", "remaining_time": "0:45:20"}
{"current_steps": 3940, "total_steps": 7385, "loss": 0.5886, "learning_rate": 0.00010576379610056249, "epoch": 2.667569397427217, "percentage": 53.35, "elapsed_time": "0:51:41", "remaining_time": "0:45:12"}
{"current_steps": 3950, "total_steps": 7385, "loss": 0.5831, "learning_rate": 0.0001052918150278739, "epoch": 2.6743398781313474, "percentage": 53.49, "elapsed_time": "0:51:48", "remaining_time": "0:45:03"}
{"current_steps": 3960, "total_steps": 7385, "loss": 0.5335, "learning_rate": 0.0001048197157101493, "epoch": 2.681110358835477, "percentage": 53.62, "elapsed_time": "0:51:55", "remaining_time": "0:44:54"}
{"current_steps": 3970, "total_steps": 7385, "loss": 0.5331, "learning_rate": 0.00010434750869639693, "epoch": 2.6878808395396074, "percentage": 53.76, "elapsed_time": "0:52:03", "remaining_time": "0:44:46"}
{"current_steps": 3980, "total_steps": 7385, "loss": 0.5931, "learning_rate": 0.00010387520453803166, "epoch": 2.694651320243737, "percentage": 53.89, "elapsed_time": "0:52:11", "remaining_time": "0:44:38"}
{"current_steps": 3990, "total_steps": 7385, "loss": 0.5472, "learning_rate": 0.00010340281378863892, "epoch": 2.7014218009478674, "percentage": 54.03, "elapsed_time": "0:52:17", "remaining_time": "0:44:29"}
{"current_steps": 4000, "total_steps": 7385, "loss": 0.5875, "learning_rate": 0.00010293034700373905, "epoch": 2.708192281651997, "percentage": 54.16, "elapsed_time": "0:52:25", "remaining_time": "0:44:21"}
{"current_steps": 4000, "total_steps": 7385, "eval_loss": 0.8555851578712463, "epoch": 2.708192281651997, "percentage": 54.16, "elapsed_time": "0:52:48", "remaining_time": "0:44:41"}
{"current_steps": 4010, "total_steps": 7385, "loss": 0.6028, "learning_rate": 0.0001024578147405514, "epoch": 2.7149627623561274, "percentage": 54.3, "elapsed_time": "0:52:56", "remaining_time": "0:44:33"}
{"current_steps": 4020, "total_steps": 7385, "loss": 0.5959, "learning_rate": 0.0001019852275577585, "epoch": 2.721733243060257, "percentage": 54.43, "elapsed_time": "0:53:03", "remaining_time": "0:44:25"}
{"current_steps": 4030, "total_steps": 7385, "loss": 0.6042, "learning_rate": 0.00010151259601526992, "epoch": 2.7285037237643874, "percentage": 54.57, "elapsed_time": "0:53:10", "remaining_time": "0:44:16"}
{"current_steps": 4040, "total_steps": 7385, "loss": 0.5943, "learning_rate": 0.00010103993067398649, "epoch": 2.735274204468517, "percentage": 54.71, "elapsed_time": "0:53:18", "remaining_time": "0:44:08"}
{"current_steps": 4050, "total_steps": 7385, "loss": 0.5853, "learning_rate": 0.00010056724209556431, "epoch": 2.7420446851726474, "percentage": 54.84, "elapsed_time": "0:53:27", "remaining_time": "0:44:00"}
{"current_steps": 4060, "total_steps": 7385, "loss": 0.5967, "learning_rate": 0.00010009454084217873, "epoch": 2.748815165876777, "percentage": 54.98, "elapsed_time": "0:53:34", "remaining_time": "0:43:52"}
{"current_steps": 4070, "total_steps": 7385, "loss": 0.5528, "learning_rate": 9.962183747628819e-05, "epoch": 2.755585646580907, "percentage": 55.11, "elapsed_time": "0:53:41", "remaining_time": "0:43:44"}
{"current_steps": 4080, "total_steps": 7385, "loss": 0.5641, "learning_rate": 9.914914256039847e-05, "epoch": 2.762356127285037, "percentage": 55.25, "elapsed_time": "0:53:49", "remaining_time": "0:43:36"}
{"current_steps": 4090, "total_steps": 7385, "loss": 0.5638, "learning_rate": 9.867646665682646e-05, "epoch": 2.7691266079891674, "percentage": 55.38, "elapsed_time": "0:53:57", "remaining_time": "0:43:28"}
{"current_steps": 4100, "total_steps": 7385, "loss": 0.5835, "learning_rate": 9.820382032746426e-05, "epoch": 2.775897088693297, "percentage": 55.52, "elapsed_time": "0:54:05", "remaining_time": "0:43:20"}
{"current_steps": 4110, "total_steps": 7385, "loss": 0.5809, "learning_rate": 9.773121413354311e-05, "epoch": 2.782667569397427, "percentage": 55.65, "elapsed_time": "0:54:13", "remaining_time": "0:43:12"}
{"current_steps": 4120, "total_steps": 7385, "loss": 0.5768, "learning_rate": 9.725865863539747e-05, "epoch": 2.789438050101557, "percentage": 55.79, "elapsed_time": "0:54:21", "remaining_time": "0:43:04"}
{"current_steps": 4130, "total_steps": 7385, "loss": 0.5758, "learning_rate": 9.678616439222899e-05, "epoch": 2.7962085308056874, "percentage": 55.92, "elapsed_time": "0:54:29", "remaining_time": "0:42:56"}
{"current_steps": 4140, "total_steps": 7385, "loss": 0.547, "learning_rate": 9.631374196187051e-05, "epoch": 2.802979011509817, "percentage": 56.06, "elapsed_time": "0:54:37", "remaining_time": "0:42:48"}
{"current_steps": 4150, "total_steps": 7385, "loss": 0.5315, "learning_rate": 9.584140190055035e-05, "epoch": 2.809749492213947, "percentage": 56.19, "elapsed_time": "0:54:45", "remaining_time": "0:42:40"}
{"current_steps": 4160, "total_steps": 7385, "loss": 0.5824, "learning_rate": 9.536915476265621e-05, "epoch": 2.816519972918077, "percentage": 56.33, "elapsed_time": "0:54:52", "remaining_time": "0:42:32"}
{"current_steps": 4170, "total_steps": 7385, "loss": 0.6094, "learning_rate": 9.489701110049944e-05, "epoch": 2.8232904536222074, "percentage": 56.47, "elapsed_time": "0:55:00", "remaining_time": "0:42:24"}
{"current_steps": 4180, "total_steps": 7385, "loss": 0.5914, "learning_rate": 9.442498146407927e-05, "epoch": 2.830060934326337, "percentage": 56.6, "elapsed_time": "0:55:08", "remaining_time": "0:42:16"}
{"current_steps": 4190, "total_steps": 7385, "loss": 0.5814, "learning_rate": 9.3953076400847e-05, "epoch": 2.836831415030467, "percentage": 56.74, "elapsed_time": "0:55:15", "remaining_time": "0:42:07"}
{"current_steps": 4200, "total_steps": 7385, "loss": 0.5663, "learning_rate": 9.348130645547042e-05, "epoch": 2.843601895734597, "percentage": 56.87, "elapsed_time": "0:55:23", "remaining_time": "0:42:00"}
{"current_steps": 4210, "total_steps": 7385, "loss": 0.5807, "learning_rate": 9.300968216959805e-05, "epoch": 2.850372376438727, "percentage": 57.01, "elapsed_time": "0:55:31", "remaining_time": "0:41:52"}
{"current_steps": 4220, "total_steps": 7385, "loss": 0.5868, "learning_rate": 9.253821408162366e-05, "epoch": 2.857142857142857, "percentage": 57.14, "elapsed_time": "0:55:38", "remaining_time": "0:41:43"}
{"current_steps": 4230, "total_steps": 7385, "loss": 0.5613, "learning_rate": 9.206691272645087e-05, "epoch": 2.863913337846987, "percentage": 57.28, "elapsed_time": "0:55:46", "remaining_time": "0:41:35"}
{"current_steps": 4240, "total_steps": 7385, "loss": 0.6245, "learning_rate": 9.159578863525762e-05, "epoch": 2.870683818551117, "percentage": 57.41, "elapsed_time": "0:55:54", "remaining_time": "0:41:27"}
{"current_steps": 4250, "total_steps": 7385, "loss": 0.547, "learning_rate": 9.11248523352609e-05, "epoch": 2.877454299255247, "percentage": 57.55, "elapsed_time": "0:56:01", "remaining_time": "0:41:19"}
{"current_steps": 4260, "total_steps": 7385, "loss": 0.5432, "learning_rate": 9.065411434948152e-05, "epoch": 2.884224779959377, "percentage": 57.68, "elapsed_time": "0:56:10", "remaining_time": "0:41:12"}
{"current_steps": 4270, "total_steps": 7385, "loss": 0.534, "learning_rate": 9.018358519650909e-05, "epoch": 2.890995260663507, "percentage": 57.82, "elapsed_time": "0:56:19", "remaining_time": "0:41:05"}
{"current_steps": 4280, "total_steps": 7385, "loss": 0.5651, "learning_rate": 8.97132753902667e-05, "epoch": 2.897765741367637, "percentage": 57.96, "elapsed_time": "0:56:26", "remaining_time": "0:40:56"}
{"current_steps": 4290, "total_steps": 7385, "loss": 0.5611, "learning_rate": 8.924319543977631e-05, "epoch": 2.904536222071767, "percentage": 58.09, "elapsed_time": "0:56:33", "remaining_time": "0:40:48"}
{"current_steps": 4300, "total_steps": 7385, "loss": 0.5584, "learning_rate": 8.877335584892369e-05, "epoch": 2.911306702775897, "percentage": 58.23, "elapsed_time": "0:56:41", "remaining_time": "0:40:40"}
{"current_steps": 4310, "total_steps": 7385, "loss": 0.5939, "learning_rate": 8.830376711622379e-05, "epoch": 2.918077183480027, "percentage": 58.36, "elapsed_time": "0:56:48", "remaining_time": "0:40:31"}
{"current_steps": 4320, "total_steps": 7385, "loss": 0.5912, "learning_rate": 8.783443973458625e-05, "epoch": 2.924847664184157, "percentage": 58.5, "elapsed_time": "0:56:56", "remaining_time": "0:40:24"}
{"current_steps": 4330, "total_steps": 7385, "loss": 0.6095, "learning_rate": 8.736538419108074e-05, "epoch": 2.931618144888287, "percentage": 58.63, "elapsed_time": "0:57:03", "remaining_time": "0:40:15"}
{"current_steps": 4340, "total_steps": 7385, "loss": 0.5618, "learning_rate": 8.689661096670285e-05, "epoch": 2.938388625592417, "percentage": 58.77, "elapsed_time": "0:57:11", "remaining_time": "0:40:07"}
{"current_steps": 4350, "total_steps": 7385, "loss": 0.5388, "learning_rate": 8.64281305361397e-05, "epoch": 2.945159106296547, "percentage": 58.9, "elapsed_time": "0:57:18", "remaining_time": "0:39:59"}
{"current_steps": 4360, "total_steps": 7385, "loss": 0.5891, "learning_rate": 8.595995336753597e-05, "epoch": 2.951929587000677, "percentage": 59.04, "elapsed_time": "0:57:26", "remaining_time": "0:39:51"}
{"current_steps": 4370, "total_steps": 7385, "loss": 0.5351, "learning_rate": 8.549208992226001e-05, "epoch": 2.958700067704807, "percentage": 59.17, "elapsed_time": "0:57:34", "remaining_time": "0:39:43"}
{"current_steps": 4380, "total_steps": 7385, "loss": 0.5939, "learning_rate": 8.502455065467006e-05, "epoch": 2.9654705484089368, "percentage": 59.31, "elapsed_time": "0:57:42", "remaining_time": "0:39:35"}
{"current_steps": 4390, "total_steps": 7385, "loss": 0.5488, "learning_rate": 8.45573460118806e-05, "epoch": 2.972241029113067, "percentage": 59.44, "elapsed_time": "0:57:49", "remaining_time": "0:39:27"}
{"current_steps": 4400, "total_steps": 7385, "loss": 0.6054, "learning_rate": 8.4090486433529e-05, "epoch": 2.979011509817197, "percentage": 59.58, "elapsed_time": "0:57:56", "remaining_time": "0:39:18"}
{"current_steps": 4410, "total_steps": 7385, "loss": 0.5542, "learning_rate": 8.362398235154213e-05, "epoch": 2.985781990521327, "percentage": 59.72, "elapsed_time": "0:58:04", "remaining_time": "0:39:10"}
{"current_steps": 4420, "total_steps": 7385, "loss": 0.5326, "learning_rate": 8.31578441899035e-05, "epoch": 2.9925524712254568, "percentage": 59.85, "elapsed_time": "0:58:12", "remaining_time": "0:39:02"}
{"current_steps": 4430, "total_steps": 7385, "loss": 0.5924, "learning_rate": 8.269208236442003e-05, "epoch": 2.999322951929587, "percentage": 59.99, "elapsed_time": "0:58:19", "remaining_time": "0:38:54"}
{"current_steps": 4440, "total_steps": 7385, "loss": 0.4272, "learning_rate": 8.222670728248941e-05, "epoch": 3.006093432633717, "percentage": 60.12, "elapsed_time": "0:58:27", "remaining_time": "0:38:46"}
{"current_steps": 4450, "total_steps": 7385, "loss": 0.4442, "learning_rate": 8.17617293428677e-05, "epoch": 3.012863913337847, "percentage": 60.26, "elapsed_time": "0:58:35", "remaining_time": "0:38:38"}
{"current_steps": 4460, "total_steps": 7385, "loss": 0.3873, "learning_rate": 8.129715893543681e-05, "epoch": 3.019634394041977, "percentage": 60.39, "elapsed_time": "0:58:41", "remaining_time": "0:38:29"}
{"current_steps": 4470, "total_steps": 7385, "loss": 0.3991, "learning_rate": 8.08330064409724e-05, "epoch": 3.026404874746107, "percentage": 60.53, "elapsed_time": "0:58:49", "remaining_time": "0:38:21"}
{"current_steps": 4480, "total_steps": 7385, "loss": 0.4557, "learning_rate": 8.036928223091187e-05, "epoch": 3.0331753554502368, "percentage": 60.66, "elapsed_time": "0:58:56", "remaining_time": "0:38:13"}
{"current_steps": 4490, "total_steps": 7385, "loss": 0.4077, "learning_rate": 7.990599666712268e-05, "epoch": 3.039945836154367, "percentage": 60.8, "elapsed_time": "0:59:04", "remaining_time": "0:38:05"}
{"current_steps": 4500, "total_steps": 7385, "loss": 0.3999, "learning_rate": 7.94431601016708e-05, "epoch": 3.0467163168584968, "percentage": 60.93, "elapsed_time": "0:59:12", "remaining_time": "0:37:57"}
{"current_steps": 4510, "total_steps": 7385, "loss": 0.3614, "learning_rate": 7.898078287658941e-05, "epoch": 3.053486797562627, "percentage": 61.07, "elapsed_time": "0:59:19", "remaining_time": "0:37:49"}
{"current_steps": 4520, "total_steps": 7385, "loss": 0.4038, "learning_rate": 7.85188753236477e-05, "epoch": 3.0602572782667568, "percentage": 61.21, "elapsed_time": "0:59:27", "remaining_time": "0:37:41"}
{"current_steps": 4530, "total_steps": 7385, "loss": 0.4229, "learning_rate": 7.805744776412012e-05, "epoch": 3.067027758970887, "percentage": 61.34, "elapsed_time": "0:59:35", "remaining_time": "0:37:33"}
{"current_steps": 4540, "total_steps": 7385, "loss": 0.3806, "learning_rate": 7.759651050855568e-05, "epoch": 3.0737982396750168, "percentage": 61.48, "elapsed_time": "0:59:42", "remaining_time": "0:37:25"}
{"current_steps": 4550, "total_steps": 7385, "loss": 0.3625, "learning_rate": 7.713607385654772e-05, "epoch": 3.080568720379147, "percentage": 61.61, "elapsed_time": "0:59:50", "remaining_time": "0:37:16"}
{"current_steps": 4560, "total_steps": 7385, "loss": 0.3889, "learning_rate": 7.667614809650351e-05, "epoch": 3.0873392010832768, "percentage": 61.75, "elapsed_time": "0:59:58", "remaining_time": "0:37:09"}
{"current_steps": 4570, "total_steps": 7385, "loss": 0.3775, "learning_rate": 7.621674350541461e-05, "epoch": 3.094109681787407, "percentage": 61.88, "elapsed_time": "1:00:06", "remaining_time": "0:37:01"}
{"current_steps": 4580, "total_steps": 7385, "loss": 0.4023, "learning_rate": 7.575787034862704e-05, "epoch": 3.1008801624915368, "percentage": 62.02, "elapsed_time": "1:00:14", "remaining_time": "0:36:53"}
{"current_steps": 4590, "total_steps": 7385, "loss": 0.3641, "learning_rate": 7.529953887961197e-05, "epoch": 3.107650643195667, "percentage": 62.15, "elapsed_time": "1:00:22", "remaining_time": "0:36:45"}
{"current_steps": 4600, "total_steps": 7385, "loss": 0.3818, "learning_rate": 7.484175933973668e-05, "epoch": 3.1144211238997968, "percentage": 62.29, "elapsed_time": "1:00:30", "remaining_time": "0:36:38"}
{"current_steps": 4610, "total_steps": 7385, "loss": 0.4187, "learning_rate": 7.438454195803559e-05, "epoch": 3.121191604603927, "percentage": 62.42, "elapsed_time": "1:00:38", "remaining_time": "0:36:30"}
{"current_steps": 4620, "total_steps": 7385, "loss": 0.3718, "learning_rate": 7.392789695098182e-05, "epoch": 3.1279620853080567, "percentage": 62.56, "elapsed_time": "1:00:45", "remaining_time": "0:36:21"}
{"current_steps": 4630, "total_steps": 7385, "loss": 0.3969, "learning_rate": 7.347183452225874e-05, "epoch": 3.134732566012187, "percentage": 62.69, "elapsed_time": "1:00:52", "remaining_time": "0:36:13"}
{"current_steps": 4640, "total_steps": 7385, "loss": 0.4193, "learning_rate": 7.301636486253215e-05, "epoch": 3.1415030467163167, "percentage": 62.83, "elapsed_time": "1:00:59", "remaining_time": "0:36:05"}
{"current_steps": 4650, "total_steps": 7385, "loss": 0.3923, "learning_rate": 7.256149814922253e-05, "epoch": 3.148273527420447, "percentage": 62.97, "elapsed_time": "1:01:07", "remaining_time": "0:35:56"}
{"current_steps": 4660, "total_steps": 7385, "loss": 0.3871, "learning_rate": 7.210724454627751e-05, "epoch": 3.1550440081245767, "percentage": 63.1, "elapsed_time": "1:01:14", "remaining_time": "0:35:48"}
{"current_steps": 4670, "total_steps": 7385, "loss": 0.4219, "learning_rate": 7.165361420394482e-05, "epoch": 3.161814488828707, "percentage": 63.24, "elapsed_time": "1:01:22", "remaining_time": "0:35:40"}
{"current_steps": 4680, "total_steps": 7385, "loss": 0.4219, "learning_rate": 7.120061725854554e-05, "epoch": 3.1685849695328367, "percentage": 63.37, "elapsed_time": "1:01:30", "remaining_time": "0:35:33"}
{"current_steps": 4690, "total_steps": 7385, "loss": 0.4002, "learning_rate": 7.074826383224761e-05, "epoch": 3.175355450236967, "percentage": 63.51, "elapsed_time": "1:01:38", "remaining_time": "0:35:25"}
{"current_steps": 4700, "total_steps": 7385, "loss": 0.3984, "learning_rate": 7.029656403283951e-05, "epoch": 3.1821259309410967, "percentage": 63.64, "elapsed_time": "1:01:45", "remaining_time": "0:35:17"}
{"current_steps": 4710, "total_steps": 7385, "loss": 0.4005, "learning_rate": 6.984552795350453e-05, "epoch": 3.188896411645227, "percentage": 63.78, "elapsed_time": "1:01:52", "remaining_time": "0:35:08"}
{"current_steps": 4720, "total_steps": 7385, "loss": 0.3999, "learning_rate": 6.939516567259523e-05, "epoch": 3.1956668923493567, "percentage": 63.91, "elapsed_time": "1:02:01", "remaining_time": "0:35:01"}
{"current_steps": 4730, "total_steps": 7385, "loss": 0.3844, "learning_rate": 6.894548725340822e-05, "epoch": 3.202437373053487, "percentage": 64.05, "elapsed_time": "1:02:10", "remaining_time": "0:34:53"}
{"current_steps": 4740, "total_steps": 7385, "loss": 0.4107, "learning_rate": 6.849650274395929e-05, "epoch": 3.2092078537576167, "percentage": 64.18, "elapsed_time": "1:02:18", "remaining_time": "0:34:45"}
{"current_steps": 4750, "total_steps": 7385, "loss": 0.3865, "learning_rate": 6.804822217675885e-05, "epoch": 3.215978334461747, "percentage": 64.32, "elapsed_time": "1:02:25", "remaining_time": "0:34:37"}
{"current_steps": 4760, "total_steps": 7385, "loss": 0.3635, "learning_rate": 6.760065556858786e-05, "epoch": 3.2227488151658767, "percentage": 64.45, "elapsed_time": "1:02:33", "remaining_time": "0:34:29"}
{"current_steps": 4770, "total_steps": 7385, "loss": 0.3754, "learning_rate": 6.715381292027385e-05, "epoch": 3.229519295870007, "percentage": 64.59, "elapsed_time": "1:02:41", "remaining_time": "0:34:21"}
{"current_steps": 4780, "total_steps": 7385, "loss": 0.4034, "learning_rate": 6.670770421646767e-05, "epoch": 3.2362897765741367, "percentage": 64.73, "elapsed_time": "1:02:48", "remaining_time": "0:34:13"}
{"current_steps": 4790, "total_steps": 7385, "loss": 0.3946, "learning_rate": 6.626233942542013e-05, "epoch": 3.243060257278267, "percentage": 64.86, "elapsed_time": "1:02:57", "remaining_time": "0:34:06"}
{"current_steps": 4800, "total_steps": 7385, "loss": 0.3638, "learning_rate": 6.581772849875951e-05, "epoch": 3.2498307379823967, "percentage": 65.0, "elapsed_time": "1:03:04", "remaining_time": "0:33:58"}
{"current_steps": 4810, "total_steps": 7385, "loss": 0.3607, "learning_rate": 6.537388137126899e-05, "epoch": 3.2566012186865265, "percentage": 65.13, "elapsed_time": "1:03:12", "remaining_time": "0:33:50"}
{"current_steps": 4820, "total_steps": 7385, "loss": 0.3797, "learning_rate": 6.493080796066477e-05, "epoch": 3.2633716993906567, "percentage": 65.27, "elapsed_time": "1:03:19", "remaining_time": "0:33:41"}
{"current_steps": 4830, "total_steps": 7385, "loss": 0.3552, "learning_rate": 6.448851816737443e-05, "epoch": 3.270142180094787, "percentage": 65.4, "elapsed_time": "1:03:27", "remaining_time": "0:33:34"}
{"current_steps": 4840, "total_steps": 7385, "loss": 0.3905, "learning_rate": 6.404702187431568e-05, "epoch": 3.2769126607989167, "percentage": 65.54, "elapsed_time": "1:03:35", "remaining_time": "0:33:26"}
{"current_steps": 4850, "total_steps": 7385, "loss": 0.3864, "learning_rate": 6.360632894667555e-05, "epoch": 3.2836831415030465, "percentage": 65.67, "elapsed_time": "1:03:42", "remaining_time": "0:33:18"}
{"current_steps": 4860, "total_steps": 7385, "loss": 0.3921, "learning_rate": 6.316644923169007e-05, "epoch": 3.2904536222071767, "percentage": 65.81, "elapsed_time": "1:03:49", "remaining_time": "0:33:09"}
{"current_steps": 4870, "total_steps": 7385, "loss": 0.4138, "learning_rate": 6.27273925584239e-05, "epoch": 3.2972241029113065, "percentage": 65.94, "elapsed_time": "1:03:57", "remaining_time": "0:33:01"}
{"current_steps": 4880, "total_steps": 7385, "loss": 0.3709, "learning_rate": 6.228916873755118e-05, "epoch": 3.3039945836154367, "percentage": 66.08, "elapsed_time": "1:04:06", "remaining_time": "0:32:54"}
{"current_steps": 4890, "total_steps": 7385, "loss": 0.3622, "learning_rate": 6.185178756113586e-05, "epoch": 3.3107650643195665, "percentage": 66.22, "elapsed_time": "1:04:13", "remaining_time": "0:32:46"}
{"current_steps": 4900, "total_steps": 7385, "loss": 0.3969, "learning_rate": 6.141525880241313e-05, "epoch": 3.3175355450236967, "percentage": 66.35, "elapsed_time": "1:04:20", "remaining_time": "0:32:37"}
{"current_steps": 4910, "total_steps": 7385, "loss": 0.394, "learning_rate": 6.097959221557108e-05, "epoch": 3.3243060257278265, "percentage": 66.49, "elapsed_time": "1:04:27", "remaining_time": "0:32:29"}
{"current_steps": 4920, "total_steps": 7385, "loss": 0.396, "learning_rate": 6.054479753553259e-05, "epoch": 3.3310765064319567, "percentage": 66.62, "elapsed_time": "1:04:35", "remaining_time": "0:32:21"}
{"current_steps": 4930, "total_steps": 7385, "loss": 0.415, "learning_rate": 6.0110884477737875e-05, "epoch": 3.3378469871360865, "percentage": 66.76, "elapsed_time": "1:04:42", "remaining_time": "0:32:13"}
{"current_steps": 4940, "total_steps": 7385, "loss": 0.399, "learning_rate": 5.9677862737927415e-05, "epoch": 3.3446174678402167, "percentage": 66.89, "elapsed_time": "1:04:50", "remaining_time": "0:32:05"}
{"current_steps": 4950, "total_steps": 7385, "loss": 0.3825, "learning_rate": 5.924574199192527e-05, "epoch": 3.3513879485443465, "percentage": 67.03, "elapsed_time": "1:04:57", "remaining_time": "0:31:57"}
{"current_steps": 4960, "total_steps": 7385, "loss": 0.3793, "learning_rate": 5.881453189542295e-05, "epoch": 3.3581584292484767, "percentage": 67.16, "elapsed_time": "1:05:05", "remaining_time": "0:31:49"}
{"current_steps": 4970, "total_steps": 7385, "loss": 0.3939, "learning_rate": 5.838424208376354e-05, "epoch": 3.3649289099526065, "percentage": 67.3, "elapsed_time": "1:05:12", "remaining_time": "0:31:41"}
{"current_steps": 4980, "total_steps": 7385, "loss": 0.4141, "learning_rate": 5.7954882171726444e-05, "epoch": 3.3716993906567367, "percentage": 67.43, "elapsed_time": "1:05:19", "remaining_time": "0:31:32"}
{"current_steps": 4990, "total_steps": 7385, "loss": 0.4112, "learning_rate": 5.752646175331267e-05, "epoch": 3.3784698713608665, "percentage": 67.57, "elapsed_time": "1:05:27", "remaining_time": "0:31:24"}
{"current_steps": 5000, "total_steps": 7385, "loss": 0.372, "learning_rate": 5.709899040153013e-05, "epoch": 3.3852403520649967, "percentage": 67.7, "elapsed_time": "1:05:35", "remaining_time": "0:31:17"}
{"current_steps": 5000, "total_steps": 7385, "eval_loss": 0.9812659621238708, "epoch": 3.3852403520649967, "percentage": 67.7, "elapsed_time": "1:05:58", "remaining_time": "0:31:28"}
{"current_steps": 5010, "total_steps": 7385, "loss": 0.385, "learning_rate": 5.667247766818018e-05, "epoch": 3.3920108327691265, "percentage": 67.84, "elapsed_time": "1:06:06", "remaining_time": "0:31:20"}
{"current_steps": 5020, "total_steps": 7385, "loss": 0.3759, "learning_rate": 5.6246933083643794e-05, "epoch": 3.3987813134732567, "percentage": 67.98, "elapsed_time": "1:06:14", "remaining_time": "0:31:12"}
{"current_steps": 5030, "total_steps": 7385, "loss": 0.3991, "learning_rate": 5.582236615666885e-05, "epoch": 3.4055517941773865, "percentage": 68.11, "elapsed_time": "1:06:22", "remaining_time": "0:31:04"}
{"current_steps": 5040, "total_steps": 7385, "loss": 0.3938, "learning_rate": 5.5398786374157564e-05, "epoch": 3.4123222748815167, "percentage": 68.25, "elapsed_time": "1:06:30", "remaining_time": "0:30:56"}
{"current_steps": 5050, "total_steps": 7385, "loss": 0.4, "learning_rate": 5.4976203200954425e-05, "epoch": 3.4190927555856465, "percentage": 68.38, "elapsed_time": "1:06:38", "remaining_time": "0:30:48"}
{"current_steps": 5060, "total_steps": 7385, "loss": 0.4117, "learning_rate": 5.4554626079634906e-05, "epoch": 3.4258632362897767, "percentage": 68.52, "elapsed_time": "1:06:45", "remaining_time": "0:30:40"}
{"current_steps": 5070, "total_steps": 7385, "loss": 0.409, "learning_rate": 5.413406443029433e-05, "epoch": 3.4326337169939065, "percentage": 68.65, "elapsed_time": "1:06:54", "remaining_time": "0:30:32"}
{"current_steps": 5080, "total_steps": 7385, "loss": 0.405, "learning_rate": 5.371452765033733e-05, "epoch": 3.4394041976980367, "percentage": 68.79, "elapsed_time": "1:07:02", "remaining_time": "0:30:25"}
{"current_steps": 5090, "total_steps": 7385, "loss": 0.3635, "learning_rate": 5.32960251142681e-05, "epoch": 3.4461746784021665, "percentage": 68.92, "elapsed_time": "1:07:09", "remaining_time": "0:30:17"}
{"current_steps": 5100, "total_steps": 7385, "loss": 0.4101, "learning_rate": 5.287856617348054e-05, "epoch": 3.4529451591062967, "percentage": 69.06, "elapsed_time": "1:07:17", "remaining_time": "0:30:09"}
{"current_steps": 5110, "total_steps": 7385, "loss": 0.3894, "learning_rate": 5.2462160156049765e-05, "epoch": 3.4597156398104265, "percentage": 69.19, "elapsed_time": "1:07:26", "remaining_time": "0:30:01"}
{"current_steps": 5120, "total_steps": 7385, "loss": 0.3909, "learning_rate": 5.2046816366523355e-05, "epoch": 3.4664861205145563, "percentage": 69.33, "elapsed_time": "1:07:33", "remaining_time": "0:29:53"}
{"current_steps": 5130, "total_steps": 7385, "loss": 0.367, "learning_rate": 5.1632544085713376e-05, "epoch": 3.4732566012186865, "percentage": 69.47, "elapsed_time": "1:07:40", "remaining_time": "0:29:45"}
{"current_steps": 5140, "total_steps": 7385, "loss": 0.4053, "learning_rate": 5.121935257048936e-05, "epoch": 3.4800270819228167, "percentage": 69.6, "elapsed_time": "1:07:49", "remaining_time": "0:29:37"}
{"current_steps": 5150, "total_steps": 7385, "loss": 0.3938, "learning_rate": 5.080725105357109e-05, "epoch": 3.4867975626269465, "percentage": 69.74, "elapsed_time": "1:07:56", "remaining_time": "0:29:29"}
{"current_steps": 5160, "total_steps": 7385, "loss": 0.3949, "learning_rate": 5.0396248743322526e-05, "epoch": 3.4935680433310763, "percentage": 69.87, "elapsed_time": "1:08:03", "remaining_time": "0:29:20"}
{"current_steps": 5170, "total_steps": 7385, "loss": 0.3593, "learning_rate": 4.998635482354598e-05, "epoch": 3.5003385240352065, "percentage": 70.01, "elapsed_time": "1:08:11", "remaining_time": "0:29:13"}
{"current_steps": 5180, "total_steps": 7385, "loss": 0.3835, "learning_rate": 4.9577578453276886e-05, "epoch": 3.5071090047393367, "percentage": 70.14, "elapsed_time": "1:08:19", "remaining_time": "0:29:05"}
{"current_steps": 5190, "total_steps": 7385, "loss": 0.4439, "learning_rate": 4.9169928766579164e-05, "epoch": 3.5138794854434665, "percentage": 70.28, "elapsed_time": "1:08:27", "remaining_time": "0:28:57"}
{"current_steps": 5200, "total_steps": 7385, "loss": 0.4055, "learning_rate": 4.876341487234105e-05, "epoch": 3.5206499661475963, "percentage": 70.41, "elapsed_time": "1:08:35", "remaining_time": "0:28:49"}
{"current_steps": 5210, "total_steps": 7385, "loss": 0.401, "learning_rate": 4.83580458540717e-05, "epoch": 3.5274204468517265, "percentage": 70.55, "elapsed_time": "1:08:43", "remaining_time": "0:28:41"}
{"current_steps": 5220, "total_steps": 7385, "loss": 0.3809, "learning_rate": 4.7953830769698125e-05, "epoch": 3.5341909275558567, "percentage": 70.68, "elapsed_time": "1:08:51", "remaining_time": "0:28:33"}
{"current_steps": 5230, "total_steps": 7385, "loss": 0.4251, "learning_rate": 4.755077865136274e-05, "epoch": 3.5409614082599865, "percentage": 70.82, "elapsed_time": "1:08:58", "remaining_time": "0:28:25"}
{"current_steps": 5240, "total_steps": 7385, "loss": 0.3812, "learning_rate": 4.7148898505221685e-05, "epoch": 3.5477318889641163, "percentage": 70.95, "elapsed_time": "1:09:06", "remaining_time": "0:28:17"}
{"current_steps": 5250, "total_steps": 7385, "loss": 0.3606, "learning_rate": 4.674819931124348e-05, "epoch": 3.5545023696682465, "percentage": 71.09, "elapsed_time": "1:09:15", "remaining_time": "0:28:09"}
{"current_steps": 5260, "total_steps": 7385, "loss": 0.4269, "learning_rate": 4.63486900230084e-05, "epoch": 3.5612728503723763, "percentage": 71.23, "elapsed_time": "1:09:24", "remaining_time": "0:28:02"}
{"current_steps": 5270, "total_steps": 7385, "loss": 0.4109, "learning_rate": 4.595037956750845e-05, "epoch": 3.5680433310765065, "percentage": 71.36, "elapsed_time": "1:09:31", "remaining_time": "0:27:54"}
{"current_steps": 5280, "total_steps": 7385, "loss": 0.4027, "learning_rate": 4.5553276844947726e-05, "epoch": 3.5748138117806363, "percentage": 71.5, "elapsed_time": "1:09:39", "remaining_time": "0:27:46"}
{"current_steps": 5290, "total_steps": 7385, "loss": 0.4377, "learning_rate": 4.515739072854376e-05, "epoch": 3.5815842924847665, "percentage": 71.63, "elapsed_time": "1:09:46", "remaining_time": "0:27:37"}
{"current_steps": 5300, "total_steps": 7385, "loss": 0.4058, "learning_rate": 4.4762730064329164e-05, "epoch": 3.5883547731888963, "percentage": 71.77, "elapsed_time": "1:09:54", "remaining_time": "0:27:29"}
{"current_steps": 5310, "total_steps": 7385, "loss": 0.3852, "learning_rate": 4.436930367095384e-05, "epoch": 3.5951252538930265, "percentage": 71.9, "elapsed_time": "1:10:02", "remaining_time": "0:27:22"}
{"current_steps": 5320, "total_steps": 7385, "loss": 0.4128, "learning_rate": 4.3977120339488174e-05, "epoch": 3.6018957345971563, "percentage": 72.04, "elapsed_time": "1:10:10", "remaining_time": "0:27:14"}
{"current_steps": 5330, "total_steps": 7385, "loss": 0.3848, "learning_rate": 4.358618883322639e-05, "epoch": 3.6086662153012865, "percentage": 72.17, "elapsed_time": "1:10:17", "remaining_time": "0:27:06"}
{"current_steps": 5340, "total_steps": 7385, "loss": 0.4186, "learning_rate": 4.319651788749084e-05, "epoch": 3.6154366960054163, "percentage": 72.31, "elapsed_time": "1:10:24", "remaining_time": "0:26:57"}
{"current_steps": 5350, "total_steps": 7385, "loss": 0.4213, "learning_rate": 4.280811620943682e-05, "epoch": 3.6222071767095465, "percentage": 72.44, "elapsed_time": "1:10:32", "remaining_time": "0:26:49"}
{"current_steps": 5360, "total_steps": 7385, "loss": 0.4063, "learning_rate": 4.2420992477857856e-05, "epoch": 3.6289776574136763, "percentage": 72.58, "elapsed_time": "1:10:39", "remaining_time": "0:26:41"}
{"current_steps": 5370, "total_steps": 7385, "loss": 0.3786, "learning_rate": 4.203515534299205e-05, "epoch": 3.6357481381178065, "percentage": 72.71, "elapsed_time": "1:10:47", "remaining_time": "0:26:33"}
{"current_steps": 5380, "total_steps": 7385, "loss": 0.406, "learning_rate": 4.16506134263285e-05, "epoch": 3.6425186188219363, "percentage": 72.85, "elapsed_time": "1:10:53", "remaining_time": "0:26:25"}
{"current_steps": 5390, "total_steps": 7385, "loss": 0.3845, "learning_rate": 4.12673753204149e-05, "epoch": 3.6492890995260665, "percentage": 72.99, "elapsed_time": "1:11:00", "remaining_time": "0:26:17"}
{"current_steps": 5400, "total_steps": 7385, "loss": 0.411, "learning_rate": 4.0885449588665395e-05, "epoch": 3.6560595802301963, "percentage": 73.12, "elapsed_time": "1:11:09", "remaining_time": "0:26:09"}
{"current_steps": 5410, "total_steps": 7385, "loss": 0.3926, "learning_rate": 4.050484476516926e-05, "epoch": 3.6628300609343265, "percentage": 73.26, "elapsed_time": "1:11:16", "remaining_time": "0:26:01"}
{"current_steps": 5420, "total_steps": 7385, "loss": 0.4232, "learning_rate": 4.012556935450027e-05, "epoch": 3.6696005416384563, "percentage": 73.39, "elapsed_time": "1:11:24", "remaining_time": "0:25:53"}
{"current_steps": 5430, "total_steps": 7385, "loss": 0.3882, "learning_rate": 3.97476318315265e-05, "epoch": 3.676371022342586, "percentage": 73.53, "elapsed_time": "1:11:32", "remaining_time": "0:25:45"}
{"current_steps": 5440, "total_steps": 7385, "loss": 0.3714, "learning_rate": 3.937104064122117e-05, "epoch": 3.6831415030467163, "percentage": 73.66, "elapsed_time": "1:11:40", "remaining_time": "0:25:37"}
{"current_steps": 5450, "total_steps": 7385, "loss": 0.3633, "learning_rate": 3.899580419847385e-05, "epoch": 3.6899119837508465, "percentage": 73.8, "elapsed_time": "1:11:47", "remaining_time": "0:25:29"}
{"current_steps": 5460, "total_steps": 7385, "loss": 0.3918, "learning_rate": 3.862193088790231e-05, "epoch": 3.6966824644549763, "percentage": 73.93, "elapsed_time": "1:11:55", "remaining_time": "0:25:21"}
{"current_steps": 5470, "total_steps": 7385, "loss": 0.4081, "learning_rate": 3.82494290636654e-05, "epoch": 3.703452945159106, "percentage": 74.07, "elapsed_time": "1:12:02", "remaining_time": "0:25:13"}
{"current_steps": 5480, "total_steps": 7385, "loss": 0.3772, "learning_rate": 3.7878307049276195e-05, "epoch": 3.7102234258632363, "percentage": 74.2, "elapsed_time": "1:12:11", "remaining_time": "0:25:05"}
{"current_steps": 5490, "total_steps": 7385, "loss": 0.3923, "learning_rate": 3.7508573137416095e-05, "epoch": 3.7169939065673665, "percentage": 74.34, "elapsed_time": "1:12:18", "remaining_time": "0:24:57"}
{"current_steps": 5500, "total_steps": 7385, "loss": 0.4204, "learning_rate": 3.71402355897495e-05, "epoch": 3.7237643872714963, "percentage": 74.48, "elapsed_time": "1:12:26", "remaining_time": "0:24:49"}
{"current_steps": 5510, "total_steps": 7385, "loss": 0.391, "learning_rate": 3.6773302636739116e-05, "epoch": 3.730534867975626, "percentage": 74.61, "elapsed_time": "1:12:34", "remaining_time": "0:24:41"}
{"current_steps": 5520, "total_steps": 7385, "loss": 0.3843, "learning_rate": 3.640778247746226e-05, "epoch": 3.7373053486797563, "percentage": 74.75, "elapsed_time": "1:12:41", "remaining_time": "0:24:33"}
{"current_steps": 5530, "total_steps": 7385, "loss": 0.3623, "learning_rate": 3.6043683279427484e-05, "epoch": 3.7440758293838865, "percentage": 74.88, "elapsed_time": "1:12:49", "remaining_time": "0:24:25"}
{"current_steps": 5540, "total_steps": 7385, "loss": 0.3923, "learning_rate": 3.568101317839205e-05, "epoch": 3.7508463100880163, "percentage": 75.02, "elapsed_time": "1:12:57", "remaining_time": "0:24:17"}
{"current_steps": 5550, "total_steps": 7385, "loss": 0.3918, "learning_rate": 3.531978027818027e-05, "epoch": 3.757616790792146, "percentage": 75.15, "elapsed_time": "1:13:05", "remaining_time": "0:24:09"}
{"current_steps": 5560, "total_steps": 7385, "loss": 0.4316, "learning_rate": 3.4959992650502346e-05, "epoch": 3.7643872714962763, "percentage": 75.29, "elapsed_time": "1:13:13", "remaining_time": "0:24:02"}
{"current_steps": 5570, "total_steps": 7385, "loss": 0.4183, "learning_rate": 3.4601658334774014e-05, "epoch": 3.7711577522004065, "percentage": 75.42, "elapsed_time": "1:13:22", "remaining_time": "0:23:54"}
{"current_steps": 5580, "total_steps": 7385, "loss": 0.4036, "learning_rate": 3.424478533793695e-05, "epoch": 3.7779282329045363, "percentage": 75.56, "elapsed_time": "1:13:29", "remaining_time": "0:23:46"}
{"current_steps": 5590, "total_steps": 7385, "loss": 0.3846, "learning_rate": 3.388938163427969e-05, "epoch": 3.784698713608666, "percentage": 75.69, "elapsed_time": "1:13:37", "remaining_time": "0:23:38"}
{"current_steps": 5600, "total_steps": 7385, "loss": 0.4339, "learning_rate": 3.3535455165259734e-05, "epoch": 3.7914691943127963, "percentage": 75.83, "elapsed_time": "1:13:45", "remaining_time": "0:23:30"}
{"current_steps": 5610, "total_steps": 7385, "loss": 0.4013, "learning_rate": 3.318301383932586e-05, "epoch": 3.798239675016926, "percentage": 75.96, "elapsed_time": "1:13:52", "remaining_time": "0:23:22"}
{"current_steps": 5620, "total_steps": 7385, "loss": 0.3765, "learning_rate": 3.283206553174144e-05, "epoch": 3.8050101557210563, "percentage": 76.1, "elapsed_time": "1:14:00", "remaining_time": "0:23:14"}
{"current_steps": 5630, "total_steps": 7385, "loss": 0.3846, "learning_rate": 3.248261808440858e-05, "epoch": 3.811780636425186, "percentage": 76.24, "elapsed_time": "1:14:08", "remaining_time": "0:23:06"}
{"current_steps": 5640, "total_steps": 7385, "loss": 0.3908, "learning_rate": 3.213467930569279e-05, "epoch": 3.8185511171293163, "percentage": 76.37, "elapsed_time": "1:14:15", "remaining_time": "0:22:58"}
{"current_steps": 5650, "total_steps": 7385, "loss": 0.4075, "learning_rate": 3.178825697024859e-05, "epoch": 3.825321597833446, "percentage": 76.51, "elapsed_time": "1:14:23", "remaining_time": "0:22:50"}
{"current_steps": 5660, "total_steps": 7385, "loss": 0.3949, "learning_rate": 3.14433588188457e-05, "epoch": 3.8320920785375763, "percentage": 76.64, "elapsed_time": "1:14:30", "remaining_time": "0:22:42"}
{"current_steps": 5670, "total_steps": 7385, "loss": 0.3708, "learning_rate": 3.109999255819607e-05, "epoch": 3.838862559241706, "percentage": 76.78, "elapsed_time": "1:14:39", "remaining_time": "0:22:34"}
{"current_steps": 5680, "total_steps": 7385, "loss": 0.3853, "learning_rate": 3.075816586078182e-05, "epoch": 3.8456330399458363, "percentage": 76.91, "elapsed_time": "1:14:46", "remaining_time": "0:22:26"}
{"current_steps": 5690, "total_steps": 7385, "loss": 0.3697, "learning_rate": 3.0417886364683578e-05, "epoch": 3.852403520649966, "percentage": 77.05, "elapsed_time": "1:14:54", "remaining_time": "0:22:18"}
{"current_steps": 5700, "total_steps": 7385, "loss": 0.3561, "learning_rate": 3.0079161673410006e-05, "epoch": 3.8591740013540963, "percentage": 77.18, "elapsed_time": "1:15:02", "remaining_time": "0:22:10"}
{"current_steps": 5710, "total_steps": 7385, "loss": 0.3759, "learning_rate": 2.974199935572781e-05, "epoch": 3.865944482058226, "percentage": 77.32, "elapsed_time": "1:15:08", "remaining_time": "0:22:02"}
{"current_steps": 5720, "total_steps": 7385, "loss": 0.3902, "learning_rate": 2.9406406945492616e-05, "epoch": 3.8727149627623563, "percentage": 77.45, "elapsed_time": "1:15:15", "remaining_time": "0:21:54"}
{"current_steps": 5730, "total_steps": 7385, "loss": 0.4045, "learning_rate": 2.907239194148066e-05, "epoch": 3.879485443466486, "percentage": 77.59, "elapsed_time": "1:15:24", "remaining_time": "0:21:46"}
{"current_steps": 5740, "total_steps": 7385, "loss": 0.4103, "learning_rate": 2.8739961807221127e-05, "epoch": 3.8862559241706163, "percentage": 77.73, "elapsed_time": "1:15:31", "remaining_time": "0:21:38"}
{"current_steps": 5750, "total_steps": 7385, "loss": 0.3718, "learning_rate": 2.840912397082954e-05, "epoch": 3.893026404874746, "percentage": 77.86, "elapsed_time": "1:15:39", "remaining_time": "0:21:30"}
{"current_steps": 5760, "total_steps": 7385, "loss": 0.3949, "learning_rate": 2.807988582484171e-05, "epoch": 3.8997968855788763, "percentage": 78.0, "elapsed_time": "1:15:47", "remaining_time": "0:21:22"}
{"current_steps": 5770, "total_steps": 7385, "loss": 0.3665, "learning_rate": 2.7752254726048422e-05, "epoch": 3.906567366283006, "percentage": 78.13, "elapsed_time": "1:15:54", "remaining_time": "0:21:14"}
{"current_steps": 5780, "total_steps": 7385, "loss": 0.3835, "learning_rate": 2.7426237995331296e-05, "epoch": 3.913337846987136, "percentage": 78.27, "elapsed_time": "1:16:01", "remaining_time": "0:21:06"}
{"current_steps": 5790, "total_steps": 7385, "loss": 0.4008, "learning_rate": 2.7101842917498997e-05, "epoch": 3.920108327691266, "percentage": 78.4, "elapsed_time": "1:16:09", "remaining_time": "0:20:58"}
{"current_steps": 5800, "total_steps": 7385, "loss": 0.4084, "learning_rate": 2.6779076741124576e-05, "epoch": 3.9268788083953963, "percentage": 78.54, "elapsed_time": "1:16:17", "remaining_time": "0:20:50"}
{"current_steps": 5810, "total_steps": 7385, "loss": 0.382, "learning_rate": 2.6457946678383448e-05, "epoch": 3.933649289099526, "percentage": 78.67, "elapsed_time": "1:16:24", "remaining_time": "0:20:42"}
{"current_steps": 5820, "total_steps": 7385, "loss": 0.3943, "learning_rate": 2.6138459904892177e-05, "epoch": 3.940419769803656, "percentage": 78.81, "elapsed_time": "1:16:31", "remaining_time": "0:20:34"}
{"current_steps": 5830, "total_steps": 7385, "loss": 0.3486, "learning_rate": 2.5820623559548285e-05, "epoch": 3.947190250507786, "percentage": 78.94, "elapsed_time": "1:16:39", "remaining_time": "0:20:26"}
{"current_steps": 5840, "total_steps": 7385, "loss": 0.3772, "learning_rate": 2.550444474437066e-05, "epoch": 3.9539607312119163, "percentage": 79.08, "elapsed_time": "1:16:47", "remaining_time": "0:20:18"}
{"current_steps": 5850, "total_steps": 7385, "loss": 0.3629, "learning_rate": 2.5189930524340767e-05, "epoch": 3.960731211916046, "percentage": 79.21, "elapsed_time": "1:16:54", "remaining_time": "0:20:10"}
{"current_steps": 5860, "total_steps": 7385, "loss": 0.4054, "learning_rate": 2.487708792724497e-05, "epoch": 3.967501692620176, "percentage": 79.35, "elapsed_time": "1:17:02", "remaining_time": "0:20:02"}
{"current_steps": 5870, "total_steps": 7385, "loss": 0.4003, "learning_rate": 2.4565923943517343e-05, "epoch": 3.974272173324306, "percentage": 79.49, "elapsed_time": "1:17:09", "remaining_time": "0:19:54"}
{"current_steps": 5880, "total_steps": 7385, "loss": 0.3977, "learning_rate": 2.425644552608356e-05, "epoch": 3.9810426540284363, "percentage": 79.62, "elapsed_time": "1:17:17", "remaining_time": "0:19:47"}
{"current_steps": 5890, "total_steps": 7385, "loss": 0.4088, "learning_rate": 2.3948659590205515e-05, "epoch": 3.987813134732566, "percentage": 79.76, "elapsed_time": "1:17:25", "remaining_time": "0:19:39"}
{"current_steps": 5900, "total_steps": 7385, "loss": 0.4008, "learning_rate": 2.3642573013326663e-05, "epoch": 3.994583615436696, "percentage": 79.89, "elapsed_time": "1:17:32", "remaining_time": "0:19:31"}
{"current_steps": 5910, "total_steps": 7385, "loss": 0.3427, "learning_rate": 2.3338192634918643e-05, "epoch": 4.001354096140826, "percentage": 80.03, "elapsed_time": "1:17:41", "remaining_time": "0:19:23"}
{"current_steps": 5920, "total_steps": 7385, "loss": 0.2699, "learning_rate": 2.3035525256328106e-05, "epoch": 4.008124576844956, "percentage": 80.16, "elapsed_time": "1:17:48", "remaining_time": "0:19:15"}
{"current_steps": 5930, "total_steps": 7385, "loss": 0.2694, "learning_rate": 2.2734577640625022e-05, "epoch": 4.014895057549086, "percentage": 80.3, "elapsed_time": "1:17:55", "remaining_time": "0:19:07"}
{"current_steps": 5940, "total_steps": 7385, "loss": 0.2822, "learning_rate": 2.2435356512451387e-05, "epoch": 4.021665538253216, "percentage": 80.43, "elapsed_time": "1:18:02", "remaining_time": "0:18:59"}
{"current_steps": 5950, "total_steps": 7385, "loss": 0.2965, "learning_rate": 2.2137868557871067e-05, "epoch": 4.028436018957346, "percentage": 80.57, "elapsed_time": "1:18:09", "remaining_time": "0:18:51"}
{"current_steps": 5960, "total_steps": 7385, "loss": 0.2551, "learning_rate": 2.1842120424220334e-05, "epoch": 4.035206499661476, "percentage": 80.7, "elapsed_time": "1:18:16", "remaining_time": "0:18:42"}
{"current_steps": 5970, "total_steps": 7385, "loss": 0.2903, "learning_rate": 2.1548118719959286e-05, "epoch": 4.041976980365606, "percentage": 80.84, "elapsed_time": "1:18:23", "remaining_time": "0:18:34"}
{"current_steps": 5980, "total_steps": 7385, "loss": 0.294, "learning_rate": 2.1255870014524327e-05, "epoch": 4.048747461069736, "percentage": 80.97, "elapsed_time": "1:18:31", "remaining_time": "0:18:26"}
{"current_steps": 5990, "total_steps": 7385, "loss": 0.2838, "learning_rate": 2.096538083818128e-05, "epoch": 4.055517941773866, "percentage": 81.11, "elapsed_time": "1:18:39", "remaining_time": "0:18:19"}
{"current_steps": 6000, "total_steps": 7385, "loss": 0.2649, "learning_rate": 2.067665768187941e-05, "epoch": 4.062288422477996, "percentage": 81.25, "elapsed_time": "1:18:48", "remaining_time": "0:18:11"}
{"current_steps": 6000, "total_steps": 7385, "eval_loss": 1.1342198848724365, "epoch": 4.062288422477996, "percentage": 81.25, "elapsed_time": "1:19:10", "remaining_time": "0:18:16"}
{"current_steps": 6010, "total_steps": 7385, "loss": 0.2606, "learning_rate": 2.0389706997106527e-05, "epoch": 4.069058903182126, "percentage": 81.38, "elapsed_time": "1:19:18", "remaining_time": "0:18:08"}
{"current_steps": 6020, "total_steps": 7385, "loss": 0.2848, "learning_rate": 2.0104535195744746e-05, "epoch": 4.075829383886256, "percentage": 81.52, "elapsed_time": "1:19:26", "remaining_time": "0:18:00"}
{"current_steps": 6030, "total_steps": 7385, "loss": 0.2724, "learning_rate": 1.9821148649927212e-05, "epoch": 4.082599864590386, "percentage": 81.65, "elapsed_time": "1:19:33", "remaining_time": "0:17:52"}
{"current_steps": 6040, "total_steps": 7385, "loss": 0.2745, "learning_rate": 1.953955369189574e-05, "epoch": 4.089370345294516, "percentage": 81.79, "elapsed_time": "1:19:41", "remaining_time": "0:17:44"}
{"current_steps": 6050, "total_steps": 7385, "loss": 0.2737, "learning_rate": 1.925975661385926e-05, "epoch": 4.096140825998646, "percentage": 81.92, "elapsed_time": "1:19:49", "remaining_time": "0:17:36"}
{"current_steps": 6060, "total_steps": 7385, "loss": 0.2606, "learning_rate": 1.8981763667853326e-05, "epoch": 4.102911306702776, "percentage": 82.06, "elapsed_time": "1:19:56", "remaining_time": "0:17:28"}
{"current_steps": 6070, "total_steps": 7385, "loss": 0.2621, "learning_rate": 1.870558106560035e-05, "epoch": 4.109681787406906, "percentage": 82.19, "elapsed_time": "1:20:03", "remaining_time": "0:17:20"}
{"current_steps": 6080, "total_steps": 7385, "loss": 0.2677, "learning_rate": 1.8431214978370758e-05, "epoch": 4.116452268111036, "percentage": 82.33, "elapsed_time": "1:20:11", "remaining_time": "0:17:12"}
{"current_steps": 6090, "total_steps": 7385, "loss": 0.2562, "learning_rate": 1.8158671536845186e-05, "epoch": 4.123222748815166, "percentage": 82.46, "elapsed_time": "1:20:19", "remaining_time": "0:17:04"}
{"current_steps": 6100, "total_steps": 7385, "loss": 0.2591, "learning_rate": 1.788795683097746e-05, "epoch": 4.129993229519296, "percentage": 82.6, "elapsed_time": "1:20:27", "remaining_time": "0:16:56"}
{"current_steps": 6110, "total_steps": 7385, "loss": 0.2823, "learning_rate": 1.761907690985847e-05, "epoch": 4.136763710223426, "percentage": 82.74, "elapsed_time": "1:20:34", "remaining_time": "0:16:48"}
{"current_steps": 6120, "total_steps": 7385, "loss": 0.2672, "learning_rate": 1.735203778158109e-05, "epoch": 4.143534190927556, "percentage": 82.87, "elapsed_time": "1:20:42", "remaining_time": "0:16:40"}
{"current_steps": 6130, "total_steps": 7385, "loss": 0.2607, "learning_rate": 1.7086845413105778e-05, "epoch": 4.150304671631686, "percentage": 83.01, "elapsed_time": "1:20:49", "remaining_time": "0:16:32"}
{"current_steps": 6140, "total_steps": 7385, "loss": 0.2653, "learning_rate": 1.6823505730127455e-05, "epoch": 4.157075152335816, "percentage": 83.14, "elapsed_time": "1:20:56", "remaining_time": "0:16:24"}
{"current_steps": 6150, "total_steps": 7385, "loss": 0.2787, "learning_rate": 1.656202461694293e-05, "epoch": 4.163845633039946, "percentage": 83.28, "elapsed_time": "1:21:04", "remaining_time": "0:16:16"}
{"current_steps": 6160, "total_steps": 7385, "loss": 0.2996, "learning_rate": 1.630240791631945e-05, "epoch": 4.170616113744076, "percentage": 83.41, "elapsed_time": "1:21:11", "remaining_time": "0:16:08"}
{"current_steps": 6170, "total_steps": 7385, "loss": 0.2617, "learning_rate": 1.6044661429364205e-05, "epoch": 4.177386594448206, "percentage": 83.55, "elapsed_time": "1:21:20", "remaining_time": "0:16:00"}
{"current_steps": 6180, "total_steps": 7385, "loss": 0.2627, "learning_rate": 1.5788790915394645e-05, "epoch": 4.184157075152336, "percentage": 83.68, "elapsed_time": "1:21:27", "remaining_time": "0:15:52"}
{"current_steps": 6190, "total_steps": 7385, "loss": 0.2734, "learning_rate": 1.5534802091809818e-05, "epoch": 4.190927555856466, "percentage": 83.82, "elapsed_time": "1:21:34", "remaining_time": "0:15:44"}
{"current_steps": 6200, "total_steps": 7385, "loss": 0.2765, "learning_rate": 1.528270063396262e-05, "epoch": 4.197698036560595, "percentage": 83.95, "elapsed_time": "1:21:41", "remaining_time": "0:15:36"}
{"current_steps": 6210, "total_steps": 7385, "loss": 0.2665, "learning_rate": 1.5032492175032876e-05, "epoch": 4.204468517264726, "percentage": 84.09, "elapsed_time": "1:21:49", "remaining_time": "0:15:28"}
{"current_steps": 6220, "total_steps": 7385, "loss": 0.2644, "learning_rate": 1.4784182305901672e-05, "epoch": 4.211238997968856, "percentage": 84.22, "elapsed_time": "1:21:57", "remaining_time": "0:15:20"}
{"current_steps": 6230, "total_steps": 7385, "loss": 0.2611, "learning_rate": 1.4537776575026207e-05, "epoch": 4.218009478672986, "percentage": 84.36, "elapsed_time": "1:22:03", "remaining_time": "0:15:12"}
{"current_steps": 6240, "total_steps": 7385, "loss": 0.2851, "learning_rate": 1.4293280488315986e-05, "epoch": 4.224779959377115, "percentage": 84.5, "elapsed_time": "1:22:12", "remaining_time": "0:15:05"}
{"current_steps": 6250, "total_steps": 7385, "loss": 0.2727, "learning_rate": 1.4050699509009679e-05, "epoch": 4.231550440081246, "percentage": 84.63, "elapsed_time": "1:22:19", "remaining_time": "0:14:57"}
{"current_steps": 6260, "total_steps": 7385, "loss": 0.2704, "learning_rate": 1.3810039057553138e-05, "epoch": 4.238320920785376, "percentage": 84.77, "elapsed_time": "1:22:26", "remaining_time": "0:14:48"}
{"current_steps": 6270, "total_steps": 7385, "loss": 0.2847, "learning_rate": 1.3571304511478188e-05, "epoch": 4.245091401489506, "percentage": 84.9, "elapsed_time": "1:22:34", "remaining_time": "0:14:41"}
{"current_steps": 6280, "total_steps": 7385, "loss": 0.2551, "learning_rate": 1.333450120528249e-05, "epoch": 4.251861882193635, "percentage": 85.04, "elapsed_time": "1:22:42", "remaining_time": "0:14:33"}
{"current_steps": 6290, "total_steps": 7385, "loss": 0.249, "learning_rate": 1.3099634430310403e-05, "epoch": 4.258632362897766, "percentage": 85.17, "elapsed_time": "1:22:50", "remaining_time": "0:14:25"}
{"current_steps": 6300, "total_steps": 7385, "loss": 0.2961, "learning_rate": 1.2866709434634684e-05, "epoch": 4.265402843601896, "percentage": 85.31, "elapsed_time": "1:22:58", "remaining_time": "0:14:17"}
{"current_steps": 6310, "total_steps": 7385, "loss": 0.2476, "learning_rate": 1.2635731422939212e-05, "epoch": 4.272173324306026, "percentage": 85.44, "elapsed_time": "1:23:06", "remaining_time": "0:14:09"}
{"current_steps": 6320, "total_steps": 7385, "loss": 0.275, "learning_rate": 1.2406705556402776e-05, "epoch": 4.278943805010155, "percentage": 85.58, "elapsed_time": "1:23:13", "remaining_time": "0:14:01"}
{"current_steps": 6330, "total_steps": 7385, "loss": 0.2605, "learning_rate": 1.217963695258364e-05, "epoch": 4.285714285714286, "percentage": 85.71, "elapsed_time": "1:23:21", "remaining_time": "0:13:53"}
{"current_steps": 6340, "total_steps": 7385, "loss": 0.2696, "learning_rate": 1.1954530685305287e-05, "epoch": 4.292484766418416, "percentage": 85.85, "elapsed_time": "1:23:29", "remaining_time": "0:13:45"}
{"current_steps": 6350, "total_steps": 7385, "loss": 0.2914, "learning_rate": 1.1731391784543e-05, "epoch": 4.299255247122546, "percentage": 85.99, "elapsed_time": "1:23:36", "remaining_time": "0:13:37"}
{"current_steps": 6360, "total_steps": 7385, "loss": 0.262, "learning_rate": 1.15102252363114e-05, "epoch": 4.306025727826675, "percentage": 86.12, "elapsed_time": "1:23:44", "remaining_time": "0:13:29"}
{"current_steps": 6370, "total_steps": 7385, "loss": 0.2702, "learning_rate": 1.1291035982553189e-05, "epoch": 4.312796208530806, "percentage": 86.26, "elapsed_time": "1:23:51", "remaining_time": "0:13:21"}
{"current_steps": 6380, "total_steps": 7385, "loss": 0.308, "learning_rate": 1.1073828921028606e-05, "epoch": 4.319566689234936, "percentage": 86.39, "elapsed_time": "1:23:59", "remaining_time": "0:13:13"}
{"current_steps": 6390, "total_steps": 7385, "loss": 0.2536, "learning_rate": 1.085860890520598e-05, "epoch": 4.326337169939066, "percentage": 86.53, "elapsed_time": "1:24:07", "remaining_time": "0:13:05"}
{"current_steps": 6400, "total_steps": 7385, "loss": 0.2713, "learning_rate": 1.0645380744153378e-05, "epoch": 4.333107650643195, "percentage": 86.66, "elapsed_time": "1:24:15", "remaining_time": "0:12:58"}
{"current_steps": 6410, "total_steps": 7385, "loss": 0.259, "learning_rate": 1.0434149202431054e-05, "epoch": 4.339878131347326, "percentage": 86.8, "elapsed_time": "1:24:23", "remaining_time": "0:12:50"}
{"current_steps": 6420, "total_steps": 7385, "loss": 0.2847, "learning_rate": 1.0224918999985044e-05, "epoch": 4.346648612051456, "percentage": 86.93, "elapsed_time": "1:24:30", "remaining_time": "0:12:42"}
{"current_steps": 6430, "total_steps": 7385, "loss": 0.2621, "learning_rate": 1.0017694812041656e-05, "epoch": 4.353419092755586, "percentage": 87.07, "elapsed_time": "1:24:38", "remaining_time": "0:12:34"}
{"current_steps": 6440, "total_steps": 7385, "loss": 0.2803, "learning_rate": 9.812481269002983e-06, "epoch": 4.360189573459715, "percentage": 87.2, "elapsed_time": "1:24:45", "remaining_time": "0:12:26"}
{"current_steps": 6450, "total_steps": 7385, "loss": 0.2962, "learning_rate": 9.609282956343557e-06, "epoch": 4.366960054163846, "percentage": 87.34, "elapsed_time": "1:24:52", "remaining_time": "0:12:18"}
{"current_steps": 6460, "total_steps": 7385, "loss": 0.2917, "learning_rate": 9.408104414507724e-06, "epoch": 4.373730534867976, "percentage": 87.47, "elapsed_time": "1:25:00", "remaining_time": "0:12:10"}
{"current_steps": 6470, "total_steps": 7385, "loss": 0.329, "learning_rate": 9.208950138808293e-06, "epoch": 4.380501015572106, "percentage": 87.61, "elapsed_time": "1:25:09", "remaining_time": "0:12:02"}
{"current_steps": 6480, "total_steps": 7385, "loss": 0.2768, "learning_rate": 9.011824579326144e-06, "epoch": 4.387271496276235, "percentage": 87.75, "elapsed_time": "1:25:15", "remaining_time": "0:11:54"}
{"current_steps": 6490, "total_steps": 7385, "loss": 0.2919, "learning_rate": 8.81673214081058e-06, "epoch": 4.394041976980366, "percentage": 87.88, "elapsed_time": "1:25:23", "remaining_time": "0:11:46"}
{"current_steps": 6500, "total_steps": 7385, "loss": 0.2719, "learning_rate": 8.623677182581135e-06, "epoch": 4.400812457684496, "percentage": 88.02, "elapsed_time": "1:25:30", "remaining_time": "0:11:38"}
{"current_steps": 6510, "total_steps": 7385, "loss": 0.2803, "learning_rate": 8.432664018430003e-06, "epoch": 4.407582938388625, "percentage": 88.15, "elapsed_time": "1:25:38", "remaining_time": "0:11:30"}
{"current_steps": 6520, "total_steps": 7385, "loss": 0.2508, "learning_rate": 8.243696916525745e-06, "epoch": 4.414353419092755, "percentage": 88.29, "elapsed_time": "1:25:46", "remaining_time": "0:11:22"}
{"current_steps": 6530, "total_steps": 7385, "loss": 0.2979, "learning_rate": 8.056780099317885e-06, "epoch": 4.421123899796886, "percentage": 88.42, "elapsed_time": "1:25:54", "remaining_time": "0:11:14"}
{"current_steps": 6540, "total_steps": 7385, "loss": 0.2901, "learning_rate": 7.871917743442513e-06, "epoch": 4.427894380501016, "percentage": 88.56, "elapsed_time": "1:26:02", "remaining_time": "0:11:07"}
{"current_steps": 6550, "total_steps": 7385, "loss": 0.2615, "learning_rate": 7.68911397962906e-06, "epoch": 4.434664861205146, "percentage": 88.69, "elapsed_time": "1:26:10", "remaining_time": "0:10:59"}
{"current_steps": 6560, "total_steps": 7385, "loss": 0.2608, "learning_rate": 7.5083728926079065e-06, "epoch": 4.441435341909275, "percentage": 88.83, "elapsed_time": "1:26:17", "remaining_time": "0:10:51"}
{"current_steps": 6570, "total_steps": 7385, "loss": 0.2904, "learning_rate": 7.329698521019157e-06, "epoch": 4.448205822613406, "percentage": 88.96, "elapsed_time": "1:26:26", "remaining_time": "0:10:43"}
{"current_steps": 6580, "total_steps": 7385, "loss": 0.2763, "learning_rate": 7.153094857322374e-06, "epoch": 4.454976303317536, "percentage": 89.1, "elapsed_time": "1:26:33", "remaining_time": "0:10:35"}
{"current_steps": 6590, "total_steps": 7385, "loss": 0.2644, "learning_rate": 6.978565847707352e-06, "epoch": 4.461746784021665, "percentage": 89.23, "elapsed_time": "1:26:41", "remaining_time": "0:10:27"}
{"current_steps": 6600, "total_steps": 7385, "loss": 0.2758, "learning_rate": 6.806115392006007e-06, "epoch": 4.468517264725795, "percentage": 89.37, "elapsed_time": "1:26:48", "remaining_time": "0:10:19"}
{"current_steps": 6610, "total_steps": 7385, "loss": 0.2952, "learning_rate": 6.635747343605181e-06, "epoch": 4.475287745429926, "percentage": 89.51, "elapsed_time": "1:26:56", "remaining_time": "0:10:11"}
{"current_steps": 6620, "total_steps": 7385, "loss": 0.272, "learning_rate": 6.4674655093605155e-06, "epoch": 4.482058226134056, "percentage": 89.64, "elapsed_time": "1:27:03", "remaining_time": "0:10:03"}
{"current_steps": 6630, "total_steps": 7385, "loss": 0.2638, "learning_rate": 6.301273649511464e-06, "epoch": 4.488828706838185, "percentage": 89.78, "elapsed_time": "1:27:11", "remaining_time": "0:09:55"}
{"current_steps": 6640, "total_steps": 7385, "loss": 0.271, "learning_rate": 6.137175477597213e-06, "epoch": 4.495599187542315, "percentage": 89.91, "elapsed_time": "1:27:19", "remaining_time": "0:09:47"}
{"current_steps": 6650, "total_steps": 7385, "loss": 0.2682, "learning_rate": 5.975174660373706e-06, "epoch": 4.502369668246446, "percentage": 90.05, "elapsed_time": "1:27:26", "remaining_time": "0:09:39"}
{"current_steps": 6660, "total_steps": 7385, "loss": 0.2926, "learning_rate": 5.815274817731753e-06, "epoch": 4.509140148950576, "percentage": 90.18, "elapsed_time": "1:27:34", "remaining_time": "0:09:32"}
{"current_steps": 6670, "total_steps": 7385, "loss": 0.2716, "learning_rate": 5.657479522616071e-06, "epoch": 4.515910629654705, "percentage": 90.32, "elapsed_time": "1:27:41", "remaining_time": "0:09:24"}
{"current_steps": 6680, "total_steps": 7385, "loss": 0.2812, "learning_rate": 5.501792300945507e-06, "epoch": 4.522681110358835, "percentage": 90.45, "elapsed_time": "1:27:49", "remaining_time": "0:09:16"}
{"current_steps": 6690, "total_steps": 7385, "loss": 0.2416, "learning_rate": 5.348216631534264e-06, "epoch": 4.529451591062966, "percentage": 90.59, "elapsed_time": "1:27:56", "remaining_time": "0:09:08"}
{"current_steps": 6700, "total_steps": 7385, "loss": 0.2571, "learning_rate": 5.196755946014065e-06, "epoch": 4.536222071767096, "percentage": 90.72, "elapsed_time": "1:28:04", "remaining_time": "0:09:00"}
{"current_steps": 6710, "total_steps": 7385, "loss": 0.2819, "learning_rate": 5.047413628757658e-06, "epoch": 4.542992552471225, "percentage": 90.86, "elapsed_time": "1:28:11", "remaining_time": "0:08:52"}
{"current_steps": 6720, "total_steps": 7385, "loss": 0.2881, "learning_rate": 4.900193016802956e-06, "epoch": 4.549763033175355, "percentage": 91.0, "elapsed_time": "1:28:20", "remaining_time": "0:08:44"}
{"current_steps": 6730, "total_steps": 7385, "loss": 0.2837, "learning_rate": 4.755097399778707e-06, "epoch": 4.556533513879486, "percentage": 91.13, "elapsed_time": "1:28:27", "remaining_time": "0:08:36"}
{"current_steps": 6740, "total_steps": 7385, "loss": 0.2648, "learning_rate": 4.612130019830774e-06, "epoch": 4.563303994583616, "percentage": 91.27, "elapsed_time": "1:28:35", "remaining_time": "0:08:28"}
{"current_steps": 6750, "total_steps": 7385, "loss": 0.2571, "learning_rate": 4.471294071549869e-06, "epoch": 4.570074475287745, "percentage": 91.4, "elapsed_time": "1:28:42", "remaining_time": "0:08:20"}
{"current_steps": 6760, "total_steps": 7385, "loss": 0.2567, "learning_rate": 4.332592701900085e-06, "epoch": 4.576844955991875, "percentage": 91.54, "elapsed_time": "1:28:49", "remaining_time": "0:08:12"}
{"current_steps": 6770, "total_steps": 7385, "loss": 0.2462, "learning_rate": 4.196029010148527e-06, "epoch": 4.583615436696006, "percentage": 91.67, "elapsed_time": "1:28:56", "remaining_time": "0:08:04"}
{"current_steps": 6780, "total_steps": 7385, "loss": 0.2695, "learning_rate": 4.0616060477961845e-06, "epoch": 4.590385917400136, "percentage": 91.81, "elapsed_time": "1:29:04", "remaining_time": "0:07:56"}
{"current_steps": 6790, "total_steps": 7385, "loss": 0.2816, "learning_rate": 3.929326818509638e-06, "epoch": 4.597156398104265, "percentage": 91.94, "elapsed_time": "1:29:12", "remaining_time": "0:07:49"}
{"current_steps": 6800, "total_steps": 7385, "loss": 0.3004, "learning_rate": 3.799194278054019e-06, "epoch": 4.603926878808395, "percentage": 92.08, "elapsed_time": "1:29:20", "remaining_time": "0:07:41"}
{"current_steps": 6810, "total_steps": 7385, "loss": 0.3155, "learning_rate": 3.6712113342269095e-06, "epoch": 4.610697359512526, "percentage": 92.21, "elapsed_time": "1:29:27", "remaining_time": "0:07:33"}
{"current_steps": 6820, "total_steps": 7385, "loss": 0.2598, "learning_rate": 3.5453808467933558e-06, "epoch": 4.617467840216655, "percentage": 92.35, "elapsed_time": "1:29:34", "remaining_time": "0:07:25"}
{"current_steps": 6830, "total_steps": 7385, "loss": 0.2893, "learning_rate": 3.421705627422067e-06, "epoch": 4.624238320920785, "percentage": 92.48, "elapsed_time": "1:29:42", "remaining_time": "0:07:17"}
{"current_steps": 6840, "total_steps": 7385, "loss": 0.2702, "learning_rate": 3.300188439622465e-06, "epoch": 4.631008801624915, "percentage": 92.62, "elapsed_time": "1:29:51", "remaining_time": "0:07:09"}
{"current_steps": 6850, "total_steps": 7385, "loss": 0.26, "learning_rate": 3.180831998682987e-06, "epoch": 4.637779282329046, "percentage": 92.76, "elapsed_time": "1:29:58", "remaining_time": "0:07:01"}
{"current_steps": 6860, "total_steps": 7385, "loss": 0.309, "learning_rate": 3.0636389716104607e-06, "epoch": 4.644549763033176, "percentage": 92.89, "elapsed_time": "1:30:06", "remaining_time": "0:06:53"}
{"current_steps": 6870, "total_steps": 7385, "loss": 0.2541, "learning_rate": 2.9486119770704144e-06, "epoch": 4.651320243737305, "percentage": 93.03, "elapsed_time": "1:30:14", "remaining_time": "0:06:45"}
{"current_steps": 6880, "total_steps": 7385, "loss": 0.3016, "learning_rate": 2.83575358532866e-06, "epoch": 4.658090724441435, "percentage": 93.16, "elapsed_time": "1:30:21", "remaining_time": "0:06:37"}
{"current_steps": 6890, "total_steps": 7385, "loss": 0.287, "learning_rate": 2.7250663181937808e-06, "epoch": 4.664861205145566, "percentage": 93.3, "elapsed_time": "1:30:29", "remaining_time": "0:06:30"}
{"current_steps": 6900, "total_steps": 7385, "loss": 0.2414, "learning_rate": 2.6165526489608016e-06, "epoch": 4.671631685849695, "percentage": 93.43, "elapsed_time": "1:30:37", "remaining_time": "0:06:22"}
{"current_steps": 6910, "total_steps": 7385, "loss": 0.2605, "learning_rate": 2.510215002355987e-06, "epoch": 4.678402166553825, "percentage": 93.57, "elapsed_time": "1:30:45", "remaining_time": "0:06:14"}
{"current_steps": 6920, "total_steps": 7385, "loss": 0.2536, "learning_rate": 2.4060557544825724e-06, "epoch": 4.685172647257955, "percentage": 93.7, "elapsed_time": "1:30:52", "remaining_time": "0:06:06"}
{"current_steps": 6930, "total_steps": 7385, "loss": 0.2773, "learning_rate": 2.3040772327676987e-06, "epoch": 4.691943127962086, "percentage": 93.84, "elapsed_time": "1:30:59", "remaining_time": "0:05:58"}
{"current_steps": 6940, "total_steps": 7385, "loss": 0.2801, "learning_rate": 2.2042817159104614e-06, "epoch": 4.698713608666216, "percentage": 93.97, "elapsed_time": "1:31:06", "remaining_time": "0:05:50"}
{"current_steps": 6950, "total_steps": 7385, "loss": 0.2343, "learning_rate": 2.106671433830909e-06, "epoch": 4.705484089370345, "percentage": 94.11, "elapsed_time": "1:31:14", "remaining_time": "0:05:42"}
{"current_steps": 6960, "total_steps": 7385, "loss": 0.2628, "learning_rate": 2.011248567620272e-06, "epoch": 4.712254570074475, "percentage": 94.25, "elapsed_time": "1:31:22", "remaining_time": "0:05:34"}
{"current_steps": 6970, "total_steps": 7385, "loss": 0.258, "learning_rate": 1.918015249492211e-06, "epoch": 4.719025050778606, "percentage": 94.38, "elapsed_time": "1:31:29", "remaining_time": "0:05:26"}
{"current_steps": 6980, "total_steps": 7385, "loss": 0.2807, "learning_rate": 1.8269735627351459e-06, "epoch": 4.725795531482735, "percentage": 94.52, "elapsed_time": "1:31:36", "remaining_time": "0:05:18"}
{"current_steps": 6990, "total_steps": 7385, "loss": 0.2476, "learning_rate": 1.7381255416657693e-06, "epoch": 4.732566012186865, "percentage": 94.65, "elapsed_time": "1:31:43", "remaining_time": "0:05:11"}
{"current_steps": 7000, "total_steps": 7385, "loss": 0.2722, "learning_rate": 1.6514731715835064e-06, "epoch": 4.739336492890995, "percentage": 94.79, "elapsed_time": "1:31:52", "remaining_time": "0:05:03"}
{"current_steps": 7000, "total_steps": 7385, "eval_loss": 1.1487771272659302, "epoch": 4.739336492890995, "percentage": 94.79, "elapsed_time": "1:32:15", "remaining_time": "0:05:04"}
{"current_steps": 7010, "total_steps": 7385, "loss": 0.253, "learning_rate": 1.5670183887262268e-06, "epoch": 4.746106973595126, "percentage": 94.92, "elapsed_time": "1:32:23", "remaining_time": "0:04:56"}
{"current_steps": 7020, "total_steps": 7385, "loss": 0.2886, "learning_rate": 1.4847630802269695e-06, "epoch": 4.752877454299255, "percentage": 95.06, "elapsed_time": "1:32:30", "remaining_time": "0:04:48"}
{"current_steps": 7030, "total_steps": 7385, "loss": 0.2645, "learning_rate": 1.4047090840716982e-06, "epoch": 4.759647935003385, "percentage": 95.19, "elapsed_time": "1:32:38", "remaining_time": "0:04:40"}
{"current_steps": 7040, "total_steps": 7385, "loss": 0.2834, "learning_rate": 1.3268581890583553e-06, "epoch": 4.766418415707515, "percentage": 95.33, "elapsed_time": "1:32:45", "remaining_time": "0:04:32"}
{"current_steps": 7050, "total_steps": 7385, "loss": 0.2967, "learning_rate": 1.251212134756763e-06, "epoch": 4.773188896411646, "percentage": 95.46, "elapsed_time": "1:32:53", "remaining_time": "0:04:24"}
{"current_steps": 7060, "total_steps": 7385, "loss": 0.2819, "learning_rate": 1.1777726114698628e-06, "epoch": 4.779959377115775, "percentage": 95.6, "elapsed_time": "1:33:00", "remaining_time": "0:04:16"}
{"current_steps": 7070, "total_steps": 7385, "loss": 0.2892, "learning_rate": 1.1065412601958813e-06, "epoch": 4.786729857819905, "percentage": 95.73, "elapsed_time": "1:33:08", "remaining_time": "0:04:08"}
{"current_steps": 7080, "total_steps": 7385, "loss": 0.2751, "learning_rate": 1.0375196725916693e-06, "epoch": 4.793500338524035, "percentage": 95.87, "elapsed_time": "1:33:15", "remaining_time": "0:04:01"}
{"current_steps": 7090, "total_steps": 7385, "loss": 0.277, "learning_rate": 9.707093909371745e-07, "epoch": 4.800270819228166, "percentage": 96.01, "elapsed_time": "1:33:23", "remaining_time": "0:03:53"}
{"current_steps": 7100, "total_steps": 7385, "loss": 0.2717, "learning_rate": 9.061119081009262e-07, "epoch": 4.807041299932295, "percentage": 96.14, "elapsed_time": "1:33:33", "remaining_time": "0:03:45"}
{"current_steps": 7110, "total_steps": 7385, "loss": 0.2589, "learning_rate": 8.437286675067046e-07, "epoch": 4.813811780636425, "percentage": 96.28, "elapsed_time": "1:33:40", "remaining_time": "0:03:37"}
{"current_steps": 7120, "total_steps": 7385, "loss": 0.2774, "learning_rate": 7.835610631013123e-07, "epoch": 4.820582261340555, "percentage": 96.41, "elapsed_time": "1:33:48", "remaining_time": "0:03:29"}
{"current_steps": 7130, "total_steps": 7385, "loss": 0.2826, "learning_rate": 7.256104393233654e-07, "epoch": 4.827352742044685, "percentage": 96.55, "elapsed_time": "1:33:56", "remaining_time": "0:03:21"}
{"current_steps": 7140, "total_steps": 7385, "loss": 0.287, "learning_rate": 6.698780910732949e-07, "epoch": 4.834123222748815, "percentage": 96.68, "elapsed_time": "1:34:04", "remaining_time": "0:03:13"}
{"current_steps": 7150, "total_steps": 7385, "loss": 0.2601, "learning_rate": 6.163652636844375e-07, "epoch": 4.840893703452945, "percentage": 96.82, "elapsed_time": "1:34:11", "remaining_time": "0:03:05"}
{"current_steps": 7160, "total_steps": 7385, "loss": 0.2671, "learning_rate": 5.650731528951237e-07, "epoch": 4.847664184157075, "percentage": 96.95, "elapsed_time": "1:34:19", "remaining_time": "0:02:57"}
{"current_steps": 7170, "total_steps": 7385, "loss": 0.2877, "learning_rate": 5.160029048220438e-07, "epoch": 4.854434664861206, "percentage": 97.09, "elapsed_time": "1:34:28", "remaining_time": "0:02:49"}
{"current_steps": 7180, "total_steps": 7385, "loss": 0.3145, "learning_rate": 4.691556159346133e-07, "epoch": 4.861205145565335, "percentage": 97.22, "elapsed_time": "1:34:35", "remaining_time": "0:02:42"}
{"current_steps": 7190, "total_steps": 7385, "loss": 0.2634, "learning_rate": 4.2453233303043627e-07, "epoch": 4.867975626269465, "percentage": 97.36, "elapsed_time": "1:34:43", "remaining_time": "0:02:34"}
{"current_steps": 7200, "total_steps": 7385, "loss": 0.257, "learning_rate": 3.8213405321195775e-07, "epoch": 4.874746106973595, "percentage": 97.49, "elapsed_time": "1:34:50", "remaining_time": "0:02:26"}
{"current_steps": 7210, "total_steps": 7385, "loss": 0.2942, "learning_rate": 3.4196172386417036e-07, "epoch": 4.881516587677725, "percentage": 97.63, "elapsed_time": "1:34:58", "remaining_time": "0:02:18"}
{"current_steps": 7220, "total_steps": 7385, "loss": 0.2984, "learning_rate": 3.0401624263344254e-07, "epoch": 4.888287068381855, "percentage": 97.77, "elapsed_time": "1:35:06", "remaining_time": "0:02:10"}
{"current_steps": 7230, "total_steps": 7385, "loss": 0.2775, "learning_rate": 2.682984574074565e-07, "epoch": 4.895057549085985, "percentage": 97.9, "elapsed_time": "1:35:13", "remaining_time": "0:02:02"}
{"current_steps": 7240, "total_steps": 7385, "loss": 0.2303, "learning_rate": 2.3480916629626816e-07, "epoch": 4.901828029790115, "percentage": 98.04, "elapsed_time": "1:35:22", "remaining_time": "0:01:54"}
{"current_steps": 7250, "total_steps": 7385, "loss": 0.2561, "learning_rate": 2.035491176144766e-07, "epoch": 4.908598510494246, "percentage": 98.17, "elapsed_time": "1:35:29", "remaining_time": "0:01:46"}
{"current_steps": 7260, "total_steps": 7385, "loss": 0.2478, "learning_rate": 1.7451900986450441e-07, "epoch": 4.915368991198375, "percentage": 98.31, "elapsed_time": "1:35:37", "remaining_time": "0:01:38"}
{"current_steps": 7270, "total_steps": 7385, "loss": 0.2644, "learning_rate": 1.4771949172097677e-07, "epoch": 4.922139471902505, "percentage": 98.44, "elapsed_time": "1:35:44", "remaining_time": "0:01:30"}
{"current_steps": 7280, "total_steps": 7385, "loss": 0.2687, "learning_rate": 1.2315116201623288e-07, "epoch": 4.928909952606635, "percentage": 98.58, "elapsed_time": "1:35:52", "remaining_time": "0:01:22"}
{"current_steps": 7290, "total_steps": 7385, "loss": 0.2782, "learning_rate": 1.0081456972694803e-07, "epoch": 4.935680433310765, "percentage": 98.71, "elapsed_time": "1:36:00", "remaining_time": "0:01:15"}
{"current_steps": 7300, "total_steps": 7385, "loss": 0.2503, "learning_rate": 8.07102139618765e-08, "epoch": 4.942450914014895, "percentage": 98.85, "elapsed_time": "1:36:08", "remaining_time": "0:01:07"}
{"current_steps": 7310, "total_steps": 7385, "loss": 0.2688, "learning_rate": 6.283854395067179e-08, "epoch": 4.949221394719025, "percentage": 98.98, "elapsed_time": "1:36:16", "remaining_time": "0:00:59"}
{"current_steps": 7320, "total_steps": 7385, "loss": 0.2713, "learning_rate": 4.719995903387231e-08, "epoch": 4.955991875423155, "percentage": 99.12, "elapsed_time": "1:36:24", "remaining_time": "0:00:51"}
{"current_steps": 7330, "total_steps": 7385, "loss": 0.2492, "learning_rate": 3.379480865397522e-08, "epoch": 4.962762356127285, "percentage": 99.26, "elapsed_time": "1:36:31", "remaining_time": "0:00:43"}
{"current_steps": 7340, "total_steps": 7385, "loss": 0.2528, "learning_rate": 2.2623392347620455e-08, "epoch": 4.969532836831415, "percentage": 99.39, "elapsed_time": "1:36:39", "remaining_time": "0:00:35"}
{"current_steps": 7350, "total_steps": 7385, "loss": 0.2797, "learning_rate": 1.3685959738907184e-08, "epoch": 4.976303317535545, "percentage": 99.53, "elapsed_time": "1:36:46", "remaining_time": "0:00:27"}
{"current_steps": 7360, "total_steps": 7385, "loss": 0.2527, "learning_rate": 6.982710533787185e-09, "epoch": 4.983073798239675, "percentage": 99.66, "elapsed_time": "1:36:54", "remaining_time": "0:00:19"}
{"current_steps": 7370, "total_steps": 7385, "loss": 0.3057, "learning_rate": 2.5137945156461507e-09, "epoch": 4.989844278943805, "percentage": 99.8, "elapsed_time": "1:37:02", "remaining_time": "0:00:11"}
{"current_steps": 7380, "total_steps": 7385, "loss": 0.2525, "learning_rate": 2.7931154193971964e-10, "epoch": 4.996614759647935, "percentage": 99.93, "elapsed_time": "1:37:09", "remaining_time": "0:00:03"}
{"current_steps": 7385, "total_steps": 7385, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "1:37:14", "remaining_time": "0:00:00"}